diff --git "a/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" "b/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" --- "a/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" +++ "b/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 1.288, "train/learning_rate": 9.405963302752294e-05, "train/epoch": 2.16, "train/global_step": 3500, "_runtime": 50225, "_timestamp": 1651822523, "_step": 3506, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 9.0, 37.0, 77.0, 194.0, 261.0, 226.0, 108.0, 64.0, 28.0, 6.0, 3.0], "bins": [-4.193824768066406, -4.121095180511475, -4.048366069793701, -3.9756367206573486, -3.902907371520996, -3.8301777839660645, -3.757448434829712, -3.6847190856933594, -3.611989736557007, -3.5392603874206543, -3.4665310382843018, -3.393801689147949, -3.3210721015930176, -3.248342752456665, -3.1756134033203125, -3.10288405418396, -3.0301547050476074, -2.957425355911255, -2.8846960067749023, -2.81196665763855, -2.7392373085021973, -2.6665077209472656, -2.593778371810913, -2.5210490226745605, -2.448319673538208, -2.3755903244018555, -2.302860975265503, -2.2301316261291504, -2.1574020385742188, -2.084672689437866, -2.0119433403015137, -1.9392139911651611, -1.8664848804473877, -1.7937555313110352, -1.7210261821746826, -1.6482967138290405, -1.575567364692688, -1.5028380155563354, -1.4301085472106934, -1.3573791980743408, -1.2846498489379883, -1.2119204998016357, -1.1391911506652832, -1.0664616823196411, -0.9937323331832886, -0.921002984046936, -0.8482735753059387, -0.7755441665649414, -0.7028148174285889, -0.6300854682922363, -0.557356059551239, -0.4846266806125641, -0.41189730167388916, -0.33916792273521423, -0.2664385437965393, -0.193709135055542, -0.12097975611686707, -0.04825037717819214, 0.024479001760482788, 0.09720838069915771, 0.16993775963783264, 0.24266713857650757, 0.3153965175151825, 0.3881259262561798, 0.46085527539253235]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 4.0, 10.0, 6.0, 6.0, 12.0, 12.0, 16.0, 18.0, 20.0, 26.0, 19.0, 27.0, 21.0, 26.0, 31.0, 36.0, 36.0, 34.0, 40.0, 40.0, 41.0, 43.0, 39.0, 34.0, 32.0, 35.0, 36.0, 34.0, 33.0, 25.0, 31.0, 14.0, 27.0, 18.0, 30.0, 12.0, 14.0, 10.0, 7.0, 8.0, 7.0, 8.0, 9.0, 2.0, 6.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.7703433036804199, -0.7468107342720032, -0.7232781648635864, -0.6997455358505249, -0.6762129664421082, -0.6526803970336914, -0.6291478276252747, -0.6056152582168579, -0.5820826292037964, -0.5585500597953796, -0.5350174903869629, -0.5114848613739014, -0.4879522919654846, -0.46441972255706787, -0.4408871531486511, -0.4173545837402344, -0.3938220143318176, -0.3702894449234009, -0.34675684571266174, -0.323224276304245, -0.29969167709350586, -0.2761591076850891, -0.25262653827667236, -0.22909395396709442, -0.20556136965751648, -0.18202878534793854, -0.1584962010383606, -0.13496363162994385, -0.1114310473203659, -0.08789846301078796, -0.06436589360237122, -0.040833309292793274, -0.017300784587860107, 0.006231795996427536, 0.02976437658071518, 0.053296953439712524, 0.07682953774929047, 0.10036212205886841, 0.12389469146728516, 0.1474272757768631, 0.17095986008644104, 0.19449244439601898, 0.21802502870559692, 0.24155759811401367, 0.2650901675224304, 0.28862276673316956, 0.3121553361415863, 0.33568793535232544, 0.3592205047607422, 0.38275307416915894, 0.40628567337989807, 0.4298182427883148, 0.45335084199905396, 0.4768834114074707, 0.5004159808158875, 0.5239485502243042, 0.5474811792373657, 0.5710137486457825, 0.5945463180541992, 0.6180789470672607, 0.6416115164756775, 0.6651440858840942, 0.688676655292511, 0.7122092247009277, 0.7357417941093445]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 2.0, 7.0, 7.0, 9.0, 10.0, 13.0, 21.0, 39.0, 40.0, 73.0, 102.0, 135.0, 211.0, 345.0, 525.0, 800.0, 1292.0, 2252.0, 3907.0, 7417.0, 14680.0, 33012.0, 87782.0, 268560.0, 1118390.0, 1971024.0, 459177.0, 134966.0, 48014.0, 20266.0, 9465.0, 4950.0, 2651.0, 1570.0, 934.0, 596.0, 354.0, 210.0, 171.0, 97.0, 55.0, 53.0, 30.0, 25.0, 12.0, 7.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.041015625, -1.0086822509765625, -0.976348876953125, -0.9440155029296875, -0.91168212890625, -0.8793487548828125, -0.847015380859375, -0.8146820068359375, -0.7823486328125, -0.7500152587890625, -0.717681884765625, -0.6853485107421875, -0.65301513671875, -0.6206817626953125, -0.588348388671875, -0.5560150146484375, -0.523681640625, -0.4913482666015625, -0.459014892578125, -0.4266815185546875, -0.39434814453125, -0.3620147705078125, -0.329681396484375, -0.2973480224609375, -0.2650146484375, -0.2326812744140625, -0.200347900390625, -0.1680145263671875, -0.13568115234375, -0.1033477783203125, -0.071014404296875, -0.0386810302734375, -0.00634765625, 0.0259857177734375, 0.058319091796875, 0.0906524658203125, 0.12298583984375, 0.1553192138671875, 0.187652587890625, 0.2199859619140625, 0.2523193359375, 0.2846527099609375, 0.316986083984375, 0.3493194580078125, 0.38165283203125, 0.4139862060546875, 0.446319580078125, 0.4786529541015625, 0.510986328125, 0.5433197021484375, 0.575653076171875, 0.6079864501953125, 0.64031982421875, 0.6726531982421875, 0.704986572265625, 0.7373199462890625, 0.7696533203125, 0.8019866943359375, 0.834320068359375, 0.8666534423828125, 0.89898681640625, 0.9313201904296875, 0.963653564453125, 0.9959869384765625, 1.0283203125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 5.0, 3.0, 5.0, 3.0, 7.0, 13.0, 16.0, 18.0, 18.0, 21.0, 19.0, 16.0, 24.0, 22.0, 27.0, 34.0, 37.0, 32.0, 35.0, 43.0, 43.0, 40.0, 40.0, 28.0, 32.0, 37.0, 46.0, 34.0, 34.0, 35.0, 27.0, 26.0, 18.0, 24.0, 27.0, 19.0, 15.0, 13.0, 11.0, 13.0, 3.0, 5.0, 6.0, 11.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0], "bins": [-1.0927734375, -1.0614395141601562, -1.0301055908203125, -0.9987716674804688, -0.967437744140625, -0.9361038208007812, -0.9047698974609375, -0.8734359741210938, -0.84210205078125, -0.8107681274414062, -0.7794342041015625, -0.7481002807617188, -0.716766357421875, -0.6854324340820312, -0.6540985107421875, -0.6227645874023438, -0.5914306640625, -0.5600967407226562, -0.5287628173828125, -0.49742889404296875, -0.466094970703125, -0.43476104736328125, -0.4034271240234375, -0.37209320068359375, -0.34075927734375, -0.30942535400390625, -0.2780914306640625, -0.24675750732421875, -0.215423583984375, -0.18408966064453125, -0.1527557373046875, -0.12142181396484375, -0.090087890625, -0.05875396728515625, -0.0274200439453125, 0.00391387939453125, 0.035247802734375, 0.06658172607421875, 0.0979156494140625, 0.12924957275390625, 0.16058349609375, 0.19191741943359375, 0.2232513427734375, 0.25458526611328125, 0.285919189453125, 0.31725311279296875, 0.3485870361328125, 0.37992095947265625, 0.4112548828125, 0.44258880615234375, 0.4739227294921875, 0.5052566528320312, 0.536590576171875, 0.5679244995117188, 0.5992584228515625, 0.6305923461914062, 0.66192626953125, 0.6932601928710938, 0.7245941162109375, 0.7559280395507812, 0.787261962890625, 0.8185958862304688, 0.8499298095703125, 0.8812637329101562, 0.91259765625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 9.0, 18.0, 15.0, 26.0, 45.0, 74.0, 119.0, 224.0, 804.0, 4077684.0, 114119.0, 671.0, 168.0, 88.0, 61.0, 47.0, 26.0, 27.0, 14.0, 17.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4765625, -14.8551025390625, -14.233642578125, -13.6121826171875, -12.99072265625, -12.3692626953125, -11.747802734375, -11.1263427734375, -10.5048828125, -9.8834228515625, -9.261962890625, -8.6405029296875, -8.01904296875, -7.3975830078125, -6.776123046875, -6.1546630859375, -5.533203125, -4.9117431640625, -4.290283203125, -3.6688232421875, -3.04736328125, -2.4259033203125, -1.804443359375, -1.1829833984375, -0.5615234375, 0.0599365234375, 0.681396484375, 1.3028564453125, 1.92431640625, 2.5457763671875, 3.167236328125, 3.7886962890625, 4.41015625, 5.0316162109375, 5.653076171875, 6.2745361328125, 6.89599609375, 7.5174560546875, 8.138916015625, 8.7603759765625, 9.3818359375, 10.0032958984375, 10.624755859375, 11.2462158203125, 11.86767578125, 12.4891357421875, 13.110595703125, 13.7320556640625, 14.353515625, 14.9749755859375, 15.596435546875, 16.2178955078125, 16.83935546875, 17.4608154296875, 18.082275390625, 18.7037353515625, 19.3251953125, 19.9466552734375, 20.568115234375, 21.1895751953125, 21.81103515625, 22.4324951171875, 23.053955078125, 23.6754150390625, 24.296875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 9.0, 5.0, 7.0, 17.0, 25.0, 29.0, 45.0, 73.0, 117.0, 211.0, 546.0, 1543.0, 806.0, 259.0, 126.0, 83.0, 55.0, 33.0, 34.0, 23.0, 12.0, 6.0, 10.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.63427734375, -0.61212158203125, -0.5899658203125, -0.56781005859375, -0.545654296875, -0.52349853515625, -0.5013427734375, -0.47918701171875, -0.45703125, -0.43487548828125, -0.4127197265625, -0.39056396484375, -0.368408203125, -0.34625244140625, -0.3240966796875, -0.30194091796875, -0.27978515625, -0.25762939453125, -0.2354736328125, -0.21331787109375, -0.191162109375, -0.16900634765625, -0.1468505859375, -0.12469482421875, -0.1025390625, -0.08038330078125, -0.0582275390625, -0.03607177734375, -0.013916015625, 0.00823974609375, 0.0303955078125, 0.05255126953125, 0.07470703125, 0.09686279296875, 0.1190185546875, 0.14117431640625, 0.163330078125, 0.18548583984375, 0.2076416015625, 0.22979736328125, 0.251953125, 0.27410888671875, 0.2962646484375, 0.31842041015625, 0.340576171875, 0.36273193359375, 0.3848876953125, 0.40704345703125, 0.42919921875, 0.45135498046875, 0.4735107421875, 0.49566650390625, 0.517822265625, 0.53997802734375, 0.5621337890625, 0.58428955078125, 0.6064453125, 0.62860107421875, 0.6507568359375, 0.67291259765625, 0.695068359375, 0.71722412109375, 0.7393798828125, 0.76153564453125, 0.78369140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 10.0, 13.0, 8.0, 33.0, 40.0, 49.0, 62.0, 84.0, 94.0, 108.0, 91.0, 87.0, 79.0, 57.0, 60.0, 41.0, 35.0, 19.0, 8.0, 8.0, 10.0, 3.0, 5.0, 4.0], "bins": [-3.4270503520965576, -3.358222484588623, -3.2893948554992676, -3.220566987991333, -3.1517391204833984, -3.082911491394043, -3.0140836238861084, -2.945255994796753, -2.8764281272888184, -2.807600259780884, -2.7387726306915283, -2.6699447631835938, -2.6011171340942383, -2.5322892665863037, -2.463461399078369, -2.3946337699890137, -2.325805902481079, -2.2569780349731445, -2.188150405883789, -2.1193225383758545, -2.05049467086792, -1.9816670417785645, -1.9128391742706299, -1.8440114259719849, -1.7751836776733398, -1.7063559293746948, -1.6375281810760498, -1.5687003135681152, -1.4998725652694702, -1.4310448169708252, -1.3622169494628906, -1.2933892011642456, -1.2245616912841797, -1.1557339429855347, -1.0869061946868896, -1.018078327178955, -0.9492505788803101, -0.880422830581665, -0.8115950226783752, -0.7427672147750854, -0.6739394664764404, -0.6051117181777954, -0.5362839102745056, -0.4674561321735382, -0.3986283540725708, -0.3298005759716034, -0.260972797870636, -0.19214501976966858, -0.12331724166870117, -0.054489463567733765, 0.014338314533233643, 0.08316609263420105, 0.15199387073516846, 0.22082164883613586, 0.28964942693710327, 0.3584772050380707, 0.4273049831390381, 0.4961327612400055, 0.5649605393409729, 0.6337883472442627, 0.7026160955429077, 0.7714438438415527, 0.8402716517448425, 0.9090994596481323, 0.9779272079467773]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 13.0, 8.0, 9.0, 13.0, 10.0, 14.0, 18.0, 21.0, 26.0, 33.0, 22.0, 20.0, 34.0, 30.0, 32.0, 27.0, 34.0, 37.0, 45.0, 38.0, 44.0, 43.0, 35.0, 30.0, 31.0, 29.0, 30.0, 27.0, 22.0, 35.0, 26.0, 29.0, 17.0, 12.0, 19.0, 8.0, 8.0, 11.0, 15.0, 11.0, 11.0, 3.0, 3.0, 0.0, 2.0, 6.0, 1.0, 1.0, 2.0], "bins": [-1.1258944272994995, -1.0940678119659424, -1.0622411966323853, -1.0304145812988281, -0.998587965965271, -0.9667613506317139, -0.934934675693512, -0.9031080603599548, -0.8712814450263977, -0.8394548296928406, -0.8076282143592834, -0.7758015990257263, -0.7439749240875244, -0.7121483087539673, -0.6803216934204102, -0.648495078086853, -0.6166684627532959, -0.5848418474197388, -0.5530152320861816, -0.5211886167526245, -0.489361971616745, -0.45753535628318787, -0.42570871114730835, -0.3938820958137512, -0.3620554804801941, -0.33022886514663696, -0.29840224981307983, -0.2665756046772003, -0.2347489893436432, -0.20292237401008606, -0.17109574377536774, -0.13926911354064941, -0.10744249820709229, -0.07561587542295456, -0.043789252638816833, -0.011962629854679108, 0.019863992929458618, 0.05169060826301575, 0.08351723849773407, 0.11534386873245239, 0.14717048406600952, 0.17899709939956665, 0.21082372963428497, 0.2426503598690033, 0.2744769752025604, 0.30630359053611755, 0.33813023567199707, 0.3699568510055542, 0.40178346633911133, 0.43361008167266846, 0.4654366970062256, 0.4972633421421051, 0.5290899276733398, 0.560916543006897, 0.5927432179450989, 0.624569833278656, 0.6563964486122131, 0.6882230639457703, 0.7200496792793274, 0.7518762946128845, 0.7837029695510864, 0.8155295848846436, 0.8473562002182007, 0.8791828155517578, 0.9110094308853149]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 10.0, 9.0, 22.0, 26.0, 41.0, 70.0, 102.0, 179.0, 261.0, 421.0, 611.0, 1038.0, 1810.0, 2790.0, 4619.0, 7722.0, 13357.0, 23442.0, 41633.0, 76159.0, 136183.0, 206498.0, 209763.0, 140955.0, 78961.0, 43352.0, 24095.0, 13887.0, 8028.0, 4750.0, 2955.0, 1780.0, 1141.0, 735.0, 426.0, 249.0, 178.0, 121.0, 65.0, 37.0, 32.0, 16.0, 15.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33447265625, -0.3229522705078125, -0.311431884765625, -0.2999114990234375, -0.28839111328125, -0.2768707275390625, -0.265350341796875, -0.2538299560546875, -0.2423095703125, -0.2307891845703125, -0.219268798828125, -0.2077484130859375, -0.19622802734375, -0.1847076416015625, -0.173187255859375, -0.1616668701171875, -0.150146484375, -0.1386260986328125, -0.127105712890625, -0.1155853271484375, -0.10406494140625, -0.0925445556640625, -0.081024169921875, -0.0695037841796875, -0.0579833984375, -0.0464630126953125, -0.034942626953125, -0.0234222412109375, -0.01190185546875, -0.0003814697265625, 0.011138916015625, 0.0226593017578125, 0.0341796875, 0.0457000732421875, 0.057220458984375, 0.0687408447265625, 0.08026123046875, 0.0917816162109375, 0.103302001953125, 0.1148223876953125, 0.1263427734375, 0.1378631591796875, 0.149383544921875, 0.1609039306640625, 0.17242431640625, 0.1839447021484375, 0.195465087890625, 0.2069854736328125, 0.218505859375, 0.2300262451171875, 0.241546630859375, 0.2530670166015625, 0.26458740234375, 0.2761077880859375, 0.287628173828125, 0.2991485595703125, 0.3106689453125, 0.3221893310546875, 0.333709716796875, 0.3452301025390625, 0.35675048828125, 0.3682708740234375, 0.379791259765625, 0.3913116455078125, 0.40283203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 4.0, 8.0, 10.0, 10.0, 13.0, 20.0, 14.0, 27.0, 20.0, 32.0, 25.0, 25.0, 34.0, 26.0, 33.0, 26.0, 37.0, 46.0, 29.0, 42.0, 53.0, 33.0, 40.0, 44.0, 37.0, 31.0, 27.0, 24.0, 25.0, 21.0, 19.0, 25.0, 17.0, 11.0, 20.0, 14.0, 13.0, 7.0, 15.0, 4.0, 6.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 3.0, 4.0], "bins": [-0.79345703125, -0.7706298828125, -0.747802734375, -0.7249755859375, -0.7021484375, -0.6793212890625, -0.656494140625, -0.6336669921875, -0.61083984375, -0.5880126953125, -0.565185546875, -0.5423583984375, -0.51953125, -0.4967041015625, -0.473876953125, -0.4510498046875, -0.42822265625, -0.4053955078125, -0.382568359375, -0.3597412109375, -0.3369140625, -0.3140869140625, -0.291259765625, -0.2684326171875, -0.24560546875, -0.2227783203125, -0.199951171875, -0.1771240234375, -0.154296875, -0.1314697265625, -0.108642578125, -0.0858154296875, -0.06298828125, -0.0401611328125, -0.017333984375, 0.0054931640625, 0.0283203125, 0.0511474609375, 0.073974609375, 0.0968017578125, 0.11962890625, 0.1424560546875, 0.165283203125, 0.1881103515625, 0.2109375, 0.2337646484375, 0.256591796875, 0.2794189453125, 0.30224609375, 0.3250732421875, 0.347900390625, 0.3707275390625, 0.3935546875, 0.4163818359375, 0.439208984375, 0.4620361328125, 0.48486328125, 0.5076904296875, 0.530517578125, 0.5533447265625, 0.576171875, 0.5989990234375, 0.621826171875, 0.6446533203125, 0.66748046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 9.0, 5.0, 14.0, 17.0, 19.0, 35.0, 29.0, 56.0, 66.0, 88.0, 137.0, 209.0, 323.0, 568.0, 1046.0, 2199.0, 4980.0, 13798.0, 45708.0, 192412.0, 500398.0, 211482.0, 49904.0, 14667.0, 5463.0, 2297.0, 1055.0, 529.0, 343.0, 195.0, 127.0, 99.0, 64.0, 45.0, 43.0, 18.0, 21.0, 18.0, 15.0, 12.0, 14.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6259765625, -0.6067352294921875, -0.587493896484375, -0.5682525634765625, -0.54901123046875, -0.5297698974609375, -0.510528564453125, -0.4912872314453125, -0.4720458984375, -0.4528045654296875, -0.433563232421875, -0.4143218994140625, -0.39508056640625, -0.3758392333984375, -0.356597900390625, -0.3373565673828125, -0.318115234375, -0.2988739013671875, -0.279632568359375, -0.2603912353515625, -0.24114990234375, -0.2219085693359375, -0.202667236328125, -0.1834259033203125, -0.1641845703125, -0.1449432373046875, -0.125701904296875, -0.1064605712890625, -0.08721923828125, -0.0679779052734375, -0.048736572265625, -0.0294952392578125, -0.01025390625, 0.0089874267578125, 0.028228759765625, 0.0474700927734375, 0.06671142578125, 0.0859527587890625, 0.105194091796875, 0.1244354248046875, 0.1436767578125, 0.1629180908203125, 0.182159423828125, 0.2014007568359375, 0.22064208984375, 0.2398834228515625, 0.259124755859375, 0.2783660888671875, 0.297607421875, 0.3168487548828125, 0.336090087890625, 0.3553314208984375, 0.37457275390625, 0.3938140869140625, 0.413055419921875, 0.4322967529296875, 0.4515380859375, 0.4707794189453125, 0.490020751953125, 0.5092620849609375, 0.52850341796875, 0.5477447509765625, 0.566986083984375, 0.5862274169921875, 0.60546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 8.0, 10.0, 10.0, 4.0, 11.0, 13.0, 10.0, 12.0, 18.0, 16.0, 25.0, 24.0, 31.0, 35.0, 23.0, 29.0, 27.0, 33.0, 35.0, 41.0, 41.0, 36.0, 59.0, 40.0, 33.0, 45.0, 40.0, 36.0, 31.0, 29.0, 29.0, 27.0, 26.0, 17.0, 20.0, 17.0, 8.0, 7.0, 10.0, 7.0, 7.0, 9.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.541015625, -1.4907684326171875, -1.440521240234375, -1.3902740478515625, -1.34002685546875, -1.2897796630859375, -1.239532470703125, -1.1892852783203125, -1.1390380859375, -1.0887908935546875, -1.038543701171875, -0.9882965087890625, -0.93804931640625, -0.8878021240234375, -0.837554931640625, -0.7873077392578125, -0.737060546875, -0.6868133544921875, -0.636566162109375, -0.5863189697265625, -0.53607177734375, -0.4858245849609375, -0.435577392578125, -0.3853302001953125, -0.3350830078125, -0.2848358154296875, -0.234588623046875, -0.1843414306640625, -0.13409423828125, -0.0838470458984375, -0.033599853515625, 0.0166473388671875, 0.06689453125, 0.1171417236328125, 0.167388916015625, 0.2176361083984375, 0.26788330078125, 0.3181304931640625, 0.368377685546875, 0.4186248779296875, 0.4688720703125, 0.5191192626953125, 0.569366455078125, 0.6196136474609375, 0.66986083984375, 0.7201080322265625, 0.770355224609375, 0.8206024169921875, 0.870849609375, 0.9210968017578125, 0.971343994140625, 1.0215911865234375, 1.07183837890625, 1.1220855712890625, 1.172332763671875, 1.2225799560546875, 1.2728271484375, 1.3230743408203125, 1.373321533203125, 1.4235687255859375, 1.47381591796875, 1.5240631103515625, 1.574310302734375, 1.6245574951171875, 1.6748046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 4.0, 4.0, 5.0, 11.0, 10.0, 15.0, 12.0, 25.0, 29.0, 43.0, 76.0, 105.0, 133.0, 195.0, 323.0, 459.0, 832.0, 1305.0, 2597.0, 5152.0, 11022.0, 30933.0, 146879.0, 629825.0, 162527.0, 32937.0, 11629.0, 5055.0, 2599.0, 1422.0, 836.0, 509.0, 350.0, 191.0, 151.0, 100.0, 79.0, 49.0, 35.0, 21.0, 11.0, 15.0, 14.0, 4.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.316650390625, -0.3066062927246094, -0.29656219482421875, -0.2865180969238281, -0.2764739990234375, -0.2664299011230469, -0.25638580322265625, -0.24634170532226562, -0.236297607421875, -0.22625350952148438, -0.21620941162109375, -0.20616531372070312, -0.1961212158203125, -0.18607711791992188, -0.17603302001953125, -0.16598892211914062, -0.15594482421875, -0.14590072631835938, -0.13585662841796875, -0.12581253051757812, -0.1157684326171875, -0.10572433471679688, -0.09568023681640625, -0.08563613891601562, -0.075592041015625, -0.06554794311523438, -0.05550384521484375, -0.045459747314453125, -0.0354156494140625, -0.025371551513671875, -0.01532745361328125, -0.005283355712890625, 0.0047607421875, 0.014804840087890625, 0.02484893798828125, 0.034893035888671875, 0.0449371337890625, 0.054981231689453125, 0.06502532958984375, 0.07506942749023438, 0.085113525390625, 0.09515762329101562, 0.10520172119140625, 0.11524581909179688, 0.1252899169921875, 0.13533401489257812, 0.14537811279296875, 0.15542221069335938, 0.16546630859375, 0.17551040649414062, 0.18555450439453125, 0.19559860229492188, 0.2056427001953125, 0.21568679809570312, 0.22573089599609375, 0.23577499389648438, 0.245819091796875, 0.2558631896972656, 0.26590728759765625, 0.2759513854980469, 0.2859954833984375, 0.2960395812988281, 0.30608367919921875, 0.3161277770996094, 0.326171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 10.0, 12.0, 13.0, 13.0, 33.0, 23.0, 46.0, 77.0, 90.0, 114.0, 129.0, 125.0, 86.0, 80.0, 37.0, 28.0, 21.0, 21.0, 8.0, 5.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016033649444580078, -0.00015447288751602173, -0.00014860928058624268, -0.00014274567365646362, -0.00013688206672668457, -0.00013101845979690552, -0.00012515485286712646, -0.00011929124593734741, -0.00011342763900756836, -0.0001075640320777893, -0.00010170042514801025, -9.58368182182312e-05, -8.997321128845215e-05, -8.41096043586731e-05, -7.824599742889404e-05, -7.238239049911499e-05, -6.651878356933594e-05, -6.0655176639556885e-05, -5.479156970977783e-05, -4.892796277999878e-05, -4.3064355850219727e-05, -3.7200748920440674e-05, -3.133714199066162e-05, -2.547353506088257e-05, -1.9609928131103516e-05, -1.3746321201324463e-05, -7.88271427154541e-06, -2.0191073417663574e-06, 3.844499588012695e-06, 9.708106517791748e-06, 1.55717134475708e-05, 2.1435320377349854e-05, 2.7298927307128906e-05, 3.316253423690796e-05, 3.902614116668701e-05, 4.4889748096466064e-05, 5.075335502624512e-05, 5.661696195602417e-05, 6.248056888580322e-05, 6.834417581558228e-05, 7.420778274536133e-05, 8.007138967514038e-05, 8.593499660491943e-05, 9.179860353469849e-05, 9.766221046447754e-05, 0.00010352581739425659, 0.00010938942432403564, 0.0001152530312538147, 0.00012111663818359375, 0.0001269802451133728, 0.00013284385204315186, 0.0001387074589729309, 0.00014457106590270996, 0.00015043467283248901, 0.00015629827976226807, 0.00016216188669204712, 0.00016802549362182617, 0.00017388910055160522, 0.00017975270748138428, 0.00018561631441116333, 0.00019147992134094238, 0.00019734352827072144, 0.0002032071352005005, 0.00020907074213027954, 0.0002149343490600586]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 5.0, 5.0, 5.0, 11.0, 11.0, 18.0, 17.0, 27.0, 44.0, 46.0, 84.0, 279.0, 1482.0, 14263.0, 710706.0, 311467.0, 8564.0, 1024.0, 198.0, 101.0, 38.0, 37.0, 23.0, 22.0, 15.0, 11.0, 10.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0111083984375, -0.977294921875, -0.9434814453125, -0.90966796875, -0.8758544921875, -0.842041015625, -0.8082275390625, -0.7744140625, -0.7406005859375, -0.706787109375, -0.6729736328125, -0.63916015625, -0.6053466796875, -0.571533203125, -0.5377197265625, -0.50390625, -0.4700927734375, -0.436279296875, -0.4024658203125, -0.36865234375, -0.3348388671875, -0.301025390625, -0.2672119140625, -0.2333984375, -0.1995849609375, -0.165771484375, -0.1319580078125, -0.09814453125, -0.0643310546875, -0.030517578125, 0.0032958984375, 0.037109375, 0.0709228515625, 0.104736328125, 0.1385498046875, 0.17236328125, 0.2061767578125, 0.239990234375, 0.2738037109375, 0.3076171875, 0.3414306640625, 0.375244140625, 0.4090576171875, 0.44287109375, 0.4766845703125, 0.510498046875, 0.5443115234375, 0.578125, 0.6119384765625, 0.645751953125, 0.6795654296875, 0.71337890625, 0.7471923828125, 0.781005859375, 0.8148193359375, 0.8486328125, 0.8824462890625, 0.916259765625, 0.9500732421875, 0.98388671875, 1.0177001953125, 1.051513671875, 1.0853271484375, 1.119140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 13.0, 7.0, 16.0, 11.0, 19.0, 27.0, 23.0, 35.0, 56.0, 66.0, 71.0, 75.0, 66.0, 71.0, 65.0, 60.0, 66.0, 38.0, 36.0, 37.0, 23.0, 19.0, 11.0, 9.0, 14.0, 14.0, 3.0, 1.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0780029296875, -0.07548236846923828, -0.07296180725097656, -0.07044124603271484, -0.06792068481445312, -0.0654001235961914, -0.06287956237792969, -0.06035900115966797, -0.05783843994140625, -0.05531787872314453, -0.05279731750488281, -0.050276756286621094, -0.047756195068359375, -0.045235633850097656, -0.04271507263183594, -0.04019451141357422, -0.0376739501953125, -0.03515338897705078, -0.03263282775878906, -0.030112266540527344, -0.027591705322265625, -0.025071144104003906, -0.022550582885742188, -0.02003002166748047, -0.01750946044921875, -0.014988899230957031, -0.012468338012695312, -0.009947776794433594, -0.007427215576171875, -0.004906654357910156, -0.0023860931396484375, 0.00013446807861328125, 0.002655029296875, 0.005175590515136719, 0.0076961517333984375, 0.010216712951660156, 0.012737274169921875, 0.015257835388183594, 0.017778396606445312, 0.02029895782470703, 0.02281951904296875, 0.02534008026123047, 0.027860641479492188, 0.030381202697753906, 0.032901763916015625, 0.035422325134277344, 0.03794288635253906, 0.04046344757080078, 0.0429840087890625, 0.04550457000732422, 0.04802513122558594, 0.050545692443847656, 0.053066253662109375, 0.055586814880371094, 0.05810737609863281, 0.06062793731689453, 0.06314849853515625, 0.06566905975341797, 0.06818962097167969, 0.0707101821899414, 0.07323074340820312, 0.07575130462646484, 0.07827186584472656, 0.08079242706298828, 0.08331298828125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 10.0, 32.0, 87.0, 231.0, 280.0, 201.0, 105.0, 35.0, 20.0, 5.0, 4.0], "bins": [-7.9226555824279785, -7.78477668762207, -7.646897792816162, -7.509018898010254, -7.371140003204346, -7.2332611083984375, -7.095382213592529, -6.957503318786621, -6.819624900817871, -6.681746006011963, -6.543867111206055, -6.4059882164001465, -6.268109321594238, -6.13023042678833, -5.992351531982422, -5.854473114013672, -5.7165937423706055, -5.578714847564697, -5.440835952758789, -5.302957057952881, -5.165078163146973, -5.0271992683410645, -4.889320373535156, -4.751441955566406, -4.61356258392334, -4.475683689117432, -4.337804794311523, -4.199925899505615, -4.062047004699707, -3.924168109893799, -3.7862894535064697, -3.6484105587005615, -3.510531425476074, -3.372652530670166, -3.234773635864258, -3.0968947410583496, -2.9590158462524414, -2.821136951446533, -2.683258295059204, -2.545379400253296, -2.407500743865967, -2.2696218490600586, -2.1317429542541504, -1.9938641786575317, -1.8559852838516235, -1.7181063890457153, -1.5802276134490967, -1.4423487186431885, -1.3044697046279907, -1.1665908098220825, -1.0287120342254639, -0.8908331394195557, -0.7529542446136475, -0.6150753498077393, -0.47719651460647583, -0.3393176794052124, -0.2014387845993042, -0.06355991959571838, 0.07431894540786743, 0.21219781041145325, 0.35007667541503906, 0.48795557022094727, 0.6258344054222107, 0.7637132406234741, 0.9015921354293823]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 6.0, 6.0, 5.0, 7.0, 8.0, 14.0, 16.0, 9.0, 12.0, 21.0, 32.0, 29.0, 19.0, 30.0, 24.0, 26.0, 23.0, 47.0, 40.0, 32.0, 46.0, 50.0, 42.0, 43.0, 44.0, 34.0, 29.0, 30.0, 33.0, 33.0, 30.0, 29.0, 26.0, 20.0, 16.0, 14.0, 11.0, 17.0, 7.0, 8.0, 9.0, 9.0, 1.0, 5.0, 1.0, 3.0, 5.0, 2.0, 4.0], "bins": [-0.8810598850250244, -0.8572274446487427, -0.8333950042724609, -0.8095625638961792, -0.7857301235198975, -0.761897623538971, -0.7380651831626892, -0.7142327427864075, -0.6904003024101257, -0.666567862033844, -0.6427354216575623, -0.6189029812812805, -0.595070481300354, -0.5712380409240723, -0.5474056005477905, -0.5235731601715088, -0.49974071979522705, -0.4759082794189453, -0.4520758390426636, -0.42824336886405945, -0.4044109284877777, -0.38057848811149597, -0.35674601793289185, -0.3329135775566101, -0.30908113718032837, -0.28524869680404663, -0.2614162564277649, -0.23758378624916077, -0.21375134587287903, -0.1899189054965973, -0.16608645021915436, -0.14225399494171143, -0.11842155456542969, -0.09458910673856735, -0.07075665891170502, -0.04692421108484268, -0.023091763257980347, 0.0007406845688819885, 0.024573132395744324, 0.048405587673187256, 0.072238028049469, 0.09607047587633133, 0.11990292370319366, 0.1437353789806366, 0.16756781935691833, 0.19140025973320007, 0.215232715010643, 0.23906517028808594, 0.2628976106643677, 0.2867300510406494, 0.31056249141693115, 0.3343949615955353, 0.358227401971817, 0.38205984234809875, 0.4058923125267029, 0.4297247529029846, 0.45355719327926636, 0.4773896336555481, 0.5012220740318298, 0.5250545144081116, 0.5488870143890381, 0.5727194547653198, 0.5965518951416016, 0.6203843355178833, 0.644216775894165]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 3.0, 7.0, 8.0, 10.0, 23.0, 30.0, 42.0, 57.0, 74.0, 121.0, 180.0, 289.0, 389.0, 665.0, 967.0, 1591.0, 2807.0, 4721.0, 9295.0, 19553.0, 49026.0, 133165.0, 308850.0, 302368.0, 127270.0, 47062.0, 19321.0, 8847.0, 4726.0, 2660.0, 1588.0, 1010.0, 659.0, 408.0, 242.0, 160.0, 128.0, 72.0, 50.0, 41.0, 19.0, 18.0, 14.0, 6.0, 5.0, 10.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.366455078125, -0.3538093566894531, -0.34116363525390625, -0.3285179138183594, -0.3158721923828125, -0.3032264709472656, -0.29058074951171875, -0.2779350280761719, -0.265289306640625, -0.2526435852050781, -0.23999786376953125, -0.22735214233398438, -0.2147064208984375, -0.20206069946289062, -0.18941497802734375, -0.17676925659179688, -0.16412353515625, -0.15147781372070312, -0.13883209228515625, -0.12618637084960938, -0.1135406494140625, -0.10089492797851562, -0.08824920654296875, -0.07560348510742188, -0.062957763671875, -0.050312042236328125, -0.03766632080078125, -0.025020599365234375, -0.0123748779296875, 0.000270843505859375, 0.01291656494140625, 0.025562286376953125, 0.0382080078125, 0.050853729248046875, 0.06349945068359375, 0.07614517211914062, 0.0887908935546875, 0.10143661499023438, 0.11408233642578125, 0.12672805786132812, 0.139373779296875, 0.15201950073242188, 0.16466522216796875, 0.17731094360351562, 0.1899566650390625, 0.20260238647460938, 0.21524810791015625, 0.22789382934570312, 0.24053955078125, 0.2531852722167969, 0.26583099365234375, 0.2784767150878906, 0.2911224365234375, 0.3037681579589844, 0.31641387939453125, 0.3290596008300781, 0.341705322265625, 0.3543510437011719, 0.36699676513671875, 0.3796424865722656, 0.3922882080078125, 0.4049339294433594, 0.41757965087890625, 0.4302253723144531, 0.44287109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 7.0, 8.0, 10.0, 9.0, 6.0, 6.0, 16.0, 18.0, 22.0, 22.0, 27.0, 24.0, 33.0, 41.0, 33.0, 36.0, 53.0, 46.0, 50.0, 54.0, 48.0, 28.0, 49.0, 54.0, 28.0, 38.0, 31.0, 19.0, 23.0, 25.0, 19.0, 20.0, 17.0, 10.0, 9.0, 13.0, 11.0, 8.0, 6.0, 0.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-3.392578125, -3.297698974609375, -3.20281982421875, -3.107940673828125, -3.0130615234375, -2.918182373046875, -2.82330322265625, -2.728424072265625, -2.633544921875, -2.538665771484375, -2.44378662109375, -2.348907470703125, -2.2540283203125, -2.159149169921875, -2.06427001953125, -1.969390869140625, -1.87451171875, -1.779632568359375, -1.68475341796875, -1.589874267578125, -1.4949951171875, -1.400115966796875, -1.30523681640625, -1.210357666015625, -1.115478515625, -1.020599365234375, -0.92572021484375, -0.830841064453125, -0.7359619140625, -0.641082763671875, -0.54620361328125, -0.451324462890625, -0.3564453125, -0.261566162109375, -0.16668701171875, -0.071807861328125, 0.0230712890625, 0.117950439453125, 0.21282958984375, 0.307708740234375, 0.402587890625, 0.497467041015625, 0.59234619140625, 0.687225341796875, 0.7821044921875, 0.876983642578125, 0.97186279296875, 1.066741943359375, 1.16162109375, 1.256500244140625, 1.35137939453125, 1.446258544921875, 1.5411376953125, 1.636016845703125, 1.73089599609375, 1.825775146484375, 1.920654296875, 2.015533447265625, 2.11041259765625, 2.205291748046875, 2.3001708984375, 2.395050048828125, 2.48992919921875, 2.584808349609375, 2.6796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 7.0, 4.0, 13.0, 20.0, 24.0, 43.0, 50.0, 43.0, 68.0, 101.0, 120.0, 173.0, 296.0, 624.0, 2299.0, 132478.0, 901979.0, 8173.0, 907.0, 370.0, 228.0, 142.0, 105.0, 77.0, 50.0, 30.0, 28.0, 26.0, 16.0, 14.0, 10.0, 10.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.090972900390625, -2.02178955078125, -1.952606201171875, -1.8834228515625, -1.814239501953125, -1.74505615234375, -1.675872802734375, -1.606689453125, -1.537506103515625, -1.46832275390625, -1.399139404296875, -1.3299560546875, -1.260772705078125, -1.19158935546875, -1.122406005859375, -1.05322265625, -0.984039306640625, -0.91485595703125, -0.845672607421875, -0.7764892578125, -0.707305908203125, -0.63812255859375, -0.568939208984375, -0.499755859375, -0.430572509765625, -0.36138916015625, -0.292205810546875, -0.2230224609375, -0.153839111328125, -0.08465576171875, -0.015472412109375, 0.0537109375, 0.122894287109375, 0.19207763671875, 0.261260986328125, 0.3304443359375, 0.399627685546875, 0.46881103515625, 0.537994384765625, 0.607177734375, 0.676361083984375, 0.74554443359375, 0.814727783203125, 0.8839111328125, 0.953094482421875, 1.02227783203125, 1.091461181640625, 1.16064453125, 1.229827880859375, 1.29901123046875, 1.368194580078125, 1.4373779296875, 1.506561279296875, 1.57574462890625, 1.644927978515625, 1.714111328125, 1.783294677734375, 1.85247802734375, 1.921661376953125, 1.9908447265625, 2.060028076171875, 2.12921142578125, 2.198394775390625, 2.267578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 0.0, 3.0, 4.0, 11.0, 8.0, 14.0, 10.0, 8.0, 10.0, 18.0, 16.0, 23.0, 19.0, 18.0, 31.0, 29.0, 29.0, 31.0, 44.0, 33.0, 40.0, 49.0, 46.0, 30.0, 37.0, 40.0, 48.0, 43.0, 37.0, 34.0, 36.0, 22.0, 24.0, 23.0, 26.0, 23.0, 16.0, 18.0, 12.0, 6.0, 11.0, 4.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.9765625, -2.882965087890625, -2.78936767578125, -2.695770263671875, -2.6021728515625, -2.508575439453125, -2.41497802734375, -2.321380615234375, -2.227783203125, -2.134185791015625, -2.04058837890625, -1.946990966796875, -1.8533935546875, -1.759796142578125, -1.66619873046875, -1.572601318359375, -1.47900390625, -1.385406494140625, -1.29180908203125, -1.198211669921875, -1.1046142578125, -1.011016845703125, -0.91741943359375, -0.823822021484375, -0.730224609375, -0.636627197265625, -0.54302978515625, -0.449432373046875, -0.3558349609375, -0.262237548828125, -0.16864013671875, -0.075042724609375, 0.0185546875, 0.112152099609375, 0.20574951171875, 0.299346923828125, 0.3929443359375, 0.486541748046875, 0.58013916015625, 0.673736572265625, 0.767333984375, 0.860931396484375, 0.95452880859375, 1.048126220703125, 1.1417236328125, 1.235321044921875, 1.32891845703125, 1.422515869140625, 1.51611328125, 1.609710693359375, 1.70330810546875, 1.796905517578125, 1.8905029296875, 1.984100341796875, 2.07769775390625, 2.171295166015625, 2.264892578125, 2.358489990234375, 2.45208740234375, 2.545684814453125, 2.6392822265625, 2.732879638671875, 2.82647705078125, 2.920074462890625, 3.013671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 11.0, 11.0, 12.0, 22.0, 34.0, 70.0, 96.0, 195.0, 341.0, 676.0, 1388.0, 3651.0, 13208.0, 901591.0, 113979.0, 8316.0, 2623.0, 1093.0, 558.0, 272.0, 162.0, 106.0, 47.0, 32.0, 24.0, 11.0, 9.0, 6.0, 8.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4599609375, -0.44637298583984375, -0.4327850341796875, -0.41919708251953125, -0.405609130859375, -0.39202117919921875, -0.3784332275390625, -0.36484527587890625, -0.35125732421875, -0.33766937255859375, -0.3240814208984375, -0.31049346923828125, -0.296905517578125, -0.28331756591796875, -0.2697296142578125, -0.25614166259765625, -0.2425537109375, -0.22896575927734375, -0.2153778076171875, -0.20178985595703125, -0.188201904296875, -0.17461395263671875, -0.1610260009765625, -0.14743804931640625, -0.13385009765625, -0.12026214599609375, -0.1066741943359375, -0.09308624267578125, -0.079498291015625, -0.06591033935546875, -0.0523223876953125, -0.03873443603515625, -0.025146484375, -0.01155853271484375, 0.0020294189453125, 0.01561737060546875, 0.029205322265625, 0.04279327392578125, 0.0563812255859375, 0.06996917724609375, 0.08355712890625, 0.09714508056640625, 0.1107330322265625, 0.12432098388671875, 0.137908935546875, 0.15149688720703125, 0.1650848388671875, 0.17867279052734375, 0.1922607421875, 0.20584869384765625, 0.2194366455078125, 0.23302459716796875, 0.246612548828125, 0.26020050048828125, 0.2737884521484375, 0.28737640380859375, 0.30096435546875, 0.31455230712890625, 0.3281402587890625, 0.34172821044921875, 0.355316162109375, 0.36890411376953125, 0.3824920654296875, 0.39608001708984375, 0.40966796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 13.0, 14.0, 37.0, 73.0, 229.0, 366.0, 147.0, 53.0, 29.0, 10.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.902217864990234e-05, -6.730575114488602e-05, -6.558932363986969e-05, -6.387289613485336e-05, -6.215646862983704e-05, -6.044004112482071e-05, -5.872361361980438e-05, -5.7007186114788055e-05, -5.529075860977173e-05, -5.35743311047554e-05, -5.1857903599739075e-05, -5.014147609472275e-05, -4.842504858970642e-05, -4.6708621084690094e-05, -4.499219357967377e-05, -4.327576607465744e-05, -4.155933856964111e-05, -3.9842911064624786e-05, -3.812648355960846e-05, -3.641005605459213e-05, -3.4693628549575806e-05, -3.297720104455948e-05, -3.126077353954315e-05, -2.9544346034526825e-05, -2.7827918529510498e-05, -2.611149102449417e-05, -2.4395063519477844e-05, -2.2678636014461517e-05, -2.096220850944519e-05, -1.9245781004428864e-05, -1.7529353499412537e-05, -1.581292599439621e-05, -1.4096498489379883e-05, -1.2380070984363556e-05, -1.0663643479347229e-05, -8.947215974330902e-06, -7.230788469314575e-06, -5.514360964298248e-06, -3.7979334592819214e-06, -2.0815059542655945e-06, -3.650784492492676e-07, 1.3513490557670593e-06, 3.0677765607833862e-06, 4.784204065799713e-06, 6.50063157081604e-06, 8.217059075832367e-06, 9.933486580848694e-06, 1.164991408586502e-05, 1.3366341590881348e-05, 1.5082769095897675e-05, 1.6799196600914e-05, 1.851562410593033e-05, 2.0232051610946655e-05, 2.1948479115962982e-05, 2.366490662097931e-05, 2.5381334125995636e-05, 2.7097761631011963e-05, 2.881418913602829e-05, 3.053061664104462e-05, 3.2247044146060944e-05, 3.396347165107727e-05, 3.56798991560936e-05, 3.7396326661109924e-05, 3.911275416612625e-05, 4.082918167114258e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 7.0, 1.0, 11.0, 11.0, 38.0, 72.0, 151.0, 452.0, 1499.0, 7000.0, 192382.0, 835711.0, 8678.0, 1691.0, 488.0, 202.0, 71.0, 39.0, 15.0, 9.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6201171875, -0.6013565063476562, -0.5825958251953125, -0.5638351440429688, -0.545074462890625, -0.5263137817382812, -0.5075531005859375, -0.48879241943359375, -0.47003173828125, -0.45127105712890625, -0.4325103759765625, -0.41374969482421875, -0.394989013671875, -0.37622833251953125, -0.3574676513671875, -0.33870697021484375, -0.3199462890625, -0.30118560791015625, -0.2824249267578125, -0.26366424560546875, -0.244903564453125, -0.22614288330078125, -0.2073822021484375, -0.18862152099609375, -0.16986083984375, -0.15110015869140625, -0.1323394775390625, -0.11357879638671875, -0.094818115234375, -0.07605743408203125, -0.0572967529296875, -0.03853607177734375, -0.019775390625, -0.00101470947265625, 0.0177459716796875, 0.03650665283203125, 0.055267333984375, 0.07402801513671875, 0.0927886962890625, 0.11154937744140625, 0.13031005859375, 0.14907073974609375, 0.1678314208984375, 0.18659210205078125, 0.205352783203125, 0.22411346435546875, 0.2428741455078125, 0.26163482666015625, 0.2803955078125, 0.29915618896484375, 0.3179168701171875, 0.33667755126953125, 0.355438232421875, 0.37419891357421875, 0.3929595947265625, 0.41172027587890625, 0.43048095703125, 0.44924163818359375, 0.4680023193359375, 0.48676300048828125, 0.505523681640625, 0.5242843627929688, 0.5430450439453125, 0.5618057250976562, 0.58056640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 10.0, 4.0, 10.0, 24.0, 35.0, 92.0, 417.0, 247.0, 56.0, 31.0, 16.0, 11.0, 8.0, 13.0, 3.0, 7.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11944580078125, -0.11499691009521484, -0.11054801940917969, -0.10609912872314453, -0.10165023803710938, -0.09720134735107422, -0.09275245666503906, -0.0883035659790039, -0.08385467529296875, -0.0794057846069336, -0.07495689392089844, -0.07050800323486328, -0.06605911254882812, -0.06161022186279297, -0.05716133117675781, -0.052712440490722656, -0.0482635498046875, -0.043814659118652344, -0.03936576843261719, -0.03491687774658203, -0.030467987060546875, -0.02601909637451172, -0.021570205688476562, -0.017121315002441406, -0.01267242431640625, -0.008223533630371094, -0.0037746429443359375, 0.0006742477416992188, 0.005123138427734375, 0.009572029113769531, 0.014020919799804688, 0.018469810485839844, 0.022918701171875, 0.027367591857910156, 0.03181648254394531, 0.03626537322998047, 0.040714263916015625, 0.04516315460205078, 0.04961204528808594, 0.054060935974121094, 0.05850982666015625, 0.0629587173461914, 0.06740760803222656, 0.07185649871826172, 0.07630538940429688, 0.08075428009033203, 0.08520317077636719, 0.08965206146240234, 0.0941009521484375, 0.09854984283447266, 0.10299873352050781, 0.10744762420654297, 0.11189651489257812, 0.11634540557861328, 0.12079429626464844, 0.1252431869506836, 0.12969207763671875, 0.1341409683227539, 0.13858985900878906, 0.14303874969482422, 0.14748764038085938, 0.15193653106689453, 0.1563854217529297, 0.16083431243896484, 0.165283203125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 12.0, 15.0, 42.0, 63.0, 127.0, 179.0, 181.0, 140.0, 118.0, 52.0, 44.0, 19.0, 10.0, 3.0, 8.0], "bins": [-7.642716884613037, -7.5045037269592285, -7.36629056930542, -7.228076934814453, -7.0898637771606445, -6.951650619506836, -6.813437461853027, -6.675224304199219, -6.53701114654541, -6.398797988891602, -6.260584831237793, -6.122371673583984, -5.984158039093018, -5.845944881439209, -5.7077317237854, -5.569518566131592, -5.431304931640625, -5.293091773986816, -5.154878616333008, -5.016665458679199, -4.878451824188232, -4.740238666534424, -4.602025508880615, -4.463812351226807, -4.325599193572998, -4.1873860359191895, -4.049172878265381, -3.910959482192993, -3.7727463245391846, -3.634532928466797, -3.4963197708129883, -3.3581066131591797, -3.219892978668213, -3.0816798210144043, -2.9434664249420166, -2.805253267288208, -2.6670401096343994, -2.5288267135620117, -2.390613555908203, -2.2524003982543945, -2.114187240600586, -1.9759739637374878, -1.8377608060836792, -1.699547529220581, -1.5613343715667725, -1.4231210947036743, -1.2849078178405762, -1.1466946601867676, -1.0084813833236694, -0.8702681660652161, -0.7320549488067627, -0.5938416719436646, -0.4556284546852112, -0.3174152374267578, -0.17920196056365967, -0.0409887433052063, 0.09722447395324707, 0.23543770611286163, 0.3736509382724762, 0.511864185333252, 0.6500774025917053, 0.7882906198501587, 0.9265038967132568, 1.0647170543670654, 1.2029303312301636]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 11.0, 6.0, 8.0, 8.0, 16.0, 7.0, 19.0, 26.0, 22.0, 29.0, 26.0, 29.0, 29.0, 30.0, 41.0, 45.0, 34.0, 38.0, 30.0, 35.0, 44.0, 38.0, 44.0, 42.0, 38.0, 28.0, 27.0, 25.0, 27.0, 28.0, 18.0, 17.0, 20.0, 19.0, 12.0, 13.0, 16.0, 9.0, 6.0, 8.0, 8.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.250396251678467, -5.103309631347656, -4.9562225341796875, -4.809135913848877, -4.662048816680908, -4.514962196350098, -4.367875099182129, -4.220788478851318, -4.073701858520508, -3.926614999771118, -3.7795281410217285, -3.632441282272339, -3.485354423522949, -3.3382678031921387, -3.191180944442749, -3.0440940856933594, -2.8970069885253906, -2.749920129776001, -2.6028332710266113, -2.4557464122772217, -2.308659553527832, -2.1615729331970215, -2.014486074447632, -1.8673992156982422, -1.7203123569488525, -1.573225498199463, -1.4261386394500732, -1.2790518999099731, -1.1319650411605835, -0.9848781824111938, -0.837791383266449, -0.6907045841217041, -0.5436172485351562, -0.396530419588089, -0.24944359064102173, -0.10235676169395447, 0.04473006725311279, 0.19181692600250244, 0.3389037251472473, 0.4859905242919922, 0.6330773830413818, 0.7801642417907715, 0.9272510409355164, 1.0743378400802612, 1.2214246988296509, 1.3685115575790405, 1.5155982971191406, 1.6626851558685303, 1.80977201461792, 1.9568588733673096, 2.103945732116699, 2.251032590866089, 2.3981194496154785, 2.545206069946289, 2.6922929286956787, 2.8393797874450684, 2.986466646194458, 3.1335535049438477, 3.2806403636932373, 3.427727222442627, 3.5748138427734375, 3.7219009399414062, 3.868987560272217, 4.016074180603027, 4.163161277770996]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 7.0, 9.0, 17.0, 6.0, 16.0, 11.0, 17.0, 31.0, 50.0, 57.0, 78.0, 139.0, 208.0, 402.0, 825.0, 1865.0, 5047.0, 16806.0, 87382.0, 942823.0, 2769022.0, 310923.0, 41304.0, 10677.0, 3659.0, 1494.0, 622.0, 332.0, 154.0, 96.0, 52.0, 43.0, 19.0, 20.0, 14.0, 15.0, 8.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.7470703125, -1.7002105712890625, -1.653350830078125, -1.6064910888671875, -1.55963134765625, -1.5127716064453125, -1.465911865234375, -1.4190521240234375, -1.3721923828125, -1.3253326416015625, -1.278472900390625, -1.2316131591796875, -1.18475341796875, -1.1378936767578125, -1.091033935546875, -1.0441741943359375, -0.997314453125, -0.9504547119140625, -0.903594970703125, -0.8567352294921875, -0.80987548828125, -0.7630157470703125, -0.716156005859375, -0.6692962646484375, -0.6224365234375, -0.5755767822265625, -0.528717041015625, -0.4818572998046875, -0.43499755859375, -0.3881378173828125, -0.341278076171875, -0.2944183349609375, -0.24755859375, -0.2006988525390625, -0.153839111328125, -0.1069793701171875, -0.06011962890625, -0.0132598876953125, 0.033599853515625, 0.0804595947265625, 0.1273193359375, 0.1741790771484375, 0.221038818359375, 0.2678985595703125, 0.31475830078125, 0.3616180419921875, 0.408477783203125, 0.4553375244140625, 0.502197265625, 0.5490570068359375, 0.595916748046875, 0.6427764892578125, 0.68963623046875, 0.7364959716796875, 0.783355712890625, 0.8302154541015625, 0.8770751953125, 0.9239349365234375, 0.970794677734375, 1.0176544189453125, 1.06451416015625, 1.1113739013671875, 1.158233642578125, 1.2050933837890625, 1.251953125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 6.0, 9.0, 14.0, 13.0, 19.0, 16.0, 23.0, 40.0, 28.0, 35.0, 58.0, 55.0, 57.0, 67.0, 47.0, 66.0, 68.0, 70.0, 53.0, 49.0, 44.0, 31.0, 36.0, 20.0, 22.0, 22.0, 13.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0], "bins": [-1.7646484375, -1.7251739501953125, -1.685699462890625, -1.6462249755859375, -1.60675048828125, -1.5672760009765625, -1.527801513671875, -1.4883270263671875, -1.4488525390625, -1.4093780517578125, -1.369903564453125, -1.3304290771484375, -1.29095458984375, -1.2514801025390625, -1.212005615234375, -1.1725311279296875, -1.133056640625, -1.0935821533203125, -1.054107666015625, -1.0146331787109375, -0.97515869140625, -0.9356842041015625, -0.896209716796875, -0.8567352294921875, -0.8172607421875, -0.7777862548828125, -0.738311767578125, -0.6988372802734375, -0.65936279296875, -0.6198883056640625, -0.580413818359375, -0.5409393310546875, -0.50146484375, -0.4619903564453125, -0.422515869140625, -0.3830413818359375, -0.34356689453125, -0.3040924072265625, -0.264617919921875, -0.2251434326171875, -0.1856689453125, -0.1461944580078125, -0.106719970703125, -0.0672454833984375, -0.02777099609375, 0.0117034912109375, 0.051177978515625, 0.0906524658203125, 0.130126953125, 0.1696014404296875, 0.209075927734375, 0.2485504150390625, 0.28802490234375, 0.3274993896484375, 0.366973876953125, 0.4064483642578125, 0.4459228515625, 0.4853973388671875, 0.524871826171875, 0.5643463134765625, 0.60382080078125, 0.6432952880859375, 0.682769775390625, 0.7222442626953125, 0.76171875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 18.0, 24.0, 51.0, 99.0, 351.0, 30195.0, 4162677.0, 580.0, 152.0, 62.0, 32.0, 15.0, 7.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-22.078125, -21.5782470703125, -21.078369140625, -20.5784912109375, -20.07861328125, -19.5787353515625, -19.078857421875, -18.5789794921875, -18.0791015625, -17.5792236328125, -17.079345703125, -16.5794677734375, -16.07958984375, -15.5797119140625, -15.079833984375, -14.5799560546875, -14.080078125, -13.5802001953125, -13.080322265625, -12.5804443359375, -12.08056640625, -11.5806884765625, -11.080810546875, -10.5809326171875, -10.0810546875, -9.5811767578125, -9.081298828125, -8.5814208984375, -8.08154296875, -7.5816650390625, -7.081787109375, -6.5819091796875, -6.08203125, -5.5821533203125, -5.082275390625, -4.5823974609375, -4.08251953125, -3.5826416015625, -3.082763671875, -2.5828857421875, -2.0830078125, -1.5831298828125, -1.083251953125, -0.5833740234375, -0.08349609375, 0.4163818359375, 0.916259765625, 1.4161376953125, 1.916015625, 2.4158935546875, 2.915771484375, 3.4156494140625, 3.91552734375, 4.4154052734375, 4.915283203125, 5.4151611328125, 5.9150390625, 6.4149169921875, 6.914794921875, 7.4146728515625, 7.91455078125, 8.4144287109375, 8.914306640625, 9.4141845703125, 9.9140625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 10.0, 12.0, 20.0, 42.0, 60.0, 108.0, 167.0, 333.0, 776.0, 1205.0, 668.0, 310.0, 146.0, 84.0, 44.0, 34.0, 14.0, 15.0, 10.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.7780418395996094, -0.7596969604492188, -0.7413520812988281, -0.7230072021484375, -0.7046623229980469, -0.6863174438476562, -0.6679725646972656, -0.649627685546875, -0.6312828063964844, -0.6129379272460938, -0.5945930480957031, -0.5762481689453125, -0.5579032897949219, -0.5395584106445312, -0.5212135314941406, -0.50286865234375, -0.4845237731933594, -0.46617889404296875, -0.4478340148925781, -0.4294891357421875, -0.4111442565917969, -0.39279937744140625, -0.3744544982910156, -0.356109619140625, -0.3377647399902344, -0.31941986083984375, -0.3010749816894531, -0.2827301025390625, -0.2643852233886719, -0.24604034423828125, -0.22769546508789062, -0.2093505859375, -0.19100570678710938, -0.17266082763671875, -0.15431594848632812, -0.1359710693359375, -0.11762619018554688, -0.09928131103515625, -0.08093643188476562, -0.062591552734375, -0.044246673583984375, -0.02590179443359375, -0.007556915283203125, 0.0107879638671875, 0.029132843017578125, 0.04747772216796875, 0.06582260131835938, 0.08416748046875, 0.10251235961914062, 0.12085723876953125, 0.13920211791992188, 0.1575469970703125, 0.17589187622070312, 0.19423675537109375, 0.21258163452148438, 0.230926513671875, 0.24927139282226562, 0.26761627197265625, 0.2859611511230469, 0.3043060302734375, 0.3226509094238281, 0.34099578857421875, 0.3593406677246094, 0.377685546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 13.0, 29.0, 52.0, 104.0, 142.0, 175.0, 169.0, 125.0, 76.0, 60.0, 28.0, 12.0, 13.0, 2.0, 1.0, 2.0, 3.0], "bins": [-5.074952602386475, -4.978900909423828, -4.88284969329834, -4.786798000335693, -4.690746784210205, -4.594695091247559, -4.49864387512207, -4.402592182159424, -4.3065409660339355, -4.210489273071289, -4.114438056945801, -4.018386363983154, -3.922335147857666, -3.8262836933135986, -3.7302322387695312, -3.634180784225464, -3.5381293296813965, -3.442077875137329, -3.3460264205932617, -3.2499749660491943, -3.153923511505127, -3.0578720569610596, -2.961820602416992, -2.865769147872925, -2.7697174549102783, -2.673666000366211, -2.5776145458221436, -2.481563091278076, -2.385511636734009, -2.2894601821899414, -2.193408727645874, -2.0973572731018066, -2.0013058185577393, -1.9052543640136719, -1.8092029094696045, -1.713151454925537, -1.6171000003814697, -1.5210485458374023, -1.424997091293335, -1.3289456367492676, -1.2328941822052002, -1.1368427276611328, -1.0407912731170654, -0.944739818572998, -0.8486883640289307, -0.7526369094848633, -0.6565853953361511, -0.5605339407920837, -0.4644824266433716, -0.3684309720993042, -0.2723795175552368, -0.17632803320884705, -0.08027657866477966, 0.01577487587928772, 0.11182636022567749, 0.20787781476974487, 0.30392926931381226, 0.39998072385787964, 0.496032178401947, 0.5920836925506592, 0.6881351470947266, 0.784186601638794, 0.8802380561828613, 0.9762895107269287, 1.072340965270996]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 7.0, 5.0, 8.0, 10.0, 11.0, 20.0, 22.0, 23.0, 12.0, 24.0, 29.0, 23.0, 23.0, 38.0, 42.0, 48.0, 38.0, 43.0, 49.0, 43.0, 36.0, 52.0, 44.0, 34.0, 40.0, 40.0, 24.0, 32.0, 27.0, 19.0, 26.0, 17.0, 15.0, 14.0, 16.0, 2.0, 13.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 5.0, 1.0, 2.0], "bins": [-1.1443462371826172, -1.114729881286621, -1.085113525390625, -1.055497169494629, -1.0258808135986328, -0.9962645173072815, -0.9666481614112854, -0.9370318055152893, -0.907415509223938, -0.8777991533279419, -0.8481827974319458, -0.8185664415359497, -0.7889501452445984, -0.7593337893486023, -0.7297174334526062, -0.7001010775566101, -0.670484721660614, -0.6408683657646179, -0.6112520098686218, -0.5816357135772705, -0.5520193576812744, -0.5224030017852783, -0.4927866458892822, -0.46317028999328613, -0.4335539638996124, -0.40393760800361633, -0.3743212819099426, -0.34470492601394653, -0.31508857011795044, -0.28547224402427673, -0.25585588812828064, -0.22623954713344574, -0.19662314653396606, -0.16700680553913116, -0.13739046454429626, -0.10777410864830017, -0.07815776765346527, -0.04854142665863037, -0.018925070762634277, 0.010691270232200623, 0.04030761122703552, 0.06992395222187042, 0.09954030066728592, 0.12915664911270142, 0.15877299010753632, 0.18838933110237122, 0.2180056869983673, 0.2476220279932022, 0.2772383689880371, 0.3068547248840332, 0.3364710509777069, 0.366087406873703, 0.3957037329673767, 0.4253200888633728, 0.4549364447593689, 0.484552800655365, 0.5141690969467163, 0.5437854528427124, 0.5734018087387085, 0.6030181646347046, 0.6326344609260559, 0.662250816822052, 0.6918671727180481, 0.7214835286140442, 0.7510998845100403]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 8.0, 4.0, 10.0, 13.0, 26.0, 25.0, 37.0, 57.0, 73.0, 114.0, 170.0, 279.0, 420.0, 740.0, 1153.0, 2010.0, 3483.0, 6285.0, 12318.0, 25275.0, 57788.0, 134685.0, 289723.0, 279631.0, 128685.0, 54916.0, 24302.0, 11763.0, 6183.0, 3369.0, 1909.0, 1164.0, 683.0, 472.0, 261.0, 155.0, 123.0, 88.0, 37.0, 41.0, 24.0, 18.0, 9.0, 10.0, 4.0, 8.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.39306640625, -0.3811454772949219, -0.36922454833984375, -0.3573036193847656, -0.3453826904296875, -0.3334617614746094, -0.32154083251953125, -0.3096199035644531, -0.297698974609375, -0.2857780456542969, -0.27385711669921875, -0.2619361877441406, -0.2500152587890625, -0.23809432983398438, -0.22617340087890625, -0.21425247192382812, -0.20233154296875, -0.19041061401367188, -0.17848968505859375, -0.16656875610351562, -0.1546478271484375, -0.14272689819335938, -0.13080596923828125, -0.11888504028320312, -0.106964111328125, -0.09504318237304688, -0.08312225341796875, -0.07120132446289062, -0.0592803955078125, -0.047359466552734375, -0.03543853759765625, -0.023517608642578125, -0.0115966796875, 0.000324249267578125, 0.01224517822265625, 0.024166107177734375, 0.0360870361328125, 0.048007965087890625, 0.05992889404296875, 0.07184982299804688, 0.083770751953125, 0.09569168090820312, 0.10761260986328125, 0.11953353881835938, 0.1314544677734375, 0.14337539672851562, 0.15529632568359375, 0.16721725463867188, 0.17913818359375, 0.19105911254882812, 0.20298004150390625, 0.21490097045898438, 0.2268218994140625, 0.23874282836914062, 0.25066375732421875, 0.2625846862792969, 0.274505615234375, 0.2864265441894531, 0.29834747314453125, 0.3102684020996094, 0.3221893310546875, 0.3341102600097656, 0.34603118896484375, 0.3579521179199219, 0.369873046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 8.0, 5.0, 10.0, 11.0, 17.0, 25.0, 21.0, 24.0, 31.0, 35.0, 44.0, 55.0, 69.0, 42.0, 67.0, 56.0, 60.0, 58.0, 55.0, 57.0, 36.0, 41.0, 42.0, 26.0, 24.0, 12.0, 15.0, 17.0, 14.0, 10.0, 7.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.98046875, -0.9536285400390625, -0.926788330078125, -0.8999481201171875, -0.87310791015625, -0.8462677001953125, -0.819427490234375, -0.7925872802734375, -0.7657470703125, -0.7389068603515625, -0.712066650390625, -0.6852264404296875, -0.65838623046875, -0.6315460205078125, -0.604705810546875, -0.5778656005859375, -0.551025390625, -0.5241851806640625, -0.497344970703125, -0.4705047607421875, -0.44366455078125, -0.4168243408203125, -0.389984130859375, -0.3631439208984375, -0.3363037109375, -0.3094635009765625, -0.282623291015625, -0.2557830810546875, -0.22894287109375, -0.2021026611328125, -0.175262451171875, -0.1484222412109375, -0.12158203125, -0.0947418212890625, -0.067901611328125, -0.0410614013671875, -0.01422119140625, 0.0126190185546875, 0.039459228515625, 0.0662994384765625, 0.0931396484375, 0.1199798583984375, 0.146820068359375, 0.1736602783203125, 0.20050048828125, 0.2273406982421875, 0.254180908203125, 0.2810211181640625, 0.307861328125, 0.3347015380859375, 0.361541748046875, 0.3883819580078125, 0.41522216796875, 0.4420623779296875, 0.468902587890625, 0.4957427978515625, 0.5225830078125, 0.5494232177734375, 0.576263427734375, 0.6031036376953125, 0.62994384765625, 0.6567840576171875, 0.683624267578125, 0.7104644775390625, 0.7373046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 2.0, 6.0, 11.0, 9.0, 14.0, 18.0, 30.0, 37.0, 61.0, 106.0, 150.0, 241.0, 407.0, 804.0, 1453.0, 3321.0, 8776.0, 29069.0, 128549.0, 538258.0, 260959.0, 52599.0, 14277.0, 4887.0, 2093.0, 1016.0, 534.0, 291.0, 163.0, 131.0, 85.0, 50.0, 37.0, 28.0, 20.0, 13.0, 12.0, 10.0, 6.0, 6.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.58935546875, -0.5728530883789062, -0.5563507080078125, -0.5398483276367188, -0.523345947265625, -0.5068435668945312, -0.4903411865234375, -0.47383880615234375, -0.45733642578125, -0.44083404541015625, -0.4243316650390625, -0.40782928466796875, -0.391326904296875, -0.37482452392578125, -0.3583221435546875, -0.34181976318359375, -0.3253173828125, -0.30881500244140625, -0.2923126220703125, -0.27581024169921875, -0.259307861328125, -0.24280548095703125, -0.2263031005859375, -0.20980072021484375, -0.19329833984375, -0.17679595947265625, -0.1602935791015625, -0.14379119873046875, -0.127288818359375, -0.11078643798828125, -0.0942840576171875, -0.07778167724609375, -0.061279296875, -0.04477691650390625, -0.0282745361328125, -0.01177215576171875, 0.004730224609375, 0.02123260498046875, 0.0377349853515625, 0.05423736572265625, 0.07073974609375, 0.08724212646484375, 0.1037445068359375, 0.12024688720703125, 0.136749267578125, 0.15325164794921875, 0.1697540283203125, 0.18625640869140625, 0.2027587890625, 0.21926116943359375, 0.2357635498046875, 0.25226593017578125, 0.268768310546875, 0.28527069091796875, 0.3017730712890625, 0.31827545166015625, 0.33477783203125, 0.35128021240234375, 0.3677825927734375, 0.38428497314453125, 0.400787353515625, 0.41728973388671875, 0.4337921142578125, 0.45029449462890625, 0.466796875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 3.0, 4.0, 8.0, 8.0, 4.0, 7.0, 10.0, 14.0, 20.0, 13.0, 18.0, 28.0, 25.0, 29.0, 27.0, 34.0, 37.0, 43.0, 35.0, 40.0, 56.0, 39.0, 46.0, 37.0, 42.0, 41.0, 53.0, 38.0, 39.0, 22.0, 27.0, 18.0, 35.0, 15.0, 13.0, 12.0, 11.0, 15.0, 11.0, 8.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.22845458984375, -1.1883544921875, -1.14825439453125, -1.108154296875, -1.06805419921875, -1.0279541015625, -0.98785400390625, -0.94775390625, -0.90765380859375, -0.8675537109375, -0.82745361328125, -0.787353515625, -0.74725341796875, -0.7071533203125, -0.66705322265625, -0.626953125, -0.58685302734375, -0.5467529296875, -0.50665283203125, -0.466552734375, -0.42645263671875, -0.3863525390625, -0.34625244140625, -0.30615234375, -0.26605224609375, -0.2259521484375, -0.18585205078125, -0.145751953125, -0.10565185546875, -0.0655517578125, -0.02545166015625, 0.0146484375, 0.05474853515625, 0.0948486328125, 0.13494873046875, 0.175048828125, 0.21514892578125, 0.2552490234375, 0.29534912109375, 0.33544921875, 0.37554931640625, 0.4156494140625, 0.45574951171875, 0.495849609375, 0.53594970703125, 0.5760498046875, 0.61614990234375, 0.65625, 0.69635009765625, 0.7364501953125, 0.77655029296875, 0.816650390625, 0.85675048828125, 0.8968505859375, 0.93695068359375, 0.97705078125, 1.01715087890625, 1.0572509765625, 1.09735107421875, 1.137451171875, 1.17755126953125, 1.2176513671875, 1.25775146484375, 1.2978515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 9.0, 8.0, 21.0, 19.0, 27.0, 53.0, 94.0, 144.0, 178.0, 340.0, 663.0, 1259.0, 2640.0, 6205.0, 17814.0, 71658.0, 472490.0, 387102.0, 61170.0, 15836.0, 5684.0, 2475.0, 1131.0, 612.0, 342.0, 209.0, 129.0, 73.0, 58.0, 29.0, 16.0, 16.0, 14.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228271484375, -0.22064971923828125, -0.2130279541015625, -0.20540618896484375, -0.197784423828125, -0.19016265869140625, -0.1825408935546875, -0.17491912841796875, -0.16729736328125, -0.15967559814453125, -0.1520538330078125, -0.14443206787109375, -0.136810302734375, -0.12918853759765625, -0.1215667724609375, -0.11394500732421875, -0.1063232421875, -0.09870147705078125, -0.0910797119140625, -0.08345794677734375, -0.075836181640625, -0.06821441650390625, -0.0605926513671875, -0.05297088623046875, -0.04534912109375, -0.03772735595703125, -0.0301055908203125, -0.02248382568359375, -0.014862060546875, -0.00724029541015625, 0.0003814697265625, 0.00800323486328125, 0.015625, 0.02324676513671875, 0.0308685302734375, 0.03849029541015625, 0.046112060546875, 0.05373382568359375, 0.0613555908203125, 0.06897735595703125, 0.07659912109375, 0.08422088623046875, 0.0918426513671875, 0.09946441650390625, 0.107086181640625, 0.11470794677734375, 0.1223297119140625, 0.12995147705078125, 0.1375732421875, 0.14519500732421875, 0.1528167724609375, 0.16043853759765625, 0.168060302734375, 0.17568206787109375, 0.1833038330078125, 0.19092559814453125, 0.19854736328125, 0.20616912841796875, 0.2137908935546875, 0.22141265869140625, 0.229034423828125, 0.23665618896484375, 0.2442779541015625, 0.25189971923828125, 0.259521484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 15.0, 16.0, 27.0, 23.0, 40.0, 89.0, 91.0, 138.0, 151.0, 134.0, 84.0, 65.0, 37.0, 26.0, 12.0, 14.0, 4.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012540817260742188, -0.00011981092393398285, -0.00011421367526054382, -0.0001086164265871048, -0.00010301917791366577, -9.742192924022675e-05, -9.182468056678772e-05, -8.62274318933487e-05, -8.063018321990967e-05, -7.503293454647064e-05, -6.943568587303162e-05, -6.383843719959259e-05, -5.8241188526153564e-05, -5.264393985271454e-05, -4.704669117927551e-05, -4.144944250583649e-05, -3.585219383239746e-05, -3.0254945158958435e-05, -2.465769648551941e-05, -1.9060447812080383e-05, -1.3463199138641357e-05, -7.865950465202332e-06, -2.2687017917633057e-06, 3.3285468816757202e-06, 8.925795555114746e-06, 1.4523044228553772e-05, 2.0120292901992798e-05, 2.5717541575431824e-05, 3.131479024887085e-05, 3.6912038922309875e-05, 4.25092875957489e-05, 4.810653626918793e-05, 5.370378494262695e-05, 5.930103361606598e-05, 6.4898282289505e-05, 7.049553096294403e-05, 7.609277963638306e-05, 8.169002830982208e-05, 8.728727698326111e-05, 9.288452565670013e-05, 9.848177433013916e-05, 0.00010407902300357819, 0.00010967627167701721, 0.00011527352035045624, 0.00012087076902389526, 0.0001264680176973343, 0.00013206526637077332, 0.00013766251504421234, 0.00014325976371765137, 0.0001488570123910904, 0.00015445426106452942, 0.00016005150973796844, 0.00016564875841140747, 0.0001712460070848465, 0.00017684325575828552, 0.00018244050443172455, 0.00018803775310516357, 0.0001936350017786026, 0.00019923225045204163, 0.00020482949912548065, 0.00021042674779891968, 0.0002160239964723587, 0.00022162124514579773, 0.00022721849381923676, 0.00023281574249267578]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 8.0, 9.0, 8.0, 14.0, 13.0, 16.0, 23.0, 38.0, 65.0, 138.0, 699.0, 11394.0, 912918.0, 120210.0, 2470.0, 282.0, 97.0, 35.0, 35.0, 21.0, 16.0, 9.0, 9.0, 9.0, 5.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76123046875, -0.7338027954101562, -0.7063751220703125, -0.6789474487304688, -0.651519775390625, -0.6240921020507812, -0.5966644287109375, -0.5692367553710938, -0.54180908203125, -0.5143814086914062, -0.4869537353515625, -0.45952606201171875, -0.432098388671875, -0.40467071533203125, -0.3772430419921875, -0.34981536865234375, -0.3223876953125, -0.29496002197265625, -0.2675323486328125, -0.24010467529296875, -0.212677001953125, -0.18524932861328125, -0.1578216552734375, -0.13039398193359375, -0.10296630859375, -0.07553863525390625, -0.0481109619140625, -0.02068328857421875, 0.006744384765625, 0.03417205810546875, 0.0615997314453125, 0.08902740478515625, 0.116455078125, 0.14388275146484375, 0.1713104248046875, 0.19873809814453125, 0.226165771484375, 0.25359344482421875, 0.2810211181640625, 0.30844879150390625, 0.33587646484375, 0.36330413818359375, 0.3907318115234375, 0.41815948486328125, 0.445587158203125, 0.47301483154296875, 0.5004425048828125, 0.5278701782226562, 0.5552978515625, 0.5827255249023438, 0.6101531982421875, 0.6375808715820312, 0.665008544921875, 0.6924362182617188, 0.7198638916015625, 0.7472915649414062, 0.77471923828125, 0.8021469116210938, 0.8295745849609375, 0.8570022583007812, 0.884429931640625, 0.9118576049804688, 0.9392852783203125, 0.9667129516601562, 0.994140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 7.0, 8.0, 4.0, 11.0, 13.0, 18.0, 33.0, 43.0, 55.0, 69.0, 98.0, 87.0, 114.0, 104.0, 71.0, 70.0, 43.0, 34.0, 33.0, 24.0, 10.0, 14.0, 6.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.077880859375, -0.07568073272705078, -0.07348060607910156, -0.07128047943115234, -0.06908035278320312, -0.0668802261352539, -0.06468009948730469, -0.06247997283935547, -0.06027984619140625, -0.05807971954345703, -0.05587959289550781, -0.053679466247558594, -0.051479339599609375, -0.049279212951660156, -0.04707908630371094, -0.04487895965576172, -0.0426788330078125, -0.04047870635986328, -0.03827857971191406, -0.036078453063964844, -0.033878326416015625, -0.031678199768066406, -0.029478073120117188, -0.02727794647216797, -0.02507781982421875, -0.02287769317626953, -0.020677566528320312, -0.018477439880371094, -0.016277313232421875, -0.014077186584472656, -0.011877059936523438, -0.009676933288574219, -0.007476806640625, -0.005276679992675781, -0.0030765533447265625, -0.0008764266967773438, 0.001323699951171875, 0.0035238265991210938, 0.0057239532470703125, 0.007924079895019531, 0.01012420654296875, 0.012324333190917969, 0.014524459838867188, 0.016724586486816406, 0.018924713134765625, 0.021124839782714844, 0.023324966430664062, 0.02552509307861328, 0.0277252197265625, 0.02992534637451172, 0.03212547302246094, 0.034325599670410156, 0.036525726318359375, 0.038725852966308594, 0.04092597961425781, 0.04312610626220703, 0.04532623291015625, 0.04752635955810547, 0.04972648620605469, 0.051926612854003906, 0.054126739501953125, 0.056326866149902344, 0.05852699279785156, 0.06072711944580078, 0.06292724609375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 13.0, 18.0, 57.0, 123.0, 211.0, 251.0, 158.0, 101.0, 39.0, 17.0, 11.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4172747135162354, -3.336487293243408, -3.25570011138916, -3.174912691116333, -3.094125270843506, -3.013338088989258, -2.9325506687164307, -2.8517632484436035, -2.7709760665893555, -2.6901886463165283, -2.6094014644622803, -2.528614044189453, -2.447826623916626, -2.367039203643799, -2.286252021789551, -2.2054646015167236, -2.1246771812438965, -2.0438897609710693, -1.9631024599075317, -1.8823151588439941, -1.801527738571167, -1.7207404375076294, -1.6399531364440918, -1.5591657161712646, -1.478378415107727, -1.3975911140441895, -1.3168036937713623, -1.2360163927078247, -1.155229091644287, -1.07444167137146, -0.9936543703079224, -0.91286700963974, -0.8320795297622681, -0.7512921690940857, -0.6705048084259033, -0.5897175073623657, -0.5089301466941833, -0.428142786026001, -0.347355455160141, -0.266568124294281, -0.18578076362609863, -0.10499341785907745, -0.024206072092056274, 0.056581273674964905, 0.13736861944198608, 0.21815598011016846, 0.29894331097602844, 0.3797306418418884, 0.4605180025100708, 0.5413053631782532, 0.6220927238464355, 0.7028800249099731, 0.7836673855781555, 0.8644547462463379, 0.9452420473098755, 1.026029348373413, 1.1068167686462402, 1.1876040697097778, 1.268391489982605, 1.3491787910461426, 1.4299662113189697, 1.5107535123825073, 1.591540813446045, 1.672328233718872, 1.7531155347824097]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 13.0, 9.0, 15.0, 27.0, 20.0, 22.0, 35.0, 32.0, 33.0, 36.0, 62.0, 51.0, 46.0, 73.0, 61.0, 52.0, 65.0, 54.0, 46.0, 40.0, 39.0, 32.0, 29.0, 20.0, 21.0, 14.0, 15.0, 14.0, 4.0, 4.0, 4.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8841239809989929, -0.8583108186721802, -0.8324977159500122, -0.8066845536231995, -0.7808713912963867, -0.7550582885742188, -0.729245126247406, -0.7034319639205933, -0.6776188611984253, -0.6518056988716125, -0.6259925961494446, -0.6001794338226318, -0.5743663311004639, -0.5485531687736511, -0.5227400064468384, -0.496926873922348, -0.47111374139785767, -0.4453006088733673, -0.41948747634887695, -0.3936743140220642, -0.36786118149757385, -0.3420480489730835, -0.31623488664627075, -0.2904217541217804, -0.26460862159729004, -0.23879548907279968, -0.21298234164714813, -0.18716919422149658, -0.16135606169700623, -0.13554292917251587, -0.10972978174686432, -0.08391663432121277, -0.05810344219207764, -0.03229030221700668, -0.00647716224193573, 0.019335977733135223, 0.04514911770820618, 0.07096225023269653, 0.09677539765834808, 0.12258854508399963, 0.14840167760849, 0.17421481013298035, 0.2000279575586319, 0.22584110498428345, 0.2516542375087738, 0.27746737003326416, 0.3032805323600769, 0.32909366488456726, 0.3549067974090576, 0.380719929933548, 0.40653306245803833, 0.4323462247848511, 0.45815935730934143, 0.4839724898338318, 0.5097856521606445, 0.5355987548828125, 0.5614119172096252, 0.587225079536438, 0.613038182258606, 0.6388513445854187, 0.6646645069122314, 0.6904776096343994, 0.7162907719612122, 0.7421039342880249, 0.7679170370101929]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 6.0, 4.0, 10.0, 10.0, 27.0, 35.0, 91.0, 99.0, 219.0, 454.0, 896.0, 2040.0, 5108.0, 14338.0, 50881.0, 288700.0, 556032.0, 93597.0, 22876.0, 7608.0, 2970.0, 1268.0, 575.0, 320.0, 159.0, 87.0, 61.0, 23.0, 17.0, 9.0, 10.0, 10.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.9892578125, -0.9619293212890625, -0.934600830078125, -0.9072723388671875, -0.87994384765625, -0.8526153564453125, -0.825286865234375, -0.7979583740234375, -0.7706298828125, -0.7433013916015625, -0.715972900390625, -0.6886444091796875, -0.66131591796875, -0.6339874267578125, -0.606658935546875, -0.5793304443359375, -0.552001953125, -0.5246734619140625, -0.497344970703125, -0.4700164794921875, -0.44268798828125, -0.4153594970703125, -0.388031005859375, -0.3607025146484375, -0.3333740234375, -0.3060455322265625, -0.278717041015625, -0.2513885498046875, -0.22406005859375, -0.1967315673828125, -0.169403076171875, -0.1420745849609375, -0.11474609375, -0.0874176025390625, -0.060089111328125, -0.0327606201171875, -0.00543212890625, 0.0218963623046875, 0.049224853515625, 0.0765533447265625, 0.1038818359375, 0.1312103271484375, 0.158538818359375, 0.1858673095703125, 0.21319580078125, 0.2405242919921875, 0.267852783203125, 0.2951812744140625, 0.322509765625, 0.3498382568359375, 0.377166748046875, 0.4044952392578125, 0.43182373046875, 0.4591522216796875, 0.486480712890625, 0.5138092041015625, 0.5411376953125, 0.5684661865234375, 0.595794677734375, 0.6231231689453125, 0.65045166015625, 0.6777801513671875, 0.705108642578125, 0.7324371337890625, 0.759765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 3.0, 4.0, 3.0, 4.0, 10.0, 8.0, 10.0, 17.0, 13.0, 11.0, 17.0, 31.0, 26.0, 25.0, 34.0, 52.0, 41.0, 50.0, 41.0, 39.0, 57.0, 49.0, 48.0, 38.0, 55.0, 44.0, 44.0, 33.0, 32.0, 34.0, 23.0, 29.0, 14.0, 17.0, 12.0, 7.0, 14.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4365234375, -1.385406494140625, -1.33428955078125, -1.283172607421875, -1.2320556640625, -1.180938720703125, -1.12982177734375, -1.078704833984375, -1.027587890625, -0.976470947265625, -0.92535400390625, -0.874237060546875, -0.8231201171875, -0.772003173828125, -0.72088623046875, -0.669769287109375, -0.61865234375, -0.567535400390625, -0.51641845703125, -0.465301513671875, -0.4141845703125, -0.363067626953125, -0.31195068359375, -0.260833740234375, -0.209716796875, -0.158599853515625, -0.10748291015625, -0.056365966796875, -0.0052490234375, 0.045867919921875, 0.09698486328125, 0.148101806640625, 0.19921875, 0.250335693359375, 0.30145263671875, 0.352569580078125, 0.4036865234375, 0.454803466796875, 0.50592041015625, 0.557037353515625, 0.608154296875, 0.659271240234375, 0.71038818359375, 0.761505126953125, 0.8126220703125, 0.863739013671875, 0.91485595703125, 0.965972900390625, 1.01708984375, 1.068206787109375, 1.11932373046875, 1.170440673828125, 1.2215576171875, 1.272674560546875, 1.32379150390625, 1.374908447265625, 1.426025390625, 1.477142333984375, 1.52825927734375, 1.579376220703125, 1.6304931640625, 1.681610107421875, 1.73272705078125, 1.783843994140625, 1.8349609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 10.0, 5.0, 9.0, 9.0, 9.0, 21.0, 38.0, 39.0, 63.0, 49.0, 72.0, 99.0, 312.0, 1033848.0, 13426.0, 159.0, 92.0, 63.0, 56.0, 36.0, 44.0, 28.0, 25.0, 18.0, 11.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.953125, -9.65869140625, -9.3642578125, -9.06982421875, -8.775390625, -8.48095703125, -8.1865234375, -7.89208984375, -7.59765625, -7.30322265625, -7.0087890625, -6.71435546875, -6.419921875, -6.12548828125, -5.8310546875, -5.53662109375, -5.2421875, -4.94775390625, -4.6533203125, -4.35888671875, -4.064453125, -3.77001953125, -3.4755859375, -3.18115234375, -2.88671875, -2.59228515625, -2.2978515625, -2.00341796875, -1.708984375, -1.41455078125, -1.1201171875, -0.82568359375, -0.53125, -0.23681640625, 0.0576171875, 0.35205078125, 0.646484375, 0.94091796875, 1.2353515625, 1.52978515625, 1.82421875, 2.11865234375, 2.4130859375, 2.70751953125, 3.001953125, 3.29638671875, 3.5908203125, 3.88525390625, 4.1796875, 4.47412109375, 4.7685546875, 5.06298828125, 5.357421875, 5.65185546875, 5.9462890625, 6.24072265625, 6.53515625, 6.82958984375, 7.1240234375, 7.41845703125, 7.712890625, 8.00732421875, 8.3017578125, 8.59619140625, 8.890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 6.0, 7.0, 11.0, 9.0, 10.0, 18.0, 39.0, 33.0, 57.0, 43.0, 54.0, 78.0, 54.0, 76.0, 74.0, 78.0, 63.0, 70.0, 47.0, 40.0, 42.0, 26.0, 22.0, 20.0, 13.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.966796875, -2.8792724609375, -2.791748046875, -2.7042236328125, -2.61669921875, -2.5291748046875, -2.441650390625, -2.3541259765625, -2.2666015625, -2.1790771484375, -2.091552734375, -2.0040283203125, -1.91650390625, -1.8289794921875, -1.741455078125, -1.6539306640625, -1.56640625, -1.4788818359375, -1.391357421875, -1.3038330078125, -1.21630859375, -1.1287841796875, -1.041259765625, -0.9537353515625, -0.8662109375, -0.7786865234375, -0.691162109375, -0.6036376953125, -0.51611328125, -0.4285888671875, -0.341064453125, -0.2535400390625, -0.166015625, -0.0784912109375, 0.009033203125, 0.0965576171875, 0.18408203125, 0.2716064453125, 0.359130859375, 0.4466552734375, 0.5341796875, 0.6217041015625, 0.709228515625, 0.7967529296875, 0.88427734375, 0.9718017578125, 1.059326171875, 1.1468505859375, 1.234375, 1.3218994140625, 1.409423828125, 1.4969482421875, 1.58447265625, 1.6719970703125, 1.759521484375, 1.8470458984375, 1.9345703125, 2.0220947265625, 2.109619140625, 2.1971435546875, 2.28466796875, 2.3721923828125, 2.459716796875, 2.5472412109375, 2.634765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 10.0, 5.0, 9.0, 4.0, 23.0, 34.0, 52.0, 76.0, 129.0, 288.0, 619.0, 1927.0, 8768.0, 67923.0, 837186.0, 114991.0, 12507.0, 2520.0, 721.0, 325.0, 155.0, 104.0, 53.0, 42.0, 20.0, 9.0, 12.0, 10.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5146484375, -0.4993324279785156, -0.48401641845703125, -0.4687004089355469, -0.4533843994140625, -0.4380683898925781, -0.42275238037109375, -0.4074363708496094, -0.392120361328125, -0.3768043518066406, -0.36148834228515625, -0.3461723327636719, -0.3308563232421875, -0.3155403137207031, -0.30022430419921875, -0.2849082946777344, -0.26959228515625, -0.2542762756347656, -0.23896026611328125, -0.22364425659179688, -0.2083282470703125, -0.19301223754882812, -0.17769622802734375, -0.16238021850585938, -0.147064208984375, -0.13174819946289062, -0.11643218994140625, -0.10111618041992188, -0.0858001708984375, -0.07048416137695312, -0.05516815185546875, -0.039852142333984375, -0.0245361328125, -0.009220123291015625, 0.00609588623046875, 0.021411895751953125, 0.0367279052734375, 0.052043914794921875, 0.06735992431640625, 0.08267593383789062, 0.097991943359375, 0.11330795288085938, 0.12862396240234375, 0.14393997192382812, 0.1592559814453125, 0.17457199096679688, 0.18988800048828125, 0.20520401000976562, 0.22052001953125, 0.23583602905273438, 0.25115203857421875, 0.2664680480957031, 0.2817840576171875, 0.2971000671386719, 0.31241607666015625, 0.3277320861816406, 0.343048095703125, 0.3583641052246094, 0.37368011474609375, 0.3889961242675781, 0.4043121337890625, 0.4196281433105469, 0.43494415283203125, 0.4502601623535156, 0.465576171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 8.0, 5.0, 10.0, 7.0, 5.0, 16.0, 16.0, 22.0, 49.0, 60.0, 100.0, 173.0, 180.0, 125.0, 63.0, 46.0, 34.0, 20.0, 16.0, 5.0, 8.0, 12.0, 5.0, 6.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.942583084106445e-05, -5.7637691497802734e-05, -5.5849552154541016e-05, -5.40614128112793e-05, -5.227327346801758e-05, -5.048513412475586e-05, -4.869699478149414e-05, -4.690885543823242e-05, -4.51207160949707e-05, -4.3332576751708984e-05, -4.1544437408447266e-05, -3.975629806518555e-05, -3.796815872192383e-05, -3.618001937866211e-05, -3.439188003540039e-05, -3.260374069213867e-05, -3.081560134887695e-05, -2.9027462005615234e-05, -2.7239322662353516e-05, -2.5451183319091797e-05, -2.3663043975830078e-05, -2.187490463256836e-05, -2.008676528930664e-05, -1.8298625946044922e-05, -1.6510486602783203e-05, -1.4722347259521484e-05, -1.2934207916259766e-05, -1.1146068572998047e-05, -9.357929229736328e-06, -7.569789886474609e-06, -5.781650543212891e-06, -3.993511199951172e-06, -2.205371856689453e-06, -4.172325134277344e-07, 1.3709068298339844e-06, 3.159046173095703e-06, 4.947185516357422e-06, 6.735324859619141e-06, 8.52346420288086e-06, 1.0311603546142578e-05, 1.2099742889404297e-05, 1.3887882232666016e-05, 1.5676021575927734e-05, 1.7464160919189453e-05, 1.9252300262451172e-05, 2.104043960571289e-05, 2.282857894897461e-05, 2.4616718292236328e-05, 2.6404857635498047e-05, 2.8192996978759766e-05, 2.9981136322021484e-05, 3.17692756652832e-05, 3.355741500854492e-05, 3.534555435180664e-05, 3.713369369506836e-05, 3.892183303833008e-05, 4.07099723815918e-05, 4.2498111724853516e-05, 4.4286251068115234e-05, 4.607439041137695e-05, 4.786252975463867e-05, 4.965066909790039e-05, 5.143880844116211e-05, 5.322694778442383e-05, 5.501508712768555e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 7.0, 11.0, 19.0, 47.0, 84.0, 347.0, 2704.0, 105909.0, 927216.0, 11127.0, 792.0, 160.0, 52.0, 25.0, 20.0, 10.0, 4.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0166015625, -0.9850616455078125, -0.953521728515625, -0.9219818115234375, -0.89044189453125, -0.8589019775390625, -0.827362060546875, -0.7958221435546875, -0.7642822265625, -0.7327423095703125, -0.701202392578125, -0.6696624755859375, -0.63812255859375, -0.6065826416015625, -0.575042724609375, -0.5435028076171875, -0.511962890625, -0.4804229736328125, -0.448883056640625, -0.4173431396484375, -0.38580322265625, -0.3542633056640625, -0.322723388671875, -0.2911834716796875, -0.2596435546875, -0.2281036376953125, -0.196563720703125, -0.1650238037109375, -0.13348388671875, -0.1019439697265625, -0.070404052734375, -0.0388641357421875, -0.00732421875, 0.0242156982421875, 0.055755615234375, 0.0872955322265625, 0.11883544921875, 0.1503753662109375, 0.181915283203125, 0.2134552001953125, 0.2449951171875, 0.2765350341796875, 0.308074951171875, 0.3396148681640625, 0.37115478515625, 0.4026947021484375, 0.434234619140625, 0.4657745361328125, 0.497314453125, 0.5288543701171875, 0.560394287109375, 0.5919342041015625, 0.62347412109375, 0.6550140380859375, 0.686553955078125, 0.7180938720703125, 0.7496337890625, 0.7811737060546875, 0.812713623046875, 0.8442535400390625, 0.87579345703125, 0.9073333740234375, 0.938873291015625, 0.9704132080078125, 1.001953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 3.0, 10.0, 11.0, 9.0, 11.0, 19.0, 19.0, 32.0, 33.0, 28.0, 53.0, 61.0, 93.0, 185.0, 96.0, 67.0, 44.0, 41.0, 45.0, 34.0, 24.0, 5.0, 14.0, 15.0, 9.0, 9.0, 7.0, 5.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0943603515625, -0.09106159210205078, -0.08776283264160156, -0.08446407318115234, -0.08116531372070312, -0.0778665542602539, -0.07456779479980469, -0.07126903533935547, -0.06797027587890625, -0.06467151641845703, -0.06137275695800781, -0.058073997497558594, -0.054775238037109375, -0.051476478576660156, -0.04817771911621094, -0.04487895965576172, -0.0415802001953125, -0.03828144073486328, -0.03498268127441406, -0.031683921813964844, -0.028385162353515625, -0.025086402893066406, -0.021787643432617188, -0.01848888397216797, -0.01519012451171875, -0.011891365051269531, -0.008592605590820312, -0.005293846130371094, -0.001995086669921875, 0.0013036727905273438, 0.0046024322509765625, 0.007901191711425781, 0.011199951171875, 0.014498710632324219, 0.017797470092773438, 0.021096229553222656, 0.024394989013671875, 0.027693748474121094, 0.030992507934570312, 0.03429126739501953, 0.03759002685546875, 0.04088878631591797, 0.04418754577636719, 0.047486305236816406, 0.050785064697265625, 0.054083824157714844, 0.05738258361816406, 0.06068134307861328, 0.0639801025390625, 0.06727886199951172, 0.07057762145996094, 0.07387638092041016, 0.07717514038085938, 0.0804738998413086, 0.08377265930175781, 0.08707141876220703, 0.09037017822265625, 0.09366893768310547, 0.09696769714355469, 0.1002664566040039, 0.10356521606445312, 0.10686397552490234, 0.11016273498535156, 0.11346149444580078, 0.11676025390625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 7.0, 21.0, 50.0, 114.0, 170.0, 209.0, 202.0, 113.0, 59.0, 25.0, 23.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4421045780181885, -2.303454875946045, -2.1648051738739014, -2.026155471801758, -1.8875057697296143, -1.7488560676574707, -1.6102063655853271, -1.4715566635131836, -1.33290696144104, -1.1942572593688965, -1.055607557296753, -0.9169578552246094, -0.7783081531524658, -0.6396584510803223, -0.5010087490081787, -0.36235904693603516, -0.2237093448638916, -0.08505964279174805, 0.05359005928039551, 0.19223976135253906, 0.3308894634246826, 0.46953916549682617, 0.6081888675689697, 0.7468385696411133, 0.8854882717132568, 1.0241379737854004, 1.162787675857544, 1.3014373779296875, 1.440087080001831, 1.5787367820739746, 1.7173864841461182, 1.8560361862182617, 1.9946861267089844, 2.133335828781128, 2.2719855308532715, 2.410635232925415, 2.5492849349975586, 2.687934637069702, 2.8265843391418457, 2.9652340412139893, 3.103883743286133, 3.2425334453582764, 3.38118314743042, 3.5198328495025635, 3.658482551574707, 3.7971322536468506, 3.935781955718994, 4.074431419372559, 4.213081359863281, 4.351731300354004, 4.490380764007568, 4.629030227661133, 4.7676801681518555, 4.906330108642578, 5.044979572296143, 5.183629035949707, 5.32227897644043, 5.460928916931152, 5.599578380584717, 5.738227844238281, 5.876877784729004, 6.015527725219727, 6.154177188873291, 6.2928266525268555, 6.431476593017578]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 4.0, 3.0, 8.0, 12.0, 10.0, 6.0, 8.0, 15.0, 16.0, 13.0, 16.0, 22.0, 33.0, 24.0, 31.0, 29.0, 35.0, 39.0, 34.0, 27.0, 43.0, 45.0, 44.0, 55.0, 39.0, 39.0, 30.0, 44.0, 27.0, 32.0, 30.0, 34.0, 24.0, 17.0, 18.0, 22.0, 19.0, 9.0, 8.0, 8.0, 7.0, 6.0, 1.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 4.0, 2.0], "bins": [-2.5910654067993164, -2.520235776901245, -2.449406147003174, -2.3785765171051025, -2.3077468872070312, -2.23691725730896, -2.1660876274108887, -2.0952582359313965, -2.024428367614746, -1.9535987377166748, -1.8827691078186035, -1.8119394779205322, -1.741109848022461, -1.6702802181243896, -1.599450707435608, -1.5286210775375366, -1.4577915668487549, -1.3869619369506836, -1.3161323070526123, -1.245302677154541, -1.1744730472564697, -1.1036434173583984, -1.0328139066696167, -0.9619842767715454, -0.8911546468734741, -0.8203250169754028, -0.7494953870773315, -0.678665816783905, -0.6078361868858337, -0.5370065569877625, -0.46617695689201355, -0.39534735679626465, -0.3245178461074829, -0.2536882162094116, -0.18285861611366272, -0.11202900111675262, -0.04119938611984253, 0.02963024377822876, 0.10045984387397766, 0.17128944396972656, 0.24211907386779785, 0.31294870376586914, 0.38377830386161804, 0.45460790395736694, 0.5254375338554382, 0.5962671637535095, 0.667096734046936, 0.7379263639450073, 0.8087559938430786, 0.8795856237411499, 0.9504152536392212, 1.0212448835372925, 1.0920743942260742, 1.1629040241241455, 1.2337336540222168, 1.304563283920288, 1.3753929138183594, 1.4462225437164307, 1.517052173614502, 1.5878818035125732, 1.6587114334106445, 1.7295410633087158, 1.8003705739974976, 1.8712002038955688, 1.9420298337936401]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 4.0, 8.0, 17.0, 20.0, 33.0, 39.0, 72.0, 113.0, 226.0, 473.0, 1266.0, 4059.0, 22332.0, 326808.0, 3594012.0, 219959.0, 19065.0, 3784.0, 1108.0, 433.0, 187.0, 83.0, 68.0, 33.0, 22.0, 13.0, 10.0, 7.0, 6.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.767578125, -2.6991424560546875, -2.630706787109375, -2.5622711181640625, -2.49383544921875, -2.4253997802734375, -2.356964111328125, -2.2885284423828125, -2.2200927734375, -2.1516571044921875, -2.083221435546875, -2.0147857666015625, -1.94635009765625, -1.8779144287109375, -1.809478759765625, -1.7410430908203125, -1.672607421875, -1.6041717529296875, -1.535736083984375, -1.4673004150390625, -1.39886474609375, -1.3304290771484375, -1.261993408203125, -1.1935577392578125, -1.1251220703125, -1.0566864013671875, -0.988250732421875, -0.9198150634765625, -0.85137939453125, -0.7829437255859375, -0.714508056640625, -0.6460723876953125, -0.57763671875, -0.5092010498046875, -0.440765380859375, -0.3723297119140625, -0.30389404296875, -0.2354583740234375, -0.167022705078125, -0.0985870361328125, -0.0301513671875, 0.0382843017578125, 0.106719970703125, 0.1751556396484375, 0.24359130859375, 0.3120269775390625, 0.380462646484375, 0.4488983154296875, 0.517333984375, 0.5857696533203125, 0.654205322265625, 0.7226409912109375, 0.79107666015625, 0.8595123291015625, 0.927947998046875, 0.9963836669921875, 1.0648193359375, 1.1332550048828125, 1.201690673828125, 1.2701263427734375, 1.33856201171875, 1.4069976806640625, 1.475433349609375, 1.5438690185546875, 1.6123046875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 6.0, 9.0, 10.0, 14.0, 13.0, 22.0, 18.0, 39.0, 34.0, 42.0, 63.0, 54.0, 57.0, 57.0, 66.0, 69.0, 85.0, 64.0, 52.0, 50.0, 46.0, 33.0, 31.0, 19.0, 6.0, 14.0, 10.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.125, -1.0933151245117188, -1.0616302490234375, -1.0299453735351562, -0.998260498046875, -0.9665756225585938, -0.9348907470703125, -0.9032058715820312, -0.87152099609375, -0.8398361206054688, -0.8081512451171875, -0.7764663696289062, -0.744781494140625, -0.7130966186523438, -0.6814117431640625, -0.6497268676757812, -0.6180419921875, -0.5863571166992188, -0.5546722412109375, -0.5229873657226562, -0.491302490234375, -0.45961761474609375, -0.4279327392578125, -0.39624786376953125, -0.36456298828125, -0.33287811279296875, -0.3011932373046875, -0.26950836181640625, -0.237823486328125, -0.20613861083984375, -0.1744537353515625, -0.14276885986328125, -0.111083984375, -0.07939910888671875, -0.0477142333984375, -0.01602935791015625, 0.015655517578125, 0.04734039306640625, 0.0790252685546875, 0.11071014404296875, 0.14239501953125, 0.17407989501953125, 0.2057647705078125, 0.23744964599609375, 0.269134521484375, 0.30081939697265625, 0.3325042724609375, 0.36418914794921875, 0.3958740234375, 0.42755889892578125, 0.4592437744140625, 0.49092864990234375, 0.522613525390625, 0.5542984008789062, 0.5859832763671875, 0.6176681518554688, 0.64935302734375, 0.6810379028320312, 0.7127227783203125, 0.7444076538085938, 0.776092529296875, 0.8077774047851562, 0.8394622802734375, 0.8711471557617188, 0.90283203125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 13.0, 20.0, 49.0, 89.0, 544.0, 16393.0, 4168684.0, 7928.0, 385.0, 105.0, 33.0, 12.0, 11.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.655517578125, -8.43603515625, -8.216552734375, -7.9970703125, -7.777587890625, -7.55810546875, -7.338623046875, -7.119140625, -6.899658203125, -6.68017578125, -6.460693359375, -6.2412109375, -6.021728515625, -5.80224609375, -5.582763671875, -5.36328125, -5.143798828125, -4.92431640625, -4.704833984375, -4.4853515625, -4.265869140625, -4.04638671875, -3.826904296875, -3.607421875, -3.387939453125, -3.16845703125, -2.948974609375, -2.7294921875, -2.510009765625, -2.29052734375, -2.071044921875, -1.8515625, -1.632080078125, -1.41259765625, -1.193115234375, -0.9736328125, -0.754150390625, -0.53466796875, -0.315185546875, -0.095703125, 0.123779296875, 0.34326171875, 0.562744140625, 0.7822265625, 1.001708984375, 1.22119140625, 1.440673828125, 1.66015625, 1.879638671875, 2.09912109375, 2.318603515625, 2.5380859375, 2.757568359375, 2.97705078125, 3.196533203125, 3.416015625, 3.635498046875, 3.85498046875, 4.074462890625, 4.2939453125, 4.513427734375, 4.73291015625, 4.952392578125, 5.171875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 11.0, 11.0, 10.0, 15.0, 18.0, 21.0, 45.0, 41.0, 52.0, 93.0, 115.0, 152.0, 231.0, 308.0, 492.0, 711.0, 534.0, 371.0, 255.0, 125.0, 109.0, 73.0, 61.0, 55.0, 42.0, 29.0, 16.0, 16.0, 15.0, 9.0, 8.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2493896484375, -0.2403697967529297, -0.23134994506835938, -0.22233009338378906, -0.21331024169921875, -0.20429039001464844, -0.19527053833007812, -0.1862506866455078, -0.1772308349609375, -0.1682109832763672, -0.15919113159179688, -0.15017127990722656, -0.14115142822265625, -0.13213157653808594, -0.12311172485351562, -0.11409187316894531, -0.105072021484375, -0.09605216979980469, -0.08703231811523438, -0.07801246643066406, -0.06899261474609375, -0.05997276306152344, -0.050952911376953125, -0.04193305969238281, -0.0329132080078125, -0.023893356323242188, -0.014873504638671875, -0.0058536529541015625, 0.00316619873046875, 0.012186050415039062, 0.021205902099609375, 0.030225753784179688, 0.03924560546875, 0.04826545715332031, 0.057285308837890625, 0.06630516052246094, 0.07532501220703125, 0.08434486389160156, 0.09336471557617188, 0.10238456726074219, 0.1114044189453125, 0.12042427062988281, 0.12944412231445312, 0.13846397399902344, 0.14748382568359375, 0.15650367736816406, 0.16552352905273438, 0.1745433807373047, 0.183563232421875, 0.1925830841064453, 0.20160293579101562, 0.21062278747558594, 0.21964263916015625, 0.22866249084472656, 0.23768234252929688, 0.2467021942138672, 0.2557220458984375, 0.2647418975830078, 0.2737617492675781, 0.28278160095214844, 0.29180145263671875, 0.30082130432128906, 0.3098411560058594, 0.3188610076904297, 0.327880859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 5.0, 13.0, 21.0, 29.0, 32.0, 61.0, 73.0, 105.0, 125.0, 111.0, 105.0, 93.0, 65.0, 40.0, 33.0, 23.0, 17.0, 11.0, 7.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.1261439323425293, -2.073329210281372, -2.020514726638794, -1.9677000045776367, -1.914885401725769, -1.8620707988739014, -1.8092561960220337, -1.756441593170166, -1.7036268711090088, -1.6508122682571411, -1.5979976654052734, -1.5451829433441162, -1.4923683404922485, -1.4395537376403809, -1.3867391347885132, -1.3339245319366455, -1.2811099290847778, -1.2282953262329102, -1.1754807233810425, -1.1226661205291748, -1.0698513984680176, -1.01703679561615, -0.9642221927642822, -0.9114075899124146, -0.8585929274559021, -0.8057783246040344, -0.752963662147522, -0.7001490592956543, -0.6473344564437866, -0.5945197939872742, -0.5417051911354065, -0.48889055848121643, -0.4360760450363159, -0.38326141238212585, -0.3304467797279358, -0.2776321768760681, -0.22481754422187805, -0.172002911567688, -0.11918830871582031, -0.06637367606163025, -0.013559043407440186, 0.03925558179616928, 0.09207020699977875, 0.14488482475280762, 0.19769945740699768, 0.25051409006118774, 0.3033286929130554, 0.3561433255672455, 0.40895795822143555, 0.4617725908756256, 0.5145872235298157, 0.5674018263816833, 0.6202164888381958, 0.6730310916900635, 0.7258456945419312, 0.7786602973937988, 0.8314749598503113, 0.884289562702179, 0.9371042251586914, 0.9899188280105591, 1.0427334308624268, 1.095548152923584, 1.148362636566162, 1.2011773586273193, 1.253991961479187]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 2.0, 4.0, 6.0, 12.0, 6.0, 12.0, 9.0, 12.0, 10.0, 20.0, 22.0, 19.0, 27.0, 38.0, 27.0, 40.0, 44.0, 51.0, 44.0, 50.0, 40.0, 50.0, 47.0, 38.0, 41.0, 48.0, 47.0, 34.0, 40.0, 22.0, 33.0, 23.0, 16.0, 21.0, 9.0, 9.0, 6.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8382196426391602, -0.8120490312576294, -0.7858783602714539, -0.7597077488899231, -0.7335370779037476, -0.7073664665222168, -0.681195855140686, -0.6550252437591553, -0.6288545727729797, -0.602683961391449, -0.5765132904052734, -0.5503426790237427, -0.5241720676422119, -0.4980013966560364, -0.4718307852745056, -0.44566014409065247, -0.4194895029067993, -0.39331886172294617, -0.367148220539093, -0.34097760915756226, -0.3148069679737091, -0.28863632678985596, -0.2624657154083252, -0.23629507422447205, -0.2101244330406189, -0.18395379185676575, -0.1577831655740738, -0.13161253929138184, -0.10544189810752869, -0.07927125692367554, -0.05310063064098358, -0.026930004358291626, -0.0007593035697937012, 0.02541133016347885, 0.051581963896751404, 0.07775259763002396, 0.10392323136329651, 0.13009387254714966, 0.1562644988298416, 0.18243512511253357, 0.20860576629638672, 0.23477640748023987, 0.260947048664093, 0.2871176600456238, 0.31328830122947693, 0.3394589424133301, 0.36562955379486084, 0.391800194978714, 0.41797083616256714, 0.4441414773464203, 0.47031211853027344, 0.4964827299118042, 0.522653341293335, 0.5488240122795105, 0.5749946236610413, 0.6011652946472168, 0.6273359060287476, 0.6535065174102783, 0.6796771883964539, 0.7058477997779846, 0.7320184707641602, 0.7581890821456909, 0.7843596935272217, 0.8105303049087524, 0.836700975894928]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 10.0, 7.0, 9.0, 16.0, 31.0, 44.0, 78.0, 191.0, 358.0, 909.0, 2350.0, 6703.0, 22151.0, 96274.0, 438663.0, 374908.0, 77913.0, 18651.0, 5685.0, 1995.0, 816.0, 371.0, 194.0, 105.0, 42.0, 26.0, 19.0, 8.0, 5.0, 6.0, 2.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.65625, -0.6398162841796875, -0.623382568359375, -0.6069488525390625, -0.59051513671875, -0.5740814208984375, -0.557647705078125, -0.5412139892578125, -0.5247802734375, -0.5083465576171875, -0.491912841796875, -0.4754791259765625, -0.45904541015625, -0.4426116943359375, -0.426177978515625, -0.4097442626953125, -0.393310546875, -0.3768768310546875, -0.360443115234375, -0.3440093994140625, -0.32757568359375, -0.3111419677734375, -0.294708251953125, -0.2782745361328125, -0.2618408203125, -0.2454071044921875, -0.228973388671875, -0.2125396728515625, -0.19610595703125, -0.1796722412109375, -0.163238525390625, -0.1468048095703125, -0.13037109375, -0.1139373779296875, -0.097503662109375, -0.0810699462890625, -0.06463623046875, -0.0482025146484375, -0.031768798828125, -0.0153350830078125, 0.0010986328125, 0.0175323486328125, 0.033966064453125, 0.0503997802734375, 0.06683349609375, 0.0832672119140625, 0.099700927734375, 0.1161346435546875, 0.132568359375, 0.1490020751953125, 0.165435791015625, 0.1818695068359375, 0.19830322265625, 0.2147369384765625, 0.231170654296875, 0.2476043701171875, 0.2640380859375, 0.2804718017578125, 0.296905517578125, 0.3133392333984375, 0.32977294921875, 0.3462066650390625, 0.362640380859375, 0.3790740966796875, 0.3955078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 9.0, 6.0, 10.0, 9.0, 14.0, 18.0, 31.0, 44.0, 58.0, 87.0, 88.0, 87.0, 97.0, 89.0, 91.0, 72.0, 50.0, 49.0, 37.0, 19.0, 19.0, 13.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6083984375, -0.5771636962890625, -0.545928955078125, -0.5146942138671875, -0.48345947265625, -0.4522247314453125, -0.420989990234375, -0.3897552490234375, -0.3585205078125, -0.3272857666015625, -0.296051025390625, -0.2648162841796875, -0.23358154296875, -0.2023468017578125, -0.171112060546875, -0.1398773193359375, -0.108642578125, -0.0774078369140625, -0.046173095703125, -0.0149383544921875, 0.01629638671875, 0.0475311279296875, 0.078765869140625, 0.1100006103515625, 0.1412353515625, 0.1724700927734375, 0.203704833984375, 0.2349395751953125, 0.26617431640625, 0.2974090576171875, 0.328643798828125, 0.3598785400390625, 0.39111328125, 0.4223480224609375, 0.453582763671875, 0.4848175048828125, 0.51605224609375, 0.5472869873046875, 0.578521728515625, 0.6097564697265625, 0.6409912109375, 0.6722259521484375, 0.703460693359375, 0.7346954345703125, 0.76593017578125, 0.7971649169921875, 0.828399658203125, 0.8596343994140625, 0.890869140625, 0.9221038818359375, 0.953338623046875, 0.9845733642578125, 1.01580810546875, 1.0470428466796875, 1.078277587890625, 1.1095123291015625, 1.1407470703125, 1.1719818115234375, 1.203216552734375, 1.2344512939453125, 1.26568603515625, 1.2969207763671875, 1.328155517578125, 1.3593902587890625, 1.390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 7.0, 1.0, 5.0, 9.0, 10.0, 13.0, 15.0, 27.0, 30.0, 48.0, 63.0, 103.0, 142.0, 224.0, 372.0, 611.0, 1100.0, 2183.0, 4806.0, 11479.0, 33044.0, 124476.0, 444696.0, 312250.0, 75181.0, 22118.0, 8078.0, 3553.0, 1721.0, 821.0, 482.0, 291.0, 182.0, 115.0, 74.0, 65.0, 34.0, 32.0, 15.0, 21.0, 14.0, 6.0, 14.0, 8.0, 3.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.31884765625, -0.3088264465332031, -0.29880523681640625, -0.2887840270996094, -0.2787628173828125, -0.2687416076660156, -0.25872039794921875, -0.24869918823242188, -0.238677978515625, -0.22865676879882812, -0.21863555908203125, -0.20861434936523438, -0.1985931396484375, -0.18857192993164062, -0.17855072021484375, -0.16852951049804688, -0.15850830078125, -0.14848709106445312, -0.13846588134765625, -0.12844467163085938, -0.1184234619140625, -0.10840225219726562, -0.09838104248046875, -0.08835983276367188, -0.078338623046875, -0.06831741333007812, -0.05829620361328125, -0.048274993896484375, -0.0382537841796875, -0.028232574462890625, -0.01821136474609375, -0.008190155029296875, 0.0018310546875, 0.011852264404296875, 0.02187347412109375, 0.031894683837890625, 0.0419158935546875, 0.051937103271484375, 0.06195831298828125, 0.07197952270507812, 0.082000732421875, 0.09202194213867188, 0.10204315185546875, 0.11206436157226562, 0.1220855712890625, 0.13210678100585938, 0.14212799072265625, 0.15214920043945312, 0.16217041015625, 0.17219161987304688, 0.18221282958984375, 0.19223403930664062, 0.2022552490234375, 0.21227645874023438, 0.22229766845703125, 0.23231887817382812, 0.242340087890625, 0.2523612976074219, 0.26238250732421875, 0.2724037170410156, 0.2824249267578125, 0.2924461364746094, 0.30246734619140625, 0.3124885559082031, 0.322509765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 9.0, 7.0, 9.0, 13.0, 10.0, 9.0, 13.0, 14.0, 22.0, 27.0, 37.0, 21.0, 32.0, 42.0, 44.0, 41.0, 46.0, 45.0, 45.0, 36.0, 45.0, 47.0, 59.0, 40.0, 30.0, 51.0, 30.0, 26.0, 22.0, 20.0, 24.0, 12.0, 14.0, 9.0, 12.0, 7.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.9189453125, -0.8901519775390625, -0.861358642578125, -0.8325653076171875, -0.80377197265625, -0.7749786376953125, -0.746185302734375, -0.7173919677734375, -0.6885986328125, -0.6598052978515625, -0.631011962890625, -0.6022186279296875, -0.57342529296875, -0.5446319580078125, -0.515838623046875, -0.4870452880859375, -0.458251953125, -0.4294586181640625, -0.400665283203125, -0.3718719482421875, -0.34307861328125, -0.3142852783203125, -0.285491943359375, -0.2566986083984375, -0.2279052734375, -0.1991119384765625, -0.170318603515625, -0.1415252685546875, -0.11273193359375, -0.0839385986328125, -0.055145263671875, -0.0263519287109375, 0.00244140625, 0.0312347412109375, 0.060028076171875, 0.0888214111328125, 0.11761474609375, 0.1464080810546875, 0.175201416015625, 0.2039947509765625, 0.2327880859375, 0.2615814208984375, 0.290374755859375, 0.3191680908203125, 0.34796142578125, 0.3767547607421875, 0.405548095703125, 0.4343414306640625, 0.463134765625, 0.4919281005859375, 0.520721435546875, 0.5495147705078125, 0.57830810546875, 0.6071014404296875, 0.635894775390625, 0.6646881103515625, 0.6934814453125, 0.7222747802734375, 0.751068115234375, 0.7798614501953125, 0.80865478515625, 0.8374481201171875, 0.866241455078125, 0.8950347900390625, 0.923828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 13.0, 18.0, 28.0, 36.0, 54.0, 75.0, 107.0, 200.0, 323.0, 507.0, 879.0, 1565.0, 2894.0, 5775.0, 13100.0, 33716.0, 110654.0, 423219.0, 326564.0, 80924.0, 26635.0, 10584.0, 4866.0, 2475.0, 1360.0, 736.0, 456.0, 268.0, 166.0, 128.0, 82.0, 38.0, 32.0, 19.0, 16.0, 14.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.134765625, -0.130401611328125, -0.12603759765625, -0.121673583984375, -0.1173095703125, -0.112945556640625, -0.10858154296875, -0.104217529296875, -0.099853515625, -0.095489501953125, -0.09112548828125, -0.086761474609375, -0.0823974609375, -0.078033447265625, -0.07366943359375, -0.069305419921875, -0.06494140625, -0.060577392578125, -0.05621337890625, -0.051849365234375, -0.0474853515625, -0.043121337890625, -0.03875732421875, -0.034393310546875, -0.030029296875, -0.025665283203125, -0.02130126953125, -0.016937255859375, -0.0125732421875, -0.008209228515625, -0.00384521484375, 0.000518798828125, 0.0048828125, 0.009246826171875, 0.01361083984375, 0.017974853515625, 0.0223388671875, 0.026702880859375, 0.03106689453125, 0.035430908203125, 0.039794921875, 0.044158935546875, 0.04852294921875, 0.052886962890625, 0.0572509765625, 0.061614990234375, 0.06597900390625, 0.070343017578125, 0.07470703125, 0.079071044921875, 0.08343505859375, 0.087799072265625, 0.0921630859375, 0.096527099609375, 0.10089111328125, 0.105255126953125, 0.109619140625, 0.113983154296875, 0.11834716796875, 0.122711181640625, 0.1270751953125, 0.131439208984375, 0.13580322265625, 0.140167236328125, 0.14453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 5.0, 5.0, 8.0, 7.0, 15.0, 6.0, 24.0, 46.0, 52.0, 73.0, 107.0, 164.0, 142.0, 111.0, 80.0, 50.0, 23.0, 26.0, 12.0, 9.0, 9.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012922286987304688, -0.00012488290667533875, -0.00012054294347763062, -0.00011620298027992249, -0.00011186301708221436, -0.00010752305388450623, -0.0001031830906867981, -9.884312748908997e-05, -9.450316429138184e-05, -9.01632010936737e-05, -8.582323789596558e-05, -8.148327469825745e-05, -7.714331150054932e-05, -7.280334830284119e-05, -6.846338510513306e-05, -6.412342190742493e-05, -5.97834587097168e-05, -5.544349551200867e-05, -5.110353231430054e-05, -4.676356911659241e-05, -4.242360591888428e-05, -3.808364272117615e-05, -3.374367952346802e-05, -2.9403716325759888e-05, -2.5063753128051758e-05, -2.0723789930343628e-05, -1.6383826732635498e-05, -1.2043863534927368e-05, -7.703900337219238e-06, -3.3639371395111084e-06, 9.760260581970215e-07, 5.315989255905151e-06, 9.655952453613281e-06, 1.3995915651321411e-05, 1.833587884902954e-05, 2.267584204673767e-05, 2.70158052444458e-05, 3.135576844215393e-05, 3.569573163986206e-05, 4.003569483757019e-05, 4.437565803527832e-05, 4.871562123298645e-05, 5.305558443069458e-05, 5.739554762840271e-05, 6.173551082611084e-05, 6.607547402381897e-05, 7.04154372215271e-05, 7.475540041923523e-05, 7.909536361694336e-05, 8.343532681465149e-05, 8.777529001235962e-05, 9.211525321006775e-05, 9.645521640777588e-05, 0.00010079517960548401, 0.00010513514280319214, 0.00010947510600090027, 0.0001138150691986084, 0.00011815503239631653, 0.00012249499559402466, 0.0001268349587917328, 0.00013117492198944092, 0.00013551488518714905, 0.00013985484838485718, 0.0001441948115825653, 0.00014853477478027344]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 10.0, 24.0, 23.0, 49.0, 55.0, 67.0, 114.0, 210.0, 268.0, 419.0, 748.0, 1333.0, 2463.0, 4952.0, 10369.0, 24067.0, 65995.0, 208005.0, 415663.0, 204400.0, 64684.0, 23918.0, 10138.0, 4795.0, 2457.0, 1311.0, 751.0, 434.0, 280.0, 183.0, 99.0, 68.0, 62.0, 40.0, 18.0, 19.0, 12.0, 9.0, 5.0, 2.0, 5.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0], "bins": [-0.133056640625, -0.12919902801513672, -0.12534141540527344, -0.12148380279541016, -0.11762619018554688, -0.1137685775756836, -0.10991096496582031, -0.10605335235595703, -0.10219573974609375, -0.09833812713623047, -0.09448051452636719, -0.0906229019165039, -0.08676528930664062, -0.08290767669677734, -0.07905006408691406, -0.07519245147705078, -0.0713348388671875, -0.06747722625732422, -0.06361961364746094, -0.059762001037597656, -0.055904388427734375, -0.052046775817871094, -0.04818916320800781, -0.04433155059814453, -0.04047393798828125, -0.03661632537841797, -0.03275871276855469, -0.028901100158691406, -0.025043487548828125, -0.021185874938964844, -0.017328262329101562, -0.013470649719238281, -0.009613037109375, -0.005755424499511719, -0.0018978118896484375, 0.0019598007202148438, 0.005817413330078125, 0.009675025939941406, 0.013532638549804688, 0.01739025115966797, 0.02124786376953125, 0.02510547637939453, 0.028963088989257812, 0.032820701599121094, 0.036678314208984375, 0.040535926818847656, 0.04439353942871094, 0.04825115203857422, 0.0521087646484375, 0.05596637725830078, 0.05982398986816406, 0.06368160247802734, 0.06753921508789062, 0.0713968276977539, 0.07525444030761719, 0.07911205291748047, 0.08296966552734375, 0.08682727813720703, 0.09068489074707031, 0.0945425033569336, 0.09840011596679688, 0.10225772857666016, 0.10611534118652344, 0.10997295379638672, 0.11383056640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 5.0, 18.0, 19.0, 24.0, 18.0, 37.0, 54.0, 61.0, 58.0, 73.0, 84.0, 82.0, 80.0, 72.0, 68.0, 48.0, 42.0, 25.0, 24.0, 16.0, 9.0, 17.0, 15.0, 10.0, 10.0, 8.0, 1.0, 6.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036773681640625, -0.03556632995605469, -0.034358978271484375, -0.03315162658691406, -0.03194427490234375, -0.030736923217773438, -0.029529571533203125, -0.028322219848632812, -0.0271148681640625, -0.025907516479492188, -0.024700164794921875, -0.023492813110351562, -0.02228546142578125, -0.021078109741210938, -0.019870758056640625, -0.018663406372070312, -0.0174560546875, -0.016248703002929688, -0.015041351318359375, -0.013833999633789062, -0.01262664794921875, -0.011419296264648438, -0.010211944580078125, -0.009004592895507812, -0.0077972412109375, -0.0065898895263671875, -0.005382537841796875, -0.0041751861572265625, -0.00296783447265625, -0.0017604827880859375, -0.000553131103515625, 0.0006542205810546875, 0.001861572265625, 0.0030689239501953125, 0.004276275634765625, 0.0054836273193359375, 0.00669097900390625, 0.007898330688476562, 0.009105682373046875, 0.010313034057617188, 0.0115203857421875, 0.012727737426757812, 0.013935089111328125, 0.015142440795898438, 0.01634979248046875, 0.017557144165039062, 0.018764495849609375, 0.019971847534179688, 0.02117919921875, 0.022386550903320312, 0.023593902587890625, 0.024801254272460938, 0.02600860595703125, 0.027215957641601562, 0.028423309326171875, 0.029630661010742188, 0.0308380126953125, 0.03204536437988281, 0.033252716064453125, 0.03446006774902344, 0.03566741943359375, 0.03687477111816406, 0.038082122802734375, 0.03928947448730469, 0.040496826171875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 7.0, 4.0, 5.0, 18.0, 26.0, 65.0, 108.0, 161.0, 163.0, 184.0, 108.0, 70.0, 33.0, 13.0, 11.0, 7.0, 10.0, 4.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1375699043273926, -2.088608503341675, -2.039647102355957, -1.9906858205795288, -1.9417245388031006, -1.8927631378173828, -1.843801736831665, -1.7948404550552368, -1.745879054069519, -1.6969176530838013, -1.647956371307373, -1.5989949703216553, -1.550033688545227, -1.5010722875595093, -1.452111005783081, -1.4031496047973633, -1.3541882038116455, -1.3052268028259277, -1.2562655210494995, -1.2073041200637817, -1.1583428382873535, -1.1093814373016357, -1.060420036315918, -1.0114587545394897, -0.9624974727630615, -0.9135361313819885, -0.8645747900009155, -0.8156133890151978, -0.7666520476341248, -0.7176907062530518, -0.6687293648719788, -0.6197680234909058, -0.570806622505188, -0.521845281124115, -0.4728839099407196, -0.4239225685596466, -0.3749611973762512, -0.3259998559951782, -0.2770385146141052, -0.22807714343070984, -0.17911580204963684, -0.13015444576740265, -0.08119309693574905, -0.03223174810409546, 0.016729608178138733, 0.06569096446037292, 0.11465230584144592, 0.1636136770248413, 0.2125750184059143, 0.2615363597869873, 0.3104977309703827, 0.3594590723514557, 0.4084204435348511, 0.4573817849159241, 0.5063431262969971, 0.5553045272827148, 0.6042658090591431, 0.6532271504402161, 0.7021884918212891, 0.7511498928070068, 0.8001112341880798, 0.8490725755691528, 0.8980339169502258, 0.9469952583312988, 0.9959566593170166]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 12.0, 13.0, 14.0, 19.0, 25.0, 39.0, 40.0, 57.0, 80.0, 84.0, 106.0, 89.0, 95.0, 90.0, 69.0, 53.0, 48.0, 22.0, 18.0, 13.0, 10.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5825619697570801, -0.5521473288536072, -0.5217326283454895, -0.4913179874420166, -0.4609033167362213, -0.430488646030426, -0.4000740051269531, -0.36965933442115784, -0.33924466371536255, -0.30882999300956726, -0.278415322303772, -0.24800068140029907, -0.21758601069450378, -0.1871713399887085, -0.1567566841840744, -0.1263420283794403, -0.09592735767364502, -0.06551269441843033, -0.03509803116321564, -0.004683367908000946, 0.025731295347213745, 0.05614596605300903, 0.08656062185764313, 0.11697527766227722, 0.1473899483680725, 0.1778046190738678, 0.2082192748785019, 0.238633930683136, 0.2690486013889313, 0.29946327209472656, 0.32987791299819946, 0.36029258370399475, 0.39070725440979004, 0.4211219251155853, 0.4515365958213806, 0.4819512367248535, 0.5123659372329712, 0.5427805781364441, 0.573195219039917, 0.6036099195480347, 0.6340245604515076, 0.6644392013549805, 0.6948539018630981, 0.725268542766571, 0.755683183670044, 0.7860978841781616, 0.8165125250816345, 0.8469271659851074, 0.8773418664932251, 0.907756507396698, 0.9381712079048157, 0.9685858488082886, 0.9990005493164062, 1.0294151306152344, 1.059829831123352, 1.0902445316314697, 1.1206591129302979, 1.1510738134384155, 1.1814883947372437, 1.2119030952453613, 1.242317795753479, 1.2727324962615967, 1.3031470775604248, 1.3335617780685425, 1.3639764785766602]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 10.0, 5.0, 12.0, 14.0, 25.0, 48.0, 73.0, 123.0, 211.0, 457.0, 929.0, 2116.0, 5569.0, 17391.0, 68852.0, 340352.0, 475597.0, 100606.0, 23907.0, 7274.0, 2718.0, 1078.0, 515.0, 294.0, 154.0, 89.0, 36.0, 31.0, 23.0, 9.0, 6.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.88720703125, -0.859588623046875, -0.83197021484375, -0.804351806640625, -0.7767333984375, -0.749114990234375, -0.72149658203125, -0.693878173828125, -0.666259765625, -0.638641357421875, -0.61102294921875, -0.583404541015625, -0.5557861328125, -0.528167724609375, -0.50054931640625, -0.472930908203125, -0.4453125, -0.417694091796875, -0.39007568359375, -0.362457275390625, -0.3348388671875, -0.307220458984375, -0.27960205078125, -0.251983642578125, -0.224365234375, -0.196746826171875, -0.16912841796875, -0.141510009765625, -0.1138916015625, -0.086273193359375, -0.05865478515625, -0.031036376953125, -0.00341796875, 0.024200439453125, 0.05181884765625, 0.079437255859375, 0.1070556640625, 0.134674072265625, 0.16229248046875, 0.189910888671875, 0.217529296875, 0.245147705078125, 0.27276611328125, 0.300384521484375, 0.3280029296875, 0.355621337890625, 0.38323974609375, 0.410858154296875, 0.4384765625, 0.466094970703125, 0.49371337890625, 0.521331787109375, 0.5489501953125, 0.576568603515625, 0.60418701171875, 0.631805419921875, 0.659423828125, 0.687042236328125, 0.71466064453125, 0.742279052734375, 0.7698974609375, 0.797515869140625, 0.82513427734375, 0.852752685546875, 0.88037109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 5.0, 8.0, 5.0, 1.0, 7.0, 4.0, 5.0, 10.0, 9.0, 13.0, 18.0, 21.0, 16.0, 28.0, 35.0, 34.0, 36.0, 38.0, 43.0, 50.0, 51.0, 53.0, 56.0, 56.0, 47.0, 59.0, 38.0, 49.0, 37.0, 29.0, 31.0, 18.0, 24.0, 10.0, 5.0, 12.0, 9.0, 9.0, 1.0, 8.0, 2.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.962890625, -0.92828369140625, -0.8936767578125, -0.85906982421875, -0.824462890625, -0.78985595703125, -0.7552490234375, -0.72064208984375, -0.68603515625, -0.65142822265625, -0.6168212890625, -0.58221435546875, -0.547607421875, -0.51300048828125, -0.4783935546875, -0.44378662109375, -0.4091796875, -0.37457275390625, -0.3399658203125, -0.30535888671875, -0.270751953125, -0.23614501953125, -0.2015380859375, -0.16693115234375, -0.13232421875, -0.09771728515625, -0.0631103515625, -0.02850341796875, 0.006103515625, 0.04071044921875, 0.0753173828125, 0.10992431640625, 0.14453125, 0.17913818359375, 0.2137451171875, 0.24835205078125, 0.282958984375, 0.31756591796875, 0.3521728515625, 0.38677978515625, 0.42138671875, 0.45599365234375, 0.4906005859375, 0.52520751953125, 0.559814453125, 0.59442138671875, 0.6290283203125, 0.66363525390625, 0.6982421875, 0.73284912109375, 0.7674560546875, 0.80206298828125, 0.836669921875, 0.87127685546875, 0.9058837890625, 0.94049072265625, 0.97509765625, 1.00970458984375, 1.0443115234375, 1.07891845703125, 1.113525390625, 1.14813232421875, 1.1827392578125, 1.21734619140625, 1.251953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 2.0, 3.0, 9.0, 5.0, 10.0, 9.0, 13.0, 12.0, 16.0, 23.0, 30.0, 28.0, 23.0, 32.0, 30.0, 37.0, 57.0, 68.0, 155.0, 1229.0, 255419.0, 788490.0, 2263.0, 178.0, 60.0, 47.0, 44.0, 34.0, 31.0, 23.0, 29.0, 23.0, 18.0, 13.0, 11.0, 16.0, 12.0, 7.0, 9.0, 7.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.53125, -3.41387939453125, -3.2965087890625, -3.17913818359375, -3.061767578125, -2.94439697265625, -2.8270263671875, -2.70965576171875, -2.59228515625, -2.47491455078125, -2.3575439453125, -2.24017333984375, -2.122802734375, -2.00543212890625, -1.8880615234375, -1.77069091796875, -1.6533203125, -1.53594970703125, -1.4185791015625, -1.30120849609375, -1.183837890625, -1.06646728515625, -0.9490966796875, -0.83172607421875, -0.71435546875, -0.59698486328125, -0.4796142578125, -0.36224365234375, -0.244873046875, -0.12750244140625, -0.0101318359375, 0.10723876953125, 0.224609375, 0.34197998046875, 0.4593505859375, 0.57672119140625, 0.694091796875, 0.81146240234375, 0.9288330078125, 1.04620361328125, 1.16357421875, 1.28094482421875, 1.3983154296875, 1.51568603515625, 1.633056640625, 1.75042724609375, 1.8677978515625, 1.98516845703125, 2.1025390625, 2.21990966796875, 2.3372802734375, 2.45465087890625, 2.572021484375, 2.68939208984375, 2.8067626953125, 2.92413330078125, 3.04150390625, 3.15887451171875, 3.2762451171875, 3.39361572265625, 3.510986328125, 3.62835693359375, 3.7457275390625, 3.86309814453125, 3.98046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 7.0, 10.0, 8.0, 11.0, 8.0, 15.0, 18.0, 21.0, 31.0, 22.0, 26.0, 33.0, 36.0, 37.0, 44.0, 51.0, 38.0, 39.0, 29.0, 34.0, 34.0, 47.0, 38.0, 45.0, 36.0, 35.0, 30.0, 27.0, 30.0, 22.0, 16.0, 21.0, 18.0, 17.0, 12.0, 9.0, 4.0, 5.0, 7.0, 7.0, 2.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0625, -1.0273284912109375, -0.992156982421875, -0.9569854736328125, -0.92181396484375, -0.8866424560546875, -0.851470947265625, -0.8162994384765625, -0.7811279296875, -0.7459564208984375, -0.710784912109375, -0.6756134033203125, -0.64044189453125, -0.6052703857421875, -0.570098876953125, -0.5349273681640625, -0.499755859375, -0.4645843505859375, -0.429412841796875, -0.3942413330078125, -0.35906982421875, -0.3238983154296875, -0.288726806640625, -0.2535552978515625, -0.2183837890625, -0.1832122802734375, -0.148040771484375, -0.1128692626953125, -0.07769775390625, -0.0425262451171875, -0.007354736328125, 0.0278167724609375, 0.06298828125, 0.0981597900390625, 0.133331298828125, 0.1685028076171875, 0.20367431640625, 0.2388458251953125, 0.274017333984375, 0.3091888427734375, 0.3443603515625, 0.3795318603515625, 0.414703369140625, 0.4498748779296875, 0.48504638671875, 0.5202178955078125, 0.555389404296875, 0.5905609130859375, 0.625732421875, 0.6609039306640625, 0.696075439453125, 0.7312469482421875, 0.76641845703125, 0.8015899658203125, 0.836761474609375, 0.8719329833984375, 0.9071044921875, 0.9422760009765625, 0.977447509765625, 1.0126190185546875, 1.04779052734375, 1.0829620361328125, 1.118133544921875, 1.1533050537109375, 1.1884765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 4.0, 6.0, 11.0, 19.0, 19.0, 27.0, 36.0, 64.0, 139.0, 332.0, 840.0, 2899.0, 14592.0, 239253.0, 751387.0, 31689.0, 5047.0, 1325.0, 454.0, 175.0, 88.0, 56.0, 27.0, 23.0, 10.0, 12.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56494140625, -0.5484123229980469, -0.5318832397460938, -0.5153541564941406, -0.4988250732421875, -0.4822959899902344, -0.46576690673828125, -0.4492378234863281, -0.432708740234375, -0.4161796569824219, -0.39965057373046875, -0.3831214904785156, -0.3665924072265625, -0.3500633239746094, -0.33353424072265625, -0.3170051574707031, -0.30047607421875, -0.2839469909667969, -0.26741790771484375, -0.2508888244628906, -0.2343597412109375, -0.21783065795898438, -0.20130157470703125, -0.18477249145507812, -0.168243408203125, -0.15171432495117188, -0.13518524169921875, -0.11865615844726562, -0.1021270751953125, -0.08559799194335938, -0.06906890869140625, -0.052539825439453125, -0.0360107421875, -0.019481658935546875, -0.00295257568359375, 0.013576507568359375, 0.0301055908203125, 0.046634674072265625, 0.06316375732421875, 0.07969284057617188, 0.096221923828125, 0.11275100708007812, 0.12928009033203125, 0.14580917358398438, 0.1623382568359375, 0.17886734008789062, 0.19539642333984375, 0.21192550659179688, 0.22845458984375, 0.24498367309570312, 0.26151275634765625, 0.2780418395996094, 0.2945709228515625, 0.3111000061035156, 0.32762908935546875, 0.3441581726074219, 0.360687255859375, 0.3772163391113281, 0.39374542236328125, 0.4102745056152344, 0.4268035888671875, 0.4433326721191406, 0.45986175537109375, 0.4763908386230469, 0.492919921875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 7.0, 13.0, 14.0, 25.0, 27.0, 47.0, 79.0, 104.0, 120.0, 131.0, 141.0, 89.0, 61.0, 47.0, 23.0, 19.0, 6.0, 12.0, 8.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.650520324707031e-05, -5.495641380548477e-05, -5.340762436389923e-05, -5.185883492231369e-05, -5.031004548072815e-05, -4.876125603914261e-05, -4.721246659755707e-05, -4.566367715597153e-05, -4.4114887714385986e-05, -4.2566098272800446e-05, -4.1017308831214905e-05, -3.9468519389629364e-05, -3.791972994804382e-05, -3.637094050645828e-05, -3.482215106487274e-05, -3.32733616232872e-05, -3.172457218170166e-05, -3.017578274011612e-05, -2.862699329853058e-05, -2.7078203856945038e-05, -2.5529414415359497e-05, -2.3980624973773956e-05, -2.2431835532188416e-05, -2.0883046090602875e-05, -1.9334256649017334e-05, -1.7785467207431793e-05, -1.6236677765846252e-05, -1.4687888324260712e-05, -1.3139098882675171e-05, -1.159030944108963e-05, -1.004151999950409e-05, -8.492730557918549e-06, -6.943941116333008e-06, -5.395151674747467e-06, -3.846362233161926e-06, -2.2975727915763855e-06, -7.487833499908447e-07, 8.00006091594696e-07, 2.348795533180237e-06, 3.897584974765778e-06, 5.446374416351318e-06, 6.995163857936859e-06, 8.5439532995224e-06, 1.009274274110794e-05, 1.1641532182693481e-05, 1.3190321624279022e-05, 1.4739111065864563e-05, 1.6287900507450104e-05, 1.7836689949035645e-05, 1.9385479390621185e-05, 2.0934268832206726e-05, 2.2483058273792267e-05, 2.4031847715377808e-05, 2.558063715696335e-05, 2.712942659854889e-05, 2.867821604013443e-05, 3.022700548171997e-05, 3.177579492330551e-05, 3.332458436489105e-05, 3.487337380647659e-05, 3.6422163248062134e-05, 3.7970952689647675e-05, 3.9519742131233215e-05, 4.1068531572818756e-05, 4.26173210144043e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 12.0, 9.0, 16.0, 21.0, 28.0, 40.0, 83.0, 112.0, 170.0, 325.0, 565.0, 1196.0, 2534.0, 5890.0, 17636.0, 93069.0, 680771.0, 203071.0, 28498.0, 8054.0, 3211.0, 1507.0, 738.0, 406.0, 242.0, 118.0, 76.0, 49.0, 35.0, 23.0, 9.0, 12.0, 4.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24731826782226562, -0.23804473876953125, -0.22877120971679688, -0.2194976806640625, -0.21022415161132812, -0.20095062255859375, -0.19167709350585938, -0.182403564453125, -0.17313003540039062, -0.16385650634765625, -0.15458297729492188, -0.1453094482421875, -0.13603591918945312, -0.12676239013671875, -0.11748886108398438, -0.10821533203125, -0.09894180297851562, -0.08966827392578125, -0.08039474487304688, -0.0711212158203125, -0.061847686767578125, -0.05257415771484375, -0.043300628662109375, -0.034027099609375, -0.024753570556640625, -0.01548004150390625, -0.006206512451171875, 0.0030670166015625, 0.012340545654296875, 0.02161407470703125, 0.030887603759765625, 0.0401611328125, 0.049434661865234375, 0.05870819091796875, 0.06798171997070312, 0.0772552490234375, 0.08652877807617188, 0.09580230712890625, 0.10507583618164062, 0.114349365234375, 0.12362289428710938, 0.13289642333984375, 0.14216995239257812, 0.1514434814453125, 0.16071701049804688, 0.16999053955078125, 0.17926406860351562, 0.18853759765625, 0.19781112670898438, 0.20708465576171875, 0.21635818481445312, 0.2256317138671875, 0.23490524291992188, 0.24417877197265625, 0.2534523010253906, 0.262725830078125, 0.2719993591308594, 0.28127288818359375, 0.2905464172363281, 0.2998199462890625, 0.3090934753417969, 0.31836700439453125, 0.3276405334472656, 0.3369140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 6.0, 7.0, 7.0, 14.0, 20.0, 24.0, 35.0, 76.0, 170.0, 178.0, 170.0, 121.0, 68.0, 41.0, 19.0, 9.0, 9.0, 3.0, 8.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2037353515625, -0.19768714904785156, -0.19163894653320312, -0.1855907440185547, -0.17954254150390625, -0.1734943389892578, -0.16744613647460938, -0.16139793395996094, -0.1553497314453125, -0.14930152893066406, -0.14325332641601562, -0.1372051239013672, -0.13115692138671875, -0.1251087188720703, -0.11906051635742188, -0.11301231384277344, -0.106964111328125, -0.10091590881347656, -0.09486770629882812, -0.08881950378417969, -0.08277130126953125, -0.07672309875488281, -0.07067489624023438, -0.06462669372558594, -0.0585784912109375, -0.05253028869628906, -0.046482086181640625, -0.04043388366699219, -0.03438568115234375, -0.028337478637695312, -0.022289276123046875, -0.016241073608398438, -0.01019287109375, -0.0041446685791015625, 0.001903533935546875, 0.007951736450195312, 0.01399993896484375, 0.020048141479492188, 0.026096343994140625, 0.03214454650878906, 0.0381927490234375, 0.04424095153808594, 0.050289154052734375, 0.05633735656738281, 0.06238555908203125, 0.06843376159667969, 0.07448196411132812, 0.08053016662597656, 0.086578369140625, 0.09262657165527344, 0.09867477416992188, 0.10472297668457031, 0.11077117919921875, 0.11681938171386719, 0.12286758422851562, 0.12891578674316406, 0.1349639892578125, 0.14101219177246094, 0.14706039428710938, 0.1531085968017578, 0.15915679931640625, 0.1652050018310547, 0.17125320434570312, 0.17730140686035156, 0.183349609375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 13.0, 166.0, 544.0, 241.0, 34.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6267006397247314, -3.286273241043091, -2.94584584236145, -2.6054186820983887, -2.264991283416748, -1.9245637655258179, -1.5841364860534668, -1.2437090873718262, -0.9032816886901855, -0.5628542900085449, -0.22242695093154907, 0.11800038814544678, 0.4584277868270874, 0.798855185508728, 1.139282464981079, 1.4797098636627197, 1.8201372623443604, 2.160564661026001, 2.5009920597076416, 2.841419219970703, 3.1818466186523438, 3.5222740173339844, 3.862701416015625, 4.203128814697266, 4.543556213378906, 4.883983612060547, 5.2244110107421875, 5.564838409423828, 5.905265808105469, 6.245693206787109, 6.58612060546875, 6.926548004150391, 7.266974449157715, 7.6074018478393555, 7.947829246520996, 8.288256645202637, 8.628684043884277, 8.969111442565918, 9.309538841247559, 9.6499662399292, 9.99039363861084, 10.33082103729248, 10.671248435974121, 11.011675834655762, 11.352103233337402, 11.692530632019043, 12.032958030700684, 12.373385429382324, 12.713811874389648, 13.054239273071289, 13.39466667175293, 13.73509407043457, 14.075521469116211, 14.415948867797852, 14.756376266479492, 15.096803665161133, 15.437231063842773, 15.777658462524414, 16.118085861206055, 16.458513259887695, 16.798940658569336, 17.139368057250977, 17.479795455932617, 17.820222854614258, 18.1606502532959]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 12.0, 19.0, 21.0, 13.0, 19.0, 29.0, 24.0, 37.0, 39.0, 34.0, 46.0, 55.0, 49.0, 57.0, 46.0, 42.0, 45.0, 41.0, 50.0, 27.0, 34.0, 35.0, 32.0, 28.0, 26.0, 22.0, 18.0, 11.0, 17.0, 8.0, 4.0, 10.0, 5.0, 9.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7280319929122925, -1.6656150817871094, -1.6031981706619263, -1.5407812595367432, -1.47836434841156, -1.415947437286377, -1.3535306453704834, -1.2911136150360107, -1.2286968231201172, -1.166279911994934, -1.103863000869751, -1.0414460897445679, -0.9790291786193848, -0.9166122674942017, -0.8541954159736633, -0.7917785048484802, -0.7293615341186523, -0.6669446229934692, -0.6045277118682861, -0.542110800743103, -0.4796939194202423, -0.4172770082950592, -0.3548601269721985, -0.2924432158470154, -0.23002630472183228, -0.16760939359664917, -0.10519249737262726, -0.04277560114860535, 0.01964130997657776, 0.08205822110176086, 0.14447510242462158, 0.2068920135498047, 0.26930904388427734, 0.33172595500946045, 0.39414286613464355, 0.4565597474575043, 0.5189766883850098, 0.5813935995101929, 0.6438104510307312, 0.7062273621559143, 0.7686442732810974, 0.8310611844062805, 0.8934780955314636, 0.955894947052002, 1.018311858177185, 1.0807287693023682, 1.1431456804275513, 1.2055625915527344, 1.2679795026779175, 1.3303964138031006, 1.3928133249282837, 1.4552302360534668, 1.51764714717865, 1.580064058303833, 1.6424808502197266, 1.7048978805541992, 1.7673146724700928, 1.8297315835952759, 1.892148494720459, 1.954565405845642, 2.016982316970825, 2.0793991088867188, 2.1418161392211914, 2.204232931137085, 2.2666499614715576]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 16.0, 17.0, 17.0, 31.0, 37.0, 43.0, 84.0, 154.0, 384.0, 1462.0, 8976.0, 252547.0, 3845120.0, 78625.0, 5248.0, 925.0, 264.0, 117.0, 67.0, 47.0, 27.0, 18.0, 11.0, 19.0, 9.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5234375, -3.433929443359375, -3.34442138671875, -3.254913330078125, -3.1654052734375, -3.075897216796875, -2.98638916015625, -2.896881103515625, -2.807373046875, -2.717864990234375, -2.62835693359375, -2.538848876953125, -2.4493408203125, -2.359832763671875, -2.27032470703125, -2.180816650390625, -2.09130859375, -2.001800537109375, -1.91229248046875, -1.822784423828125, -1.7332763671875, -1.643768310546875, -1.55426025390625, -1.464752197265625, -1.375244140625, -1.285736083984375, -1.19622802734375, -1.106719970703125, -1.0172119140625, -0.927703857421875, -0.83819580078125, -0.748687744140625, -0.6591796875, -0.569671630859375, -0.48016357421875, -0.390655517578125, -0.3011474609375, -0.211639404296875, -0.12213134765625, -0.032623291015625, 0.056884765625, 0.146392822265625, 0.23590087890625, 0.325408935546875, 0.4149169921875, 0.504425048828125, 0.59393310546875, 0.683441162109375, 0.77294921875, 0.862457275390625, 0.95196533203125, 1.041473388671875, 1.1309814453125, 1.220489501953125, 1.30999755859375, 1.399505615234375, 1.489013671875, 1.578521728515625, 1.66802978515625, 1.757537841796875, 1.8470458984375, 1.936553955078125, 2.02606201171875, 2.115570068359375, 2.205078125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 13.0, 7.0, 13.0, 18.0, 15.0, 22.0, 22.0, 26.0, 25.0, 36.0, 46.0, 45.0, 60.0, 56.0, 54.0, 61.0, 59.0, 46.0, 46.0, 47.0, 57.0, 48.0, 23.0, 29.0, 21.0, 20.0, 13.0, 11.0, 11.0, 8.0, 4.0, 8.0, 2.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.79931640625, -0.776123046875, -0.7529296875, -0.729736328125, -0.70654296875, -0.683349609375, -0.66015625, -0.636962890625, -0.61376953125, -0.590576171875, -0.5673828125, -0.544189453125, -0.52099609375, -0.497802734375, -0.474609375, -0.451416015625, -0.42822265625, -0.405029296875, -0.3818359375, -0.358642578125, -0.33544921875, -0.312255859375, -0.2890625, -0.265869140625, -0.24267578125, -0.219482421875, -0.1962890625, -0.173095703125, -0.14990234375, -0.126708984375, -0.103515625, -0.080322265625, -0.05712890625, -0.033935546875, -0.0107421875, 0.012451171875, 0.03564453125, 0.058837890625, 0.08203125, 0.105224609375, 0.12841796875, 0.151611328125, 0.1748046875, 0.197998046875, 0.22119140625, 0.244384765625, 0.267578125, 0.290771484375, 0.31396484375, 0.337158203125, 0.3603515625, 0.383544921875, 0.40673828125, 0.429931640625, 0.453125, 0.476318359375, 0.49951171875, 0.522705078125, 0.5458984375, 0.569091796875, 0.59228515625, 0.615478515625, 0.638671875, 0.661865234375, 0.68505859375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 11.0, 24.0, 54.0, 134.0, 556.0, 19706.0, 4162949.0, 10191.0, 459.0, 107.0, 36.0, 13.0, 8.0, 4.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41015625, -6.22930908203125, -6.0484619140625, -5.86761474609375, -5.686767578125, -5.50592041015625, -5.3250732421875, -5.14422607421875, -4.96337890625, -4.78253173828125, -4.6016845703125, -4.42083740234375, -4.239990234375, -4.05914306640625, -3.8782958984375, -3.69744873046875, -3.5166015625, -3.33575439453125, -3.1549072265625, -2.97406005859375, -2.793212890625, -2.61236572265625, -2.4315185546875, -2.25067138671875, -2.06982421875, -1.88897705078125, -1.7081298828125, -1.52728271484375, -1.346435546875, -1.16558837890625, -0.9847412109375, -0.80389404296875, -0.623046875, -0.44219970703125, -0.2613525390625, -0.08050537109375, 0.100341796875, 0.28118896484375, 0.4620361328125, 0.64288330078125, 0.82373046875, 1.00457763671875, 1.1854248046875, 1.36627197265625, 1.547119140625, 1.72796630859375, 1.9088134765625, 2.08966064453125, 2.2705078125, 2.45135498046875, 2.6322021484375, 2.81304931640625, 2.993896484375, 3.17474365234375, 3.3555908203125, 3.53643798828125, 3.71728515625, 3.89813232421875, 4.0789794921875, 4.25982666015625, 4.440673828125, 4.62152099609375, 4.8023681640625, 4.98321533203125, 5.1640625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 5.0, 8.0, 15.0, 6.0, 14.0, 17.0, 29.0, 33.0, 50.0, 100.0, 137.0, 164.0, 257.0, 393.0, 611.0, 725.0, 479.0, 328.0, 207.0, 137.0, 81.0, 75.0, 51.0, 39.0, 21.0, 13.0, 19.0, 11.0, 14.0, 12.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.27099609375, -0.2619972229003906, -0.25299835205078125, -0.24399948120117188, -0.2350006103515625, -0.22600173950195312, -0.21700286865234375, -0.20800399780273438, -0.199005126953125, -0.19000625610351562, -0.18100738525390625, -0.17200851440429688, -0.1630096435546875, -0.15401077270507812, -0.14501190185546875, -0.13601303100585938, -0.12701416015625, -0.11801528930664062, -0.10901641845703125, -0.10001754760742188, -0.0910186767578125, -0.08201980590820312, -0.07302093505859375, -0.06402206420898438, -0.055023193359375, -0.046024322509765625, -0.03702545166015625, -0.028026580810546875, -0.0190277099609375, -0.010028839111328125, -0.00102996826171875, 0.007968902587890625, 0.0169677734375, 0.025966644287109375, 0.03496551513671875, 0.043964385986328125, 0.0529632568359375, 0.061962127685546875, 0.07096099853515625, 0.07995986938476562, 0.088958740234375, 0.09795761108398438, 0.10695648193359375, 0.11595535278320312, 0.1249542236328125, 0.13395309448242188, 0.14295196533203125, 0.15195083618164062, 0.16094970703125, 0.16994857788085938, 0.17894744873046875, 0.18794631958007812, 0.1969451904296875, 0.20594406127929688, 0.21494293212890625, 0.22394180297851562, 0.232940673828125, 0.24193954467773438, 0.25093841552734375, 0.2599372863769531, 0.2689361572265625, 0.2779350280761719, 0.28693389892578125, 0.2959327697753906, 0.304931640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 11.0, 15.0, 23.0, 40.0, 65.0, 67.0, 96.0, 119.0, 125.0, 118.0, 94.0, 60.0, 45.0, 30.0, 23.0, 10.0, 12.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7117741107940674, -1.665800929069519, -1.6198277473449707, -1.573854684829712, -1.5278815031051636, -1.4819083213806152, -1.435935139656067, -1.3899619579315186, -1.3439888954162598, -1.2980157136917114, -1.252042531967163, -1.2060694694519043, -1.160096287727356, -1.1141231060028076, -1.0681499242782593, -1.022176742553711, -0.9762036204338074, -0.930230438709259, -0.8842573165893555, -0.8382841348648071, -0.7923110127449036, -0.7463378310203552, -0.7003647089004517, -0.6543915271759033, -0.608418345451355, -0.5624451637268066, -0.5164720416069031, -0.47049885988235474, -0.42452573776245117, -0.37855255603790283, -0.3325794041156769, -0.2866062521934509, -0.24063313007354736, -0.1946599781513214, -0.14868682622909546, -0.10271365940570831, -0.05674050748348236, -0.010767355561256409, 0.03520581126213074, 0.08117896318435669, 0.12715211510658264, 0.1731252670288086, 0.21909841895103455, 0.2650715708732605, 0.31104475259780884, 0.3570178747177124, 0.40299105644226074, 0.4489642083644867, 0.49493736028671265, 0.540910542011261, 0.5868836641311646, 0.6328568458557129, 0.6788299679756165, 0.7248031497001648, 0.7707762718200684, 0.8167494535446167, 0.862722635269165, 0.9086958169937134, 0.9546689391136169, 1.0006420612335205, 1.0466152429580688, 1.0925884246826172, 1.1385616064071655, 1.1845347881317139, 1.2305078506469727]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 4.0, 5.0, 7.0, 6.0, 9.0, 10.0, 15.0, 13.0, 18.0, 17.0, 19.0, 27.0, 40.0, 34.0, 45.0, 58.0, 55.0, 54.0, 52.0, 42.0, 54.0, 50.0, 43.0, 45.0, 47.0, 41.0, 41.0, 24.0, 30.0, 19.0, 17.0, 14.0, 12.0, 7.0, 12.0, 3.0, 5.0, 1.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6875497102737427, -0.6619414687156677, -0.6363332271575928, -0.6107249855995178, -0.5851167440414429, -0.5595084428787231, -0.5339002013206482, -0.5082919597625732, -0.4826837182044983, -0.45707547664642334, -0.4314672350883484, -0.40585896372795105, -0.3802507221698761, -0.35464248061180115, -0.3290342092514038, -0.30342596769332886, -0.2778177261352539, -0.25220948457717896, -0.2266012281179428, -0.20099297165870667, -0.1753847301006317, -0.14977648854255676, -0.12416823208332062, -0.09855997562408447, -0.07295173406600952, -0.04734348505735397, -0.021735236048698425, 0.003873012959957123, 0.02948126196861267, 0.05508950352668762, 0.08069775998592377, 0.10630601644515991, 0.13191425800323486, 0.15752249956130981, 0.18313075602054596, 0.2087390124797821, 0.23434725403785706, 0.259955495595932, 0.28556376695632935, 0.3111720085144043, 0.33678025007247925, 0.3623884916305542, 0.38799673318862915, 0.4136050045490265, 0.43921324610710144, 0.4648214876651764, 0.49042975902557373, 0.5160380005836487, 0.5416462421417236, 0.5672544836997986, 0.5928627252578735, 0.6184709668159485, 0.6440792083740234, 0.6696875095367432, 0.6952957510948181, 0.7209039926528931, 0.746512234210968, 0.772120475769043, 0.7977287173271179, 0.8233369588851929, 0.8489452600479126, 0.8745534420013428, 0.9001617431640625, 0.9257699847221375, 0.9513782262802124]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 10.0, 11.0, 18.0, 33.0, 55.0, 109.0, 192.0, 422.0, 920.0, 2373.0, 6786.0, 26600.0, 167301.0, 670373.0, 140018.0, 23575.0, 6058.0, 2064.0, 838.0, 379.0, 192.0, 102.0, 40.0, 25.0, 20.0, 8.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.51171875, -0.4968681335449219, -0.48201751708984375, -0.4671669006347656, -0.4523162841796875, -0.4374656677246094, -0.42261505126953125, -0.4077644348144531, -0.392913818359375, -0.3780632019042969, -0.36321258544921875, -0.3483619689941406, -0.3335113525390625, -0.3186607360839844, -0.30381011962890625, -0.2889595031738281, -0.27410888671875, -0.2592582702636719, -0.24440765380859375, -0.22955703735351562, -0.2147064208984375, -0.19985580444335938, -0.18500518798828125, -0.17015457153320312, -0.155303955078125, -0.14045333862304688, -0.12560272216796875, -0.11075210571289062, -0.0959014892578125, -0.08105087280273438, -0.06620025634765625, -0.051349639892578125, -0.0364990234375, -0.021648406982421875, -0.00679779052734375, 0.008052825927734375, 0.0229034423828125, 0.037754058837890625, 0.05260467529296875, 0.06745529174804688, 0.082305908203125, 0.09715652465820312, 0.11200714111328125, 0.12685775756835938, 0.1417083740234375, 0.15655899047851562, 0.17140960693359375, 0.18626022338867188, 0.20111083984375, 0.21596145629882812, 0.23081207275390625, 0.24566268920898438, 0.2605133056640625, 0.2753639221191406, 0.29021453857421875, 0.3050651550292969, 0.319915771484375, 0.3347663879394531, 0.34961700439453125, 0.3644676208496094, 0.3793182373046875, 0.3941688537597656, 0.40901947021484375, 0.4238700866699219, 0.438720703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 7.0, 3.0, 2.0, 11.0, 7.0, 10.0, 10.0, 18.0, 24.0, 17.0, 28.0, 28.0, 31.0, 41.0, 40.0, 53.0, 63.0, 50.0, 53.0, 55.0, 47.0, 45.0, 43.0, 45.0, 50.0, 37.0, 34.0, 23.0, 23.0, 15.0, 16.0, 12.0, 13.0, 10.0, 12.0, 7.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.53564453125, -0.5204238891601562, -0.5052032470703125, -0.48998260498046875, -0.474761962890625, -0.45954132080078125, -0.4443206787109375, -0.42910003662109375, -0.41387939453125, -0.39865875244140625, -0.3834381103515625, -0.36821746826171875, -0.352996826171875, -0.33777618408203125, -0.3225555419921875, -0.30733489990234375, -0.2921142578125, -0.27689361572265625, -0.2616729736328125, -0.24645233154296875, -0.231231689453125, -0.21601104736328125, -0.2007904052734375, -0.18556976318359375, -0.17034912109375, -0.15512847900390625, -0.1399078369140625, -0.12468719482421875, -0.109466552734375, -0.09424591064453125, -0.0790252685546875, -0.06380462646484375, -0.048583984375, -0.03336334228515625, -0.0181427001953125, -0.00292205810546875, 0.012298583984375, 0.02751922607421875, 0.0427398681640625, 0.05796051025390625, 0.07318115234375, 0.08840179443359375, 0.1036224365234375, 0.11884307861328125, 0.134063720703125, 0.14928436279296875, 0.1645050048828125, 0.17972564697265625, 0.1949462890625, 0.21016693115234375, 0.2253875732421875, 0.24060821533203125, 0.255828857421875, 0.27104949951171875, 0.2862701416015625, 0.30149078369140625, 0.31671142578125, 0.33193206787109375, 0.3471527099609375, 0.36237335205078125, 0.377593994140625, 0.39281463623046875, 0.4080352783203125, 0.42325592041015625, 0.4384765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 5.0, 5.0, 6.0, 8.0, 12.0, 26.0, 22.0, 46.0, 42.0, 95.0, 130.0, 266.0, 444.0, 867.0, 1986.0, 4717.0, 14209.0, 55964.0, 345557.0, 509751.0, 84080.0, 19183.0, 6266.0, 2494.0, 1073.0, 527.0, 294.0, 167.0, 110.0, 61.0, 51.0, 24.0, 19.0, 10.0, 10.0, 12.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2998046875, -0.29047393798828125, -0.2811431884765625, -0.27181243896484375, -0.262481689453125, -0.25315093994140625, -0.2438201904296875, -0.23448944091796875, -0.22515869140625, -0.21582794189453125, -0.2064971923828125, -0.19716644287109375, -0.187835693359375, -0.17850494384765625, -0.1691741943359375, -0.15984344482421875, -0.1505126953125, -0.14118194580078125, -0.1318511962890625, -0.12252044677734375, -0.113189697265625, -0.10385894775390625, -0.0945281982421875, -0.08519744873046875, -0.07586669921875, -0.06653594970703125, -0.0572052001953125, -0.04787445068359375, -0.038543701171875, -0.02921295166015625, -0.0198822021484375, -0.01055145263671875, -0.001220703125, 0.00811004638671875, 0.0174407958984375, 0.02677154541015625, 0.036102294921875, 0.04543304443359375, 0.0547637939453125, 0.06409454345703125, 0.07342529296875, 0.08275604248046875, 0.0920867919921875, 0.10141754150390625, 0.110748291015625, 0.12007904052734375, 0.1294097900390625, 0.13874053955078125, 0.1480712890625, 0.15740203857421875, 0.1667327880859375, 0.17606353759765625, 0.185394287109375, 0.19472503662109375, 0.2040557861328125, 0.21338653564453125, 0.22271728515625, 0.23204803466796875, 0.2413787841796875, 0.25070953369140625, 0.260040283203125, 0.26937103271484375, 0.2787017822265625, 0.28803253173828125, 0.29736328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 7.0, 13.0, 5.0, 14.0, 16.0, 20.0, 25.0, 31.0, 32.0, 40.0, 36.0, 42.0, 38.0, 37.0, 40.0, 46.0, 48.0, 48.0, 43.0, 43.0, 39.0, 36.0, 34.0, 30.0, 34.0, 32.0, 26.0, 25.0, 18.0, 20.0, 17.0, 13.0, 8.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7529220581054688, -0.7270355224609375, -0.7011489868164062, -0.675262451171875, -0.6493759155273438, -0.6234893798828125, -0.5976028442382812, -0.57171630859375, -0.5458297729492188, -0.5199432373046875, -0.49405670166015625, -0.468170166015625, -0.44228363037109375, -0.4163970947265625, -0.39051055908203125, -0.3646240234375, -0.33873748779296875, -0.3128509521484375, -0.28696441650390625, -0.261077880859375, -0.23519134521484375, -0.2093048095703125, -0.18341827392578125, -0.15753173828125, -0.13164520263671875, -0.1057586669921875, -0.07987213134765625, -0.053985595703125, -0.02809906005859375, -0.0022125244140625, 0.02367401123046875, 0.049560546875, 0.07544708251953125, 0.1013336181640625, 0.12722015380859375, 0.153106689453125, 0.17899322509765625, 0.2048797607421875, 0.23076629638671875, 0.25665283203125, 0.28253936767578125, 0.3084259033203125, 0.33431243896484375, 0.360198974609375, 0.38608551025390625, 0.4119720458984375, 0.43785858154296875, 0.4637451171875, 0.48963165283203125, 0.5155181884765625, 0.5414047241210938, 0.567291259765625, 0.5931777954101562, 0.6190643310546875, 0.6449508666992188, 0.67083740234375, 0.6967239379882812, 0.7226104736328125, 0.7484970092773438, 0.774383544921875, 0.8002700805664062, 0.8261566162109375, 0.8520431518554688, 0.8779296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 10.0, 15.0, 21.0, 32.0, 43.0, 93.0, 187.0, 314.0, 741.0, 1848.0, 5876.0, 33158.0, 694486.0, 287382.0, 17775.0, 4155.0, 1340.0, 551.0, 243.0, 118.0, 65.0, 27.0, 30.0, 9.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152587890625, -0.14490127563476562, -0.13721466064453125, -0.12952804565429688, -0.1218414306640625, -0.11415481567382812, -0.10646820068359375, -0.09878158569335938, -0.091094970703125, -0.08340835571289062, -0.07572174072265625, -0.06803512573242188, -0.0603485107421875, -0.052661895751953125, -0.04497528076171875, -0.037288665771484375, -0.02960205078125, -0.021915435791015625, -0.01422882080078125, -0.006542205810546875, 0.0011444091796875, 0.008831024169921875, 0.01651763916015625, 0.024204254150390625, 0.031890869140625, 0.039577484130859375, 0.04726409912109375, 0.054950714111328125, 0.0626373291015625, 0.07032394409179688, 0.07801055908203125, 0.08569717407226562, 0.0933837890625, 0.10107040405273438, 0.10875701904296875, 0.11644363403320312, 0.1241302490234375, 0.13181686401367188, 0.13950347900390625, 0.14719009399414062, 0.154876708984375, 0.16256332397460938, 0.17024993896484375, 0.17793655395507812, 0.1856231689453125, 0.19330978393554688, 0.20099639892578125, 0.20868301391601562, 0.21636962890625, 0.22405624389648438, 0.23174285888671875, 0.23942947387695312, 0.2471160888671875, 0.2548027038574219, 0.26248931884765625, 0.2701759338378906, 0.277862548828125, 0.2855491638183594, 0.29323577880859375, 0.3009223937988281, 0.3086090087890625, 0.3162956237792969, 0.32398223876953125, 0.3316688537597656, 0.33935546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 14.0, 16.0, 19.0, 25.0, 40.0, 60.0, 98.0, 127.0, 125.0, 126.0, 113.0, 61.0, 48.0, 31.0, 15.0, 16.0, 8.0, 8.0, 7.0, 9.0, 4.0, 4.0, 1.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.91278076171875e-05, -5.671940743923187e-05, -5.4311007261276245e-05, -5.190260708332062e-05, -4.949420690536499e-05, -4.708580672740936e-05, -4.4677406549453735e-05, -4.226900637149811e-05, -3.986060619354248e-05, -3.745220601558685e-05, -3.5043805837631226e-05, -3.26354056596756e-05, -3.022700548171997e-05, -2.7818605303764343e-05, -2.5410205125808716e-05, -2.300180494785309e-05, -2.059340476989746e-05, -1.8185004591941833e-05, -1.5776604413986206e-05, -1.3368204236030579e-05, -1.0959804058074951e-05, -8.551403880119324e-06, -6.143003702163696e-06, -3.734603524208069e-06, -1.3262033462524414e-06, 1.082196831703186e-06, 3.4905970096588135e-06, 5.898997187614441e-06, 8.307397365570068e-06, 1.0715797543525696e-05, 1.3124197721481323e-05, 1.553259789943695e-05, 1.7940998077392578e-05, 2.0349398255348206e-05, 2.2757798433303833e-05, 2.516619861125946e-05, 2.7574598789215088e-05, 2.9982998967170715e-05, 3.239139914512634e-05, 3.479979932308197e-05, 3.72081995010376e-05, 3.9616599678993225e-05, 4.202499985694885e-05, 4.443340003490448e-05, 4.684180021286011e-05, 4.9250200390815735e-05, 5.165860056877136e-05, 5.406700074672699e-05, 5.647540092468262e-05, 5.8883801102638245e-05, 6.129220128059387e-05, 6.37006014585495e-05, 6.610900163650513e-05, 6.851740181446075e-05, 7.092580199241638e-05, 7.333420217037201e-05, 7.574260234832764e-05, 7.815100252628326e-05, 8.055940270423889e-05, 8.296780288219452e-05, 8.537620306015015e-05, 8.778460323810577e-05, 9.01930034160614e-05, 9.260140359401703e-05, 9.500980377197266e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 6.0, 13.0, 27.0, 25.0, 44.0, 65.0, 88.0, 190.0, 276.0, 509.0, 937.0, 2008.0, 5075.0, 18600.0, 134701.0, 719955.0, 137771.0, 18700.0, 5224.0, 2093.0, 988.0, 494.0, 313.0, 160.0, 97.0, 64.0, 31.0, 27.0, 21.0, 18.0, 11.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.212158203125, -0.20618247985839844, -0.20020675659179688, -0.1942310333251953, -0.18825531005859375, -0.1822795867919922, -0.17630386352539062, -0.17032814025878906, -0.1643524169921875, -0.15837669372558594, -0.15240097045898438, -0.1464252471923828, -0.14044952392578125, -0.1344738006591797, -0.12849807739257812, -0.12252235412597656, -0.116546630859375, -0.11057090759277344, -0.10459518432617188, -0.09861946105957031, -0.09264373779296875, -0.08666801452636719, -0.08069229125976562, -0.07471656799316406, -0.0687408447265625, -0.06276512145996094, -0.056789398193359375, -0.05081367492675781, -0.04483795166015625, -0.03886222839355469, -0.032886505126953125, -0.026910781860351562, -0.02093505859375, -0.014959335327148438, -0.008983612060546875, -0.0030078887939453125, 0.00296783447265625, 0.008943557739257812, 0.014919281005859375, 0.020895004272460938, 0.0268707275390625, 0.03284645080566406, 0.038822174072265625, 0.04479789733886719, 0.05077362060546875, 0.05674934387207031, 0.06272506713867188, 0.06870079040527344, 0.074676513671875, 0.08065223693847656, 0.08662796020507812, 0.09260368347167969, 0.09857940673828125, 0.10455513000488281, 0.11053085327148438, 0.11650657653808594, 0.1224822998046875, 0.12845802307128906, 0.13443374633789062, 0.1404094696044922, 0.14638519287109375, 0.1523609161376953, 0.15833663940429688, 0.16431236267089844, 0.1702880859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 9.0, 16.0, 8.0, 31.0, 49.0, 59.0, 102.0, 148.0, 147.0, 155.0, 85.0, 67.0, 42.0, 30.0, 18.0, 7.0, 11.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.053314208984375, -0.05176115036010742, -0.050208091735839844, -0.048655033111572266, -0.04710197448730469, -0.04554891586303711, -0.04399585723876953, -0.04244279861450195, -0.040889739990234375, -0.0393366813659668, -0.03778362274169922, -0.03623056411743164, -0.03467750549316406, -0.033124446868896484, -0.031571388244628906, -0.030018329620361328, -0.02846527099609375, -0.026912212371826172, -0.025359153747558594, -0.023806095123291016, -0.022253036499023438, -0.02069997787475586, -0.01914691925048828, -0.017593860626220703, -0.016040802001953125, -0.014487743377685547, -0.012934684753417969, -0.01138162612915039, -0.009828567504882812, -0.008275508880615234, -0.006722450256347656, -0.005169391632080078, -0.0036163330078125, -0.002063274383544922, -0.0005102157592773438, 0.0010428428649902344, 0.0025959014892578125, 0.004148960113525391, 0.005702018737792969, 0.007255077362060547, 0.008808135986328125, 0.010361194610595703, 0.011914253234863281, 0.01346731185913086, 0.015020370483398438, 0.016573429107666016, 0.018126487731933594, 0.019679546356201172, 0.02123260498046875, 0.022785663604736328, 0.024338722229003906, 0.025891780853271484, 0.027444839477539062, 0.02899789810180664, 0.03055095672607422, 0.0321040153503418, 0.033657073974609375, 0.03521013259887695, 0.03676319122314453, 0.03831624984741211, 0.03986930847167969, 0.041422367095947266, 0.042975425720214844, 0.04452848434448242, 0.04608154296875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 14.0, 10.0, 24.0, 46.0, 67.0, 101.0, 146.0, 157.0, 157.0, 87.0, 70.0, 41.0, 19.0, 12.0, 9.0, 7.0, 4.0, 7.0, 2.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.3876785039901733, -1.3533293008804321, -1.3189799785614014, -1.2846307754516602, -1.250281572341919, -1.2159322500228882, -1.181583046913147, -1.1472338438034058, -1.112884521484375, -1.0785353183746338, -1.044185996055603, -1.0098367929458618, -0.9754875302314758, -0.9411382675170898, -0.9067890644073486, -0.8724398016929626, -0.8380905985832214, -0.8037413358688354, -0.7693921327590942, -0.7350428700447083, -0.7006936073303223, -0.666344404220581, -0.6319951415061951, -0.5976458787918091, -0.5632966756820679, -0.5289474129676819, -0.4945981800556183, -0.4602489471435547, -0.4258996844291687, -0.3915504515171051, -0.3572012186050415, -0.3228519558906555, -0.28850269317626953, -0.25415346026420593, -0.21980419754981995, -0.18545496463775635, -0.15110571682453156, -0.11675646901130676, -0.08240723609924316, -0.04805798828601837, -0.013708740472793579, 0.020640503615140915, 0.05498974770307541, 0.0893389880657196, 0.1236882358789444, 0.1580374836921692, 0.1923867166042328, 0.22673596441745758, 0.2610852122306824, 0.29543444514274597, 0.32978370785713196, 0.36413294076919556, 0.39848220348358154, 0.43283143639564514, 0.46718066930770874, 0.5015299320220947, 0.5358791351318359, 0.5702283978462219, 0.6045776009559631, 0.6389268636703491, 0.6732761263847351, 0.7076253890991211, 0.7419745922088623, 0.7763238549232483, 0.8106731176376343]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 3.0, 5.0, 9.0, 12.0, 17.0, 16.0, 13.0, 26.0, 26.0, 27.0, 37.0, 47.0, 49.0, 75.0, 54.0, 55.0, 56.0, 56.0, 58.0, 46.0, 50.0, 44.0, 44.0, 30.0, 32.0, 11.0, 17.0, 13.0, 13.0, 13.0, 7.0, 8.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4653225243091583, -0.4494207203388214, -0.4335188865661621, -0.4176170825958252, -0.4017152786254883, -0.38581347465515137, -0.36991167068481445, -0.35400983691215515, -0.33810803294181824, -0.3222062289714813, -0.306304395198822, -0.2904025912284851, -0.2745007872581482, -0.2585989832878113, -0.24269716441631317, -0.22679534554481506, -0.21089354157447815, -0.19499173760414124, -0.17908991873264313, -0.16318809986114502, -0.1472862958908081, -0.1313844919204712, -0.11548267304897308, -0.09958086162805557, -0.08367905020713806, -0.06777723878622055, -0.05187542736530304, -0.03597361594438553, -0.020071804523468018, -0.004169993102550507, 0.011731818318367004, 0.027633629739284515, 0.04353541135787964, 0.05943722277879715, 0.07533903419971466, 0.09124084562063217, 0.10714265704154968, 0.1230444684624672, 0.1389462798833847, 0.1548480987548828, 0.17074990272521973, 0.18665170669555664, 0.20255352556705475, 0.21845534443855286, 0.23435714840888977, 0.2502589523792267, 0.266160786151886, 0.2820625901222229, 0.2979643940925598, 0.31386619806289673, 0.32976800203323364, 0.34566983580589294, 0.36157163977622986, 0.3774734437465668, 0.3933752775192261, 0.409277081489563, 0.4251788854598999, 0.4410806894302368, 0.45698249340057373, 0.47288432717323303, 0.48878613114356995, 0.5046879649162292, 0.5205897688865662, 0.5364915728569031, 0.55239337682724]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 9.0, 12.0, 9.0, 28.0, 37.0, 68.0, 99.0, 182.0, 275.0, 497.0, 1003.0, 1855.0, 4036.0, 9772.0, 30354.0, 180402.0, 662631.0, 118373.0, 23823.0, 8023.0, 3358.0, 1643.0, 890.0, 459.0, 287.0, 160.0, 89.0, 75.0, 36.0, 24.0, 13.0, 10.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9541015625, -0.9263687133789062, -0.8986358642578125, -0.8709030151367188, -0.843170166015625, -0.8154373168945312, -0.7877044677734375, -0.7599716186523438, -0.73223876953125, -0.7045059204101562, -0.6767730712890625, -0.6490402221679688, -0.621307373046875, -0.5935745239257812, -0.5658416748046875, -0.5381088256835938, -0.5103759765625, -0.48264312744140625, -0.4549102783203125, -0.42717742919921875, -0.399444580078125, -0.37171173095703125, -0.3439788818359375, -0.31624603271484375, -0.28851318359375, -0.26078033447265625, -0.2330474853515625, -0.20531463623046875, -0.177581787109375, -0.14984893798828125, -0.1221160888671875, -0.09438323974609375, -0.066650390625, -0.03891754150390625, -0.0111846923828125, 0.01654815673828125, 0.044281005859375, 0.07201385498046875, 0.0997467041015625, 0.12747955322265625, 0.15521240234375, 0.18294525146484375, 0.2106781005859375, 0.23841094970703125, 0.266143798828125, 0.29387664794921875, 0.3216094970703125, 0.34934234619140625, 0.3770751953125, 0.40480804443359375, 0.4325408935546875, 0.46027374267578125, 0.488006591796875, 0.5157394409179688, 0.5434722900390625, 0.5712051391601562, 0.59893798828125, 0.6266708374023438, 0.6544036865234375, 0.6821365356445312, 0.709869384765625, 0.7376022338867188, 0.7653350830078125, 0.7930679321289062, 0.82080078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 8.0, 7.0, 7.0, 17.0, 18.0, 26.0, 25.0, 28.0, 38.0, 48.0, 55.0, 48.0, 56.0, 69.0, 69.0, 62.0, 62.0, 52.0, 60.0, 47.0, 34.0, 37.0, 28.0, 23.0, 12.0, 14.0, 12.0, 6.0, 5.0, 5.0, 3.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2822265625, -1.240234375, -1.1982421875, -1.15625, -1.1142578125, -1.072265625, -1.0302734375, -0.98828125, -0.9462890625, -0.904296875, -0.8623046875, -0.8203125, -0.7783203125, -0.736328125, -0.6943359375, -0.65234375, -0.6103515625, -0.568359375, -0.5263671875, -0.484375, -0.4423828125, -0.400390625, -0.3583984375, -0.31640625, -0.2744140625, -0.232421875, -0.1904296875, -0.1484375, -0.1064453125, -0.064453125, -0.0224609375, 0.01953125, 0.0615234375, 0.103515625, 0.1455078125, 0.1875, 0.2294921875, 0.271484375, 0.3134765625, 0.35546875, 0.3974609375, 0.439453125, 0.4814453125, 0.5234375, 0.5654296875, 0.607421875, 0.6494140625, 0.69140625, 0.7333984375, 0.775390625, 0.8173828125, 0.859375, 0.9013671875, 0.943359375, 0.9853515625, 1.02734375, 1.0693359375, 1.111328125, 1.1533203125, 1.1953125, 1.2373046875, 1.279296875, 1.3212890625, 1.36328125, 1.4052734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 5.0, 5.0, 6.0, 10.0, 9.0, 13.0, 16.0, 14.0, 27.0, 27.0, 50.0, 34.0, 38.0, 44.0, 105.0, 300.0, 4763.0, 1001645.0, 40078.0, 862.0, 138.0, 59.0, 45.0, 43.0, 45.0, 25.0, 15.0, 27.0, 19.0, 15.0, 11.0, 8.0, 16.0, 9.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.6640625, -4.533538818359375, -4.40301513671875, -4.272491455078125, -4.1419677734375, -4.011444091796875, -3.88092041015625, -3.750396728515625, -3.619873046875, -3.489349365234375, -3.35882568359375, -3.228302001953125, -3.0977783203125, -2.967254638671875, -2.83673095703125, -2.706207275390625, -2.57568359375, -2.445159912109375, -2.31463623046875, -2.184112548828125, -2.0535888671875, -1.923065185546875, -1.79254150390625, -1.662017822265625, -1.531494140625, -1.400970458984375, -1.27044677734375, -1.139923095703125, -1.0093994140625, -0.878875732421875, -0.74835205078125, -0.617828369140625, -0.4873046875, -0.356781005859375, -0.22625732421875, -0.095733642578125, 0.0347900390625, 0.165313720703125, 0.29583740234375, 0.426361083984375, 0.556884765625, 0.687408447265625, 0.81793212890625, 0.948455810546875, 1.0789794921875, 1.209503173828125, 1.34002685546875, 1.470550537109375, 1.60107421875, 1.731597900390625, 1.86212158203125, 1.992645263671875, 2.1231689453125, 2.253692626953125, 2.38421630859375, 2.514739990234375, 2.645263671875, 2.775787353515625, 2.90631103515625, 3.036834716796875, 3.1673583984375, 3.297882080078125, 3.42840576171875, 3.558929443359375, 3.689453125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 5.0, 8.0, 7.0, 7.0, 15.0, 21.0, 25.0, 18.0, 39.0, 37.0, 49.0, 38.0, 38.0, 61.0, 42.0, 50.0, 36.0, 43.0, 55.0, 39.0, 54.0, 35.0, 40.0, 39.0, 20.0, 30.0, 19.0, 18.0, 18.0, 11.0, 10.0, 10.0, 12.0, 7.0, 12.0, 1.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0], "bins": [-1.3603515625, -1.3231658935546875, -1.285980224609375, -1.2487945556640625, -1.21160888671875, -1.1744232177734375, -1.137237548828125, -1.1000518798828125, -1.0628662109375, -1.0256805419921875, -0.988494873046875, -0.9513092041015625, -0.91412353515625, -0.8769378662109375, -0.839752197265625, -0.8025665283203125, -0.765380859375, -0.7281951904296875, -0.691009521484375, -0.6538238525390625, -0.61663818359375, -0.5794525146484375, -0.542266845703125, -0.5050811767578125, -0.4678955078125, -0.4307098388671875, -0.393524169921875, -0.3563385009765625, -0.31915283203125, -0.2819671630859375, -0.244781494140625, -0.2075958251953125, -0.17041015625, -0.1332244873046875, -0.096038818359375, -0.0588531494140625, -0.02166748046875, 0.0155181884765625, 0.052703857421875, 0.0898895263671875, 0.1270751953125, 0.1642608642578125, 0.201446533203125, 0.2386322021484375, 0.27581787109375, 0.3130035400390625, 0.350189208984375, 0.3873748779296875, 0.424560546875, 0.4617462158203125, 0.498931884765625, 0.5361175537109375, 0.57330322265625, 0.6104888916015625, 0.647674560546875, 0.6848602294921875, 0.7220458984375, 0.7592315673828125, 0.796417236328125, 0.8336029052734375, 0.87078857421875, 0.9079742431640625, 0.945159912109375, 0.9823455810546875, 1.01953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 7.0, 13.0, 9.0, 19.0, 14.0, 28.0, 43.0, 56.0, 80.0, 121.0, 227.0, 444.0, 830.0, 2227.0, 6488.0, 23249.0, 103614.0, 465272.0, 349660.0, 70975.0, 16821.0, 4966.0, 1711.0, 727.0, 373.0, 216.0, 112.0, 72.0, 38.0, 35.0, 40.0, 13.0, 8.0, 13.0, 6.0, 10.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1634521484375, -0.15798187255859375, -0.1525115966796875, -0.14704132080078125, -0.141571044921875, -0.13610076904296875, -0.1306304931640625, -0.12516021728515625, -0.11968994140625, -0.11421966552734375, -0.1087493896484375, -0.10327911376953125, -0.097808837890625, -0.09233856201171875, -0.0868682861328125, -0.08139801025390625, -0.075927734375, -0.07045745849609375, -0.0649871826171875, -0.05951690673828125, -0.054046630859375, -0.04857635498046875, -0.0431060791015625, -0.03763580322265625, -0.03216552734375, -0.02669525146484375, -0.0212249755859375, -0.01575469970703125, -0.010284423828125, -0.00481414794921875, 0.0006561279296875, 0.00612640380859375, 0.0115966796875, 0.01706695556640625, 0.0225372314453125, 0.02800750732421875, 0.033477783203125, 0.03894805908203125, 0.0444183349609375, 0.04988861083984375, 0.05535888671875, 0.06082916259765625, 0.0662994384765625, 0.07176971435546875, 0.077239990234375, 0.08271026611328125, 0.0881805419921875, 0.09365081787109375, 0.09912109375, 0.10459136962890625, 0.1100616455078125, 0.11553192138671875, 0.121002197265625, 0.12647247314453125, 0.1319427490234375, 0.13741302490234375, 0.14288330078125, 0.14835357666015625, 0.1538238525390625, 0.15929412841796875, 0.164764404296875, 0.17023468017578125, 0.1757049560546875, 0.18117523193359375, 0.1866455078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 13.0, 12.0, 14.0, 19.0, 17.0, 37.0, 39.0, 47.0, 53.0, 66.0, 92.0, 96.0, 81.0, 83.0, 42.0, 49.0, 39.0, 30.0, 38.0, 34.0, 8.0, 15.0, 15.0, 13.0, 6.0, 9.0, 8.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4616718292236328e-05, -2.3817643523216248e-05, -2.3018568754196167e-05, -2.2219493985176086e-05, -2.1420419216156006e-05, -2.0621344447135925e-05, -1.9822269678115845e-05, -1.9023194909095764e-05, -1.8224120140075684e-05, -1.7425045371055603e-05, -1.6625970602035522e-05, -1.5826895833015442e-05, -1.5027821063995361e-05, -1.422874629497528e-05, -1.34296715259552e-05, -1.263059675693512e-05, -1.1831521987915039e-05, -1.1032447218894958e-05, -1.0233372449874878e-05, -9.434297680854797e-06, -8.635222911834717e-06, -7.836148142814636e-06, -7.037073373794556e-06, -6.237998604774475e-06, -5.4389238357543945e-06, -4.639849066734314e-06, -3.840774297714233e-06, -3.041699528694153e-06, -2.2426247596740723e-06, -1.4435499906539917e-06, -6.444752216339111e-07, 1.5459954738616943e-07, 9.5367431640625e-07, 1.7527490854263306e-06, 2.551823854446411e-06, 3.3508986234664917e-06, 4.149973392486572e-06, 4.949048161506653e-06, 5.748122930526733e-06, 6.547197699546814e-06, 7.3462724685668945e-06, 8.145347237586975e-06, 8.944422006607056e-06, 9.743496775627136e-06, 1.0542571544647217e-05, 1.1341646313667297e-05, 1.2140721082687378e-05, 1.2939795851707458e-05, 1.3738870620727539e-05, 1.453794538974762e-05, 1.53370201587677e-05, 1.613609492778778e-05, 1.693516969680786e-05, 1.7734244465827942e-05, 1.8533319234848022e-05, 1.9332394003868103e-05, 2.0131468772888184e-05, 2.0930543541908264e-05, 2.1729618310928345e-05, 2.2528693079948425e-05, 2.3327767848968506e-05, 2.4126842617988586e-05, 2.4925917387008667e-05, 2.5724992156028748e-05, 2.6524066925048828e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 11.0, 23.0, 25.0, 51.0, 63.0, 126.0, 218.0, 349.0, 680.0, 1319.0, 2810.0, 7821.0, 22574.0, 82795.0, 345696.0, 427833.0, 110891.0, 28993.0, 9321.0, 3604.0, 1592.0, 747.0, 420.0, 225.0, 134.0, 77.0, 50.0, 27.0, 16.0, 17.0, 9.0, 7.0, 6.0, 2.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1788330078125, -0.1740131378173828, -0.16919326782226562, -0.16437339782714844, -0.15955352783203125, -0.15473365783691406, -0.14991378784179688, -0.1450939178466797, -0.1402740478515625, -0.1354541778564453, -0.13063430786132812, -0.12581443786621094, -0.12099456787109375, -0.11617469787597656, -0.11135482788085938, -0.10653495788574219, -0.101715087890625, -0.09689521789550781, -0.09207534790039062, -0.08725547790527344, -0.08243560791015625, -0.07761573791503906, -0.07279586791992188, -0.06797599792480469, -0.0631561279296875, -0.05833625793457031, -0.053516387939453125, -0.04869651794433594, -0.04387664794921875, -0.03905677795410156, -0.034236907958984375, -0.029417037963867188, -0.02459716796875, -0.019777297973632812, -0.014957427978515625, -0.010137557983398438, -0.00531768798828125, -0.0004978179931640625, 0.004322052001953125, 0.009141921997070312, 0.0139617919921875, 0.018781661987304688, 0.023601531982421875, 0.028421401977539062, 0.03324127197265625, 0.03806114196777344, 0.042881011962890625, 0.04770088195800781, 0.052520751953125, 0.05734062194824219, 0.062160491943359375, 0.06698036193847656, 0.07180023193359375, 0.07662010192871094, 0.08143997192382812, 0.08625984191894531, 0.0910797119140625, 0.09589958190917969, 0.10071945190429688, 0.10553932189941406, 0.11035919189453125, 0.11517906188964844, 0.11999893188476562, 0.12481880187988281, 0.129638671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 11.0, 9.0, 14.0, 18.0, 18.0, 31.0, 44.0, 44.0, 59.0, 66.0, 71.0, 77.0, 70.0, 76.0, 74.0, 61.0, 59.0, 36.0, 27.0, 30.0, 21.0, 25.0, 14.0, 6.0, 7.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059844970703125, -0.05748319625854492, -0.055121421813964844, -0.052759647369384766, -0.05039787292480469, -0.04803609848022461, -0.04567432403564453, -0.04331254959106445, -0.040950775146484375, -0.0385890007019043, -0.03622722625732422, -0.03386545181274414, -0.03150367736816406, -0.029141902923583984, -0.026780128479003906, -0.024418354034423828, -0.02205657958984375, -0.019694805145263672, -0.017333030700683594, -0.014971256256103516, -0.012609481811523438, -0.01024770736694336, -0.007885932922363281, -0.005524158477783203, -0.003162384033203125, -0.0008006095886230469, 0.0015611648559570312, 0.003922939300537109, 0.0062847137451171875, 0.008646488189697266, 0.011008262634277344, 0.013370037078857422, 0.0157318115234375, 0.018093585968017578, 0.020455360412597656, 0.022817134857177734, 0.025178909301757812, 0.02754068374633789, 0.02990245819091797, 0.03226423263549805, 0.034626007080078125, 0.0369877815246582, 0.03934955596923828, 0.04171133041381836, 0.04407310485839844, 0.046434879302978516, 0.048796653747558594, 0.05115842819213867, 0.05352020263671875, 0.05588197708129883, 0.058243751525878906, 0.060605525970458984, 0.06296730041503906, 0.06532907485961914, 0.06769084930419922, 0.0700526237487793, 0.07241439819335938, 0.07477617263793945, 0.07713794708251953, 0.07949972152709961, 0.08186149597167969, 0.08422327041625977, 0.08658504486083984, 0.08894681930541992, 0.09130859375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 10.0, 7.0, 22.0, 65.0, 138.0, 229.0, 271.0, 136.0, 65.0, 22.0, 15.0, 9.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.673368453979492, -5.557599067687988, -5.441829204559326, -5.326059818267822, -5.210290431976318, -5.094520568847656, -4.978751182556152, -4.862981796264648, -4.747211933135986, -4.631442546844482, -4.51567268371582, -4.399903297424316, -4.2841339111328125, -4.16836404800415, -4.0525946617126465, -3.9368250370025635, -3.8210556507110596, -3.7052860260009766, -3.5895166397094727, -3.4737470149993896, -3.3579773902893066, -3.2422080039978027, -3.1264383792877197, -3.0106687545776367, -2.894899368286133, -2.77912974357605, -2.663360357284546, -2.547590732574463, -2.43182110786438, -2.316051483154297, -2.200282096862793, -2.08451247215271, -1.9687429666519165, -1.852973461151123, -1.73720383644104, -1.6214343309402466, -1.5056648254394531, -1.3898952007293701, -1.2741256952285767, -1.1583561897277832, -1.0425865650177002, -0.926816999912262, -0.8110474348068237, -0.6952779293060303, -0.579508364200592, -0.4637387990951538, -0.34796929359436035, -0.23219972848892212, -0.11643016338348389, -0.0006606131792068481, 0.11510893702507019, 0.23087847232818604, 0.34664803743362427, 0.4624176025390625, 0.578187108039856, 0.6939566731452942, 0.8097262382507324, 0.9254958033561707, 1.0412653684616089, 1.1570348739624023, 1.2728044986724854, 1.3885740041732788, 1.5043435096740723, 1.6201131343841553, 1.7358826398849487]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 6.0, 0.0, 7.0, 8.0, 6.0, 7.0, 15.0, 14.0, 26.0, 30.0, 28.0, 27.0, 32.0, 40.0, 44.0, 47.0, 56.0, 43.0, 55.0, 52.0, 52.0, 51.0, 40.0, 40.0, 41.0, 40.0, 37.0, 20.0, 38.0, 27.0, 12.0, 10.0, 14.0, 12.0, 8.0, 6.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1390507221221924, -2.0691416263580322, -1.999232530593872, -1.929323434829712, -1.8594143390655518, -1.7895052433013916, -1.719596266746521, -1.6496871709823608, -1.5797780752182007, -1.5098689794540405, -1.4399598836898804, -1.3700507879257202, -1.3001418113708496, -1.2302327156066895, -1.1603236198425293, -1.0904145240783691, -1.020505428314209, -0.9505963325500488, -0.8806872367858887, -0.8107782006263733, -0.7408691048622131, -0.670960009098053, -0.6010509729385376, -0.5311418771743774, -0.4612327814102173, -0.39132368564605713, -0.32141461968421936, -0.2515055537223816, -0.18159645795822144, -0.11168736219406128, -0.04177829623222351, 0.028130769729614258, 0.09803962707519531, 0.16794870793819427, 0.23785778880119324, 0.307766854763031, 0.37767595052719116, 0.4475850462913513, 0.5174940824508667, 0.5874031782150269, 0.657312273979187, 0.7272213697433472, 0.7971304655075073, 0.8670395016670227, 0.9369485974311829, 1.0068576335906982, 1.0767667293548584, 1.1466758251190186, 1.2165849208831787, 1.2864940166473389, 1.356403112411499, 1.4263122081756592, 1.4962213039398193, 1.5661303997039795, 1.63603937625885, 1.7059484720230103, 1.7758575677871704, 1.8457666635513306, 1.9156757593154907, 1.9855848550796509, 2.0554938316345215, 2.1254029273986816, 2.195312023162842, 2.265221118927002, 2.335130214691162]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 9.0, 12.0, 18.0, 31.0, 33.0, 51.0, 61.0, 90.0, 164.0, 238.0, 421.0, 759.0, 1436.0, 3194.0, 8041.0, 26283.0, 129381.0, 1486747.0, 2300008.0, 186854.0, 33176.0, 9848.0, 3775.0, 1616.0, 775.0, 467.0, 273.0, 156.0, 110.0, 86.0, 58.0, 28.0, 22.0, 20.0, 12.0, 8.0, 1.0, 4.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.12109375, -1.0908660888671875, -1.060638427734375, -1.0304107666015625, -1.00018310546875, -0.9699554443359375, -0.939727783203125, -0.9095001220703125, -0.8792724609375, -0.8490447998046875, -0.818817138671875, -0.7885894775390625, -0.75836181640625, -0.7281341552734375, -0.697906494140625, -0.6676788330078125, -0.637451171875, -0.6072235107421875, -0.576995849609375, -0.5467681884765625, -0.51654052734375, -0.4863128662109375, -0.456085205078125, -0.4258575439453125, -0.3956298828125, -0.3654022216796875, -0.335174560546875, -0.3049468994140625, -0.27471923828125, -0.2444915771484375, -0.214263916015625, -0.1840362548828125, -0.15380859375, -0.1235809326171875, -0.093353271484375, -0.0631256103515625, -0.03289794921875, -0.0026702880859375, 0.027557373046875, 0.0577850341796875, 0.0880126953125, 0.1182403564453125, 0.148468017578125, 0.1786956787109375, 0.20892333984375, 0.2391510009765625, 0.269378662109375, 0.2996063232421875, 0.329833984375, 0.3600616455078125, 0.390289306640625, 0.4205169677734375, 0.45074462890625, 0.4809722900390625, 0.511199951171875, 0.5414276123046875, 0.5716552734375, 0.6018829345703125, 0.632110595703125, 0.6623382568359375, 0.69256591796875, 0.7227935791015625, 0.753021240234375, 0.7832489013671875, 0.8134765625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 2.0, 5.0, 7.0, 10.0, 5.0, 12.0, 10.0, 20.0, 17.0, 14.0, 21.0, 36.0, 38.0, 53.0, 39.0, 64.0, 46.0, 52.0, 56.0, 60.0, 53.0, 46.0, 42.0, 53.0, 35.0, 46.0, 31.0, 16.0, 13.0, 17.0, 10.0, 11.0, 12.0, 6.0, 11.0, 3.0, 7.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.53271484375, -0.51336669921875, -0.4940185546875, -0.47467041015625, -0.455322265625, -0.43597412109375, -0.4166259765625, -0.39727783203125, -0.3779296875, -0.35858154296875, -0.3392333984375, -0.31988525390625, -0.300537109375, -0.28118896484375, -0.2618408203125, -0.24249267578125, -0.22314453125, -0.20379638671875, -0.1844482421875, -0.16510009765625, -0.145751953125, -0.12640380859375, -0.1070556640625, -0.08770751953125, -0.068359375, -0.04901123046875, -0.0296630859375, -0.01031494140625, 0.009033203125, 0.02838134765625, 0.0477294921875, 0.06707763671875, 0.08642578125, 0.10577392578125, 0.1251220703125, 0.14447021484375, 0.163818359375, 0.18316650390625, 0.2025146484375, 0.22186279296875, 0.2412109375, 0.26055908203125, 0.2799072265625, 0.29925537109375, 0.318603515625, 0.33795166015625, 0.3572998046875, 0.37664794921875, 0.39599609375, 0.41534423828125, 0.4346923828125, 0.45404052734375, 0.473388671875, 0.49273681640625, 0.5120849609375, 0.53143310546875, 0.55078125, 0.57012939453125, 0.5894775390625, 0.60882568359375, 0.628173828125, 0.64752197265625, 0.6668701171875, 0.68621826171875, 0.70556640625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 3.0, 9.0, 14.0, 18.0, 15.0, 35.0, 60.0, 81.0, 150.0, 354.0, 1008.0, 5725.0, 116085.0, 3986414.0, 77983.0, 4795.0, 862.0, 292.0, 132.0, 64.0, 60.0, 31.0, 16.0, 9.0, 6.0, 15.0, 8.0, 12.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.755859375, -1.69189453125, -1.6279296875, -1.56396484375, -1.5, -1.43603515625, -1.3720703125, -1.30810546875, -1.244140625, -1.18017578125, -1.1162109375, -1.05224609375, -0.98828125, -0.92431640625, -0.8603515625, -0.79638671875, -0.732421875, -0.66845703125, -0.6044921875, -0.54052734375, -0.4765625, -0.41259765625, -0.3486328125, -0.28466796875, -0.220703125, -0.15673828125, -0.0927734375, -0.02880859375, 0.03515625, 0.09912109375, 0.1630859375, 0.22705078125, 0.291015625, 0.35498046875, 0.4189453125, 0.48291015625, 0.546875, 0.61083984375, 0.6748046875, 0.73876953125, 0.802734375, 0.86669921875, 0.9306640625, 0.99462890625, 1.05859375, 1.12255859375, 1.1865234375, 1.25048828125, 1.314453125, 1.37841796875, 1.4423828125, 1.50634765625, 1.5703125, 1.63427734375, 1.6982421875, 1.76220703125, 1.826171875, 1.89013671875, 1.9541015625, 2.01806640625, 2.08203125, 2.14599609375, 2.2099609375, 2.27392578125, 2.337890625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 6.0, 8.0, 8.0, 14.0, 18.0, 28.0, 31.0, 45.0, 80.0, 108.0, 154.0, 320.0, 568.0, 791.0, 744.0, 419.0, 250.0, 128.0, 106.0, 81.0, 54.0, 29.0, 24.0, 13.0, 15.0, 11.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.299072265625, -0.2909526824951172, -0.2828330993652344, -0.27471351623535156, -0.26659393310546875, -0.25847434997558594, -0.2503547668457031, -0.2422351837158203, -0.2341156005859375, -0.2259960174560547, -0.21787643432617188, -0.20975685119628906, -0.20163726806640625, -0.19351768493652344, -0.18539810180664062, -0.1772785186767578, -0.169158935546875, -0.1610393524169922, -0.15291976928710938, -0.14480018615722656, -0.13668060302734375, -0.12856101989746094, -0.12044143676757812, -0.11232185363769531, -0.1042022705078125, -0.09608268737792969, -0.08796310424804688, -0.07984352111816406, -0.07172393798828125, -0.06360435485839844, -0.055484771728515625, -0.04736518859863281, -0.03924560546875, -0.031126022338867188, -0.023006439208984375, -0.014886856079101562, -0.00676727294921875, 0.0013523101806640625, 0.009471893310546875, 0.017591476440429688, 0.0257110595703125, 0.03383064270019531, 0.041950225830078125, 0.05006980895996094, 0.05818939208984375, 0.06630897521972656, 0.07442855834960938, 0.08254814147949219, 0.090667724609375, 0.09878730773925781, 0.10690689086914062, 0.11502647399902344, 0.12314605712890625, 0.13126564025878906, 0.13938522338867188, 0.1475048065185547, 0.1556243896484375, 0.1637439727783203, 0.17186355590820312, 0.17998313903808594, 0.18810272216796875, 0.19622230529785156, 0.20434188842773438, 0.2124614715576172, 0.2205810546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 16.0, 24.0, 59.0, 97.0, 120.0, 147.0, 165.0, 121.0, 94.0, 51.0, 32.0, 15.0, 17.0, 8.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8327101469039917, -1.780419111251831, -1.72812819480896, -1.6758371591567993, -1.6235461235046387, -1.5712552070617676, -1.518964171409607, -1.4666731357574463, -1.4143821001052856, -1.362091064453125, -1.309800148010254, -1.2575091123580933, -1.2052180767059326, -1.1529271602630615, -1.1006361246109009, -1.0483450889587402, -0.9960541129112244, -0.9437631368637085, -0.8914721012115479, -0.839181125164032, -0.7868900895118713, -0.7345991134643555, -0.6823080778121948, -0.630017101764679, -0.5777261257171631, -0.5254351496696472, -0.4731441140174866, -0.4208531379699707, -0.36856210231781006, -0.3162711262702942, -0.26398012042045593, -0.21168911457061768, -0.15939807891845703, -0.10710707306861877, -0.054816074669361115, -0.0025250762701034546, 0.0497659295797348, 0.10205692052841187, 0.15434792637825012, 0.20663893222808838, 0.25892993807792664, 0.3112209439277649, 0.36351194977760315, 0.4158029556274414, 0.4680939316749573, 0.5203849077224731, 0.5726759433746338, 0.6249669790267944, 0.6772579550743103, 0.7295489311218262, 0.7818399667739868, 0.8341309428215027, 0.8864219784736633, 0.9387129545211792, 0.9910039901733398, 1.043294906616211, 1.0955859422683716, 1.1478769779205322, 1.2001678943634033, 1.252458930015564, 1.3047499656677246, 1.3570408821105957, 1.4093319177627563, 1.461622953414917, 1.5139139890670776]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 0.0, 2.0, 3.0, 6.0, 3.0, 13.0, 9.0, 14.0, 19.0, 24.0, 20.0, 26.0, 33.0, 45.0, 41.0, 54.0, 43.0, 58.0, 60.0, 48.0, 54.0, 57.0, 46.0, 55.0, 53.0, 35.0, 42.0, 27.0, 19.0, 20.0, 7.0, 19.0, 6.0, 10.0, 5.0, 5.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6084237098693848, -0.586319625377655, -0.5642154812812805, -0.5421113967895508, -0.520007312297821, -0.4979031980037689, -0.4757990837097168, -0.45369499921798706, -0.4315909147262573, -0.4094868004322052, -0.38738271594047546, -0.36527860164642334, -0.3431745171546936, -0.3210704028606415, -0.29896628856658936, -0.2768622040748596, -0.2547580897808075, -0.23265399038791656, -0.21054989099502563, -0.1884457767009735, -0.16634169220924377, -0.14423757791519165, -0.12213347852230072, -0.10002937912940979, -0.07792527973651886, -0.05582118034362793, -0.0337170772254467, -0.011612974107265472, 0.010491125285625458, 0.03259522467851639, 0.054699331521987915, 0.07680343091487885, 0.09890753030776978, 0.1210116297006607, 0.14311572909355164, 0.16521984338760376, 0.1873239278793335, 0.20942804217338562, 0.23153214156627655, 0.2536362409591675, 0.2757403254508972, 0.29784443974494934, 0.3199485242366791, 0.3420526385307312, 0.36415672302246094, 0.38626083731651306, 0.4083649516105652, 0.4304690361022949, 0.45257315039634705, 0.47467726469039917, 0.4967813491821289, 0.5188854336738586, 0.5409895777702332, 0.5630936622619629, 0.5851977467536926, 0.6073018312454224, 0.6294059753417969, 0.6515100598335266, 0.6736142039299011, 0.6957182884216309, 0.7178223729133606, 0.7399264574050903, 0.7620306015014648, 0.7841346859931946, 0.8062387704849243]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 13.0, 23.0, 25.0, 46.0, 79.0, 115.0, 216.0, 330.0, 709.0, 1566.0, 3354.0, 7958.0, 22533.0, 72567.0, 296024.0, 462914.0, 124421.0, 34686.0, 11878.0, 4866.0, 2135.0, 954.0, 504.0, 262.0, 139.0, 89.0, 44.0, 25.0, 29.0, 14.0, 8.0, 7.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.1577739715576172, -0.15197372436523438, -0.14617347717285156, -0.14037322998046875, -0.13457298278808594, -0.12877273559570312, -0.12297248840332031, -0.1171722412109375, -0.11137199401855469, -0.10557174682617188, -0.09977149963378906, -0.09397125244140625, -0.08817100524902344, -0.08237075805664062, -0.07657051086425781, -0.070770263671875, -0.06497001647949219, -0.059169769287109375, -0.05336952209472656, -0.04756927490234375, -0.04176902770996094, -0.035968780517578125, -0.030168533325195312, -0.0243682861328125, -0.018568038940429688, -0.012767791748046875, -0.0069675445556640625, -0.00116729736328125, 0.0046329498291015625, 0.010433197021484375, 0.016233444213867188, 0.02203369140625, 0.027833938598632812, 0.033634185791015625, 0.03943443298339844, 0.04523468017578125, 0.05103492736816406, 0.056835174560546875, 0.06263542175292969, 0.0684356689453125, 0.07423591613769531, 0.08003616333007812, 0.08583641052246094, 0.09163665771484375, 0.09743690490722656, 0.10323715209960938, 0.10903739929199219, 0.114837646484375, 0.12063789367675781, 0.12643814086914062, 0.13223838806152344, 0.13803863525390625, 0.14383888244628906, 0.14963912963867188, 0.1554393768310547, 0.1612396240234375, 0.1670398712158203, 0.17284011840820312, 0.17864036560058594, 0.18444061279296875, 0.19024085998535156, 0.19604110717773438, 0.2018413543701172, 0.2076416015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 1.0, 5.0, 2.0, 4.0, 13.0, 16.0, 10.0, 19.0, 22.0, 28.0, 48.0, 48.0, 55.0, 67.0, 87.0, 77.0, 71.0, 69.0, 72.0, 73.0, 51.0, 48.0, 28.0, 17.0, 15.0, 14.0, 11.0, 10.0, 2.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48046875, -0.46120452880859375, -0.4419403076171875, -0.42267608642578125, -0.403411865234375, -0.38414764404296875, -0.3648834228515625, -0.34561920166015625, -0.32635498046875, -0.30709075927734375, -0.2878265380859375, -0.26856231689453125, -0.249298095703125, -0.23003387451171875, -0.2107696533203125, -0.19150543212890625, -0.1722412109375, -0.15297698974609375, -0.1337127685546875, -0.11444854736328125, -0.095184326171875, -0.07592010498046875, -0.0566558837890625, -0.03739166259765625, -0.01812744140625, 0.00113677978515625, 0.0204010009765625, 0.03966522216796875, 0.058929443359375, 0.07819366455078125, 0.0974578857421875, 0.11672210693359375, 0.135986328125, 0.15525054931640625, 0.1745147705078125, 0.19377899169921875, 0.213043212890625, 0.23230743408203125, 0.2515716552734375, 0.27083587646484375, 0.29010009765625, 0.30936431884765625, 0.3286285400390625, 0.34789276123046875, 0.367156982421875, 0.38642120361328125, 0.4056854248046875, 0.42494964599609375, 0.4442138671875, 0.46347808837890625, 0.4827423095703125, 0.5020065307617188, 0.521270751953125, 0.5405349731445312, 0.5597991943359375, 0.5790634155273438, 0.59832763671875, 0.6175918579101562, 0.6368560791015625, 0.6561203002929688, 0.675384521484375, 0.6946487426757812, 0.7139129638671875, 0.7331771850585938, 0.75244140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 3.0, 5.0, 10.0, 14.0, 20.0, 20.0, 35.0, 56.0, 78.0, 130.0, 187.0, 367.0, 669.0, 1501.0, 3642.0, 11155.0, 44158.0, 233856.0, 571010.0, 139780.0, 28753.0, 7798.0, 2773.0, 1165.0, 569.0, 291.0, 177.0, 106.0, 69.0, 54.0, 46.0, 31.0, 12.0, 7.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2052001953125, -0.19939613342285156, -0.19359207153320312, -0.1877880096435547, -0.18198394775390625, -0.1761798858642578, -0.17037582397460938, -0.16457176208496094, -0.1587677001953125, -0.15296363830566406, -0.14715957641601562, -0.1413555145263672, -0.13555145263671875, -0.1297473907470703, -0.12394332885742188, -0.11813926696777344, -0.112335205078125, -0.10653114318847656, -0.10072708129882812, -0.09492301940917969, -0.08911895751953125, -0.08331489562988281, -0.07751083374023438, -0.07170677185058594, -0.0659027099609375, -0.06009864807128906, -0.054294586181640625, -0.04849052429199219, -0.04268646240234375, -0.03688240051269531, -0.031078338623046875, -0.025274276733398438, -0.01947021484375, -0.013666152954101562, -0.007862091064453125, -0.0020580291748046875, 0.00374603271484375, 0.009550094604492188, 0.015354156494140625, 0.021158218383789062, 0.0269622802734375, 0.03276634216308594, 0.038570404052734375, 0.04437446594238281, 0.05017852783203125, 0.05598258972167969, 0.061786651611328125, 0.06759071350097656, 0.073394775390625, 0.07919883728027344, 0.08500289916992188, 0.09080696105957031, 0.09661102294921875, 0.10241508483886719, 0.10821914672851562, 0.11402320861816406, 0.1198272705078125, 0.12563133239746094, 0.13143539428710938, 0.1372394561767578, 0.14304351806640625, 0.1488475799560547, 0.15465164184570312, 0.16045570373535156, 0.166259765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 4.0, 11.0, 5.0, 13.0, 14.0, 6.0, 13.0, 22.0, 21.0, 17.0, 32.0, 25.0, 30.0, 47.0, 34.0, 52.0, 32.0, 44.0, 61.0, 45.0, 49.0, 48.0, 47.0, 38.0, 43.0, 39.0, 28.0, 38.0, 19.0, 20.0, 25.0, 18.0, 13.0, 12.0, 8.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7607421875, -0.73699951171875, -0.7132568359375, -0.68951416015625, -0.665771484375, -0.64202880859375, -0.6182861328125, -0.59454345703125, -0.57080078125, -0.54705810546875, -0.5233154296875, -0.49957275390625, -0.475830078125, -0.45208740234375, -0.4283447265625, -0.40460205078125, -0.380859375, -0.35711669921875, -0.3333740234375, -0.30963134765625, -0.285888671875, -0.26214599609375, -0.2384033203125, -0.21466064453125, -0.19091796875, -0.16717529296875, -0.1434326171875, -0.11968994140625, -0.095947265625, -0.07220458984375, -0.0484619140625, -0.02471923828125, -0.0009765625, 0.02276611328125, 0.0465087890625, 0.07025146484375, 0.093994140625, 0.11773681640625, 0.1414794921875, 0.16522216796875, 0.18896484375, 0.21270751953125, 0.2364501953125, 0.26019287109375, 0.283935546875, 0.30767822265625, 0.3314208984375, 0.35516357421875, 0.37890625, 0.40264892578125, 0.4263916015625, 0.45013427734375, 0.473876953125, 0.49761962890625, 0.5213623046875, 0.54510498046875, 0.56884765625, 0.59259033203125, 0.6163330078125, 0.64007568359375, 0.663818359375, 0.68756103515625, 0.7113037109375, 0.73504638671875, 0.7587890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 5.0, 5.0, 18.0, 14.0, 19.0, 27.0, 52.0, 88.0, 125.0, 218.0, 359.0, 644.0, 1219.0, 2385.0, 5109.0, 12823.0, 36920.0, 135936.0, 493904.0, 262111.0, 62660.0, 19763.0, 7445.0, 3241.0, 1467.0, 786.0, 469.0, 220.0, 197.0, 111.0, 57.0, 45.0, 32.0, 26.0, 14.0, 12.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06683349609375, -0.06485128402709961, -0.06286907196044922, -0.06088685989379883, -0.05890464782714844, -0.05692243576049805, -0.054940223693847656, -0.052958011627197266, -0.050975799560546875, -0.048993587493896484, -0.047011375427246094, -0.0450291633605957, -0.04304695129394531, -0.04106473922729492, -0.03908252716064453, -0.03710031509399414, -0.03511810302734375, -0.03313589096069336, -0.03115367889404297, -0.029171466827392578, -0.027189254760742188, -0.025207042694091797, -0.023224830627441406, -0.021242618560791016, -0.019260406494140625, -0.017278194427490234, -0.015295982360839844, -0.013313770294189453, -0.011331558227539062, -0.009349346160888672, -0.007367134094238281, -0.005384922027587891, -0.0034027099609375, -0.0014204978942871094, 0.0005617141723632812, 0.002543926239013672, 0.0045261383056640625, 0.006508350372314453, 0.008490562438964844, 0.010472774505615234, 0.012454986572265625, 0.014437198638916016, 0.016419410705566406, 0.018401622772216797, 0.020383834838867188, 0.022366046905517578, 0.02434825897216797, 0.02633047103881836, 0.02831268310546875, 0.03029489517211914, 0.03227710723876953, 0.03425931930541992, 0.03624153137207031, 0.0382237434387207, 0.040205955505371094, 0.042188167572021484, 0.044170379638671875, 0.046152591705322266, 0.048134803771972656, 0.05011701583862305, 0.05209922790527344, 0.05408143997192383, 0.05606365203857422, 0.05804586410522461, 0.060028076171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 8.0, 11.0, 12.0, 24.0, 20.0, 43.0, 46.0, 58.0, 87.0, 113.0, 134.0, 128.0, 85.0, 68.0, 34.0, 43.0, 18.0, 16.0, 11.0, 9.0, 5.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17692756652832e-05, -3.0279159545898438e-05, -2.8789043426513672e-05, -2.7298927307128906e-05, -2.580881118774414e-05, -2.4318695068359375e-05, -2.282857894897461e-05, -2.1338462829589844e-05, -1.9848346710205078e-05, -1.8358230590820312e-05, -1.6868114471435547e-05, -1.537799835205078e-05, -1.3887882232666016e-05, -1.239776611328125e-05, -1.0907649993896484e-05, -9.417533874511719e-06, -7.927417755126953e-06, -6.4373016357421875e-06, -4.947185516357422e-06, -3.4570693969726562e-06, -1.9669532775878906e-06, -4.76837158203125e-07, 1.0132789611816406e-06, 2.5033950805664062e-06, 3.993511199951172e-06, 5.4836273193359375e-06, 6.973743438720703e-06, 8.463859558105469e-06, 9.953975677490234e-06, 1.1444091796875e-05, 1.2934207916259766e-05, 1.4424324035644531e-05, 1.5914440155029297e-05, 1.7404556274414062e-05, 1.8894672393798828e-05, 2.0384788513183594e-05, 2.187490463256836e-05, 2.3365020751953125e-05, 2.485513687133789e-05, 2.6345252990722656e-05, 2.7835369110107422e-05, 2.9325485229492188e-05, 3.081560134887695e-05, 3.230571746826172e-05, 3.3795833587646484e-05, 3.528594970703125e-05, 3.6776065826416016e-05, 3.826618194580078e-05, 3.975629806518555e-05, 4.124641418457031e-05, 4.273653030395508e-05, 4.4226646423339844e-05, 4.571676254272461e-05, 4.7206878662109375e-05, 4.869699478149414e-05, 5.0187110900878906e-05, 5.167722702026367e-05, 5.316734313964844e-05, 5.46574592590332e-05, 5.614757537841797e-05, 5.7637691497802734e-05, 5.91278076171875e-05, 6.0617923736572266e-05, 6.210803985595703e-05, 6.35981559753418e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 6.0, 3.0, 5.0, 10.0, 16.0, 31.0, 33.0, 59.0, 90.0, 143.0, 232.0, 457.0, 869.0, 1929.0, 4378.0, 11090.0, 31345.0, 100134.0, 354506.0, 378828.0, 109563.0, 34002.0, 12042.0, 4793.0, 1957.0, 944.0, 469.0, 239.0, 144.0, 83.0, 47.0, 29.0, 23.0, 16.0, 15.0, 10.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061309814453125, -0.05933427810668945, -0.057358741760253906, -0.05538320541381836, -0.05340766906738281, -0.051432132720947266, -0.04945659637451172, -0.04748106002807617, -0.045505523681640625, -0.04352998733520508, -0.04155445098876953, -0.039578914642333984, -0.03760337829589844, -0.03562784194946289, -0.033652305603027344, -0.0316767692565918, -0.02970123291015625, -0.027725696563720703, -0.025750160217285156, -0.02377462387084961, -0.021799087524414062, -0.019823551177978516, -0.01784801483154297, -0.015872478485107422, -0.013896942138671875, -0.011921405792236328, -0.009945869445800781, -0.007970333099365234, -0.0059947967529296875, -0.004019260406494141, -0.0020437240600585938, -6.818771362304688e-05, 0.0019073486328125, 0.003882884979248047, 0.005858421325683594, 0.00783395767211914, 0.009809494018554688, 0.011785030364990234, 0.013760566711425781, 0.015736103057861328, 0.017711639404296875, 0.019687175750732422, 0.02166271209716797, 0.023638248443603516, 0.025613784790039062, 0.02758932113647461, 0.029564857482910156, 0.0315403938293457, 0.03351593017578125, 0.0354914665222168, 0.037467002868652344, 0.03944253921508789, 0.04141807556152344, 0.043393611907958984, 0.04536914825439453, 0.04734468460083008, 0.049320220947265625, 0.05129575729370117, 0.05327129364013672, 0.055246829986572266, 0.05722236633300781, 0.05919790267944336, 0.061173439025878906, 0.06314897537231445, 0.06512451171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 2.0, 3.0, 4.0, 9.0, 4.0, 10.0, 9.0, 14.0, 11.0, 22.0, 12.0, 26.0, 35.0, 31.0, 33.0, 40.0, 46.0, 57.0, 71.0, 72.0, 60.0, 47.0, 58.0, 45.0, 40.0, 43.0, 31.0, 32.0, 23.0, 23.0, 13.0, 10.0, 13.0, 14.0, 11.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.013397216796875, -0.012999773025512695, -0.01260232925415039, -0.012204885482788086, -0.011807441711425781, -0.011409997940063477, -0.011012554168701172, -0.010615110397338867, -0.010217666625976562, -0.009820222854614258, -0.009422779083251953, -0.009025335311889648, -0.008627891540527344, -0.008230447769165039, -0.007833003997802734, -0.00743556022644043, -0.007038116455078125, -0.00664067268371582, -0.006243228912353516, -0.005845785140991211, -0.005448341369628906, -0.0050508975982666016, -0.004653453826904297, -0.004256010055541992, -0.0038585662841796875, -0.003461122512817383, -0.003063678741455078, -0.0026662349700927734, -0.0022687911987304688, -0.001871347427368164, -0.0014739036560058594, -0.0010764598846435547, -0.00067901611328125, -0.0002815723419189453, 0.00011587142944335938, 0.0005133152008056641, 0.0009107589721679688, 0.0013082027435302734, 0.0017056465148925781, 0.002103090286254883, 0.0025005340576171875, 0.002897977828979492, 0.003295421600341797, 0.0036928653717041016, 0.004090309143066406, 0.004487752914428711, 0.004885196685791016, 0.00528264045715332, 0.005680084228515625, 0.00607752799987793, 0.006474971771240234, 0.006872415542602539, 0.007269859313964844, 0.0076673030853271484, 0.008064746856689453, 0.008462190628051758, 0.008859634399414062, 0.009257078170776367, 0.009654521942138672, 0.010051965713500977, 0.010449409484863281, 0.010846853256225586, 0.01124429702758789, 0.011641740798950195, 0.0120391845703125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 11.0, 15.0, 36.0, 73.0, 114.0, 190.0, 210.0, 143.0, 93.0, 39.0, 21.0, 22.0, 9.0, 3.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5127205848693848, -1.4721118211746216, -1.4315029382705688, -1.3908941745758057, -1.350285291671753, -1.3096765279769897, -1.2690677642822266, -1.2284588813781738, -1.1878501176834106, -1.1472413539886475, -1.1066324710845947, -1.0660237073898315, -1.0254149436950684, -0.9848060607910156, -0.9441972970962524, -0.9035884737968445, -0.8629796504974365, -0.8223708271980286, -0.7817620038986206, -0.7411532402038574, -0.7005444169044495, -0.6599355936050415, -0.6193268299102783, -0.5787180066108704, -0.5381091833114624, -0.49750036001205444, -0.45689156651496887, -0.4162827730178833, -0.37567394971847534, -0.3350651264190674, -0.2944563329219818, -0.25384753942489624, -0.21323871612548828, -0.17262990772724152, -0.13202109932899475, -0.09141229093074799, -0.05080348253250122, -0.010194674134254456, 0.03041413426399231, 0.07102292776107788, 0.11163175106048584, 0.1522405594587326, 0.19284936785697937, 0.23345817625522614, 0.2740669846534729, 0.31467580795288086, 0.35528460144996643, 0.395893394947052, 0.43650221824645996, 0.4771110415458679, 0.5177198648452759, 0.5583286285400391, 0.598937451839447, 0.639546275138855, 0.6801550388336182, 0.7207638621330261, 0.7613726854324341, 0.801981508731842, 0.84259033203125, 0.8831990957260132, 0.9238079190254211, 0.9644167423248291, 1.0050255060195923, 1.0456342697143555, 1.0862431526184082]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 8.0, 12.0, 16.0, 19.0, 34.0, 39.0, 53.0, 84.0, 61.0, 81.0, 88.0, 86.0, 80.0, 79.0, 68.0, 54.0, 32.0, 26.0, 17.0, 18.0, 12.0, 6.0, 7.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4622107148170471, -0.4412214159965515, -0.4202321171760559, -0.3992428183555603, -0.3782535195350647, -0.3572642207145691, -0.3362749218940735, -0.3152856230735779, -0.2942963242530823, -0.27330702543258667, -0.25231772661209106, -0.23132842779159546, -0.21033912897109985, -0.18934983015060425, -0.16836051642894745, -0.14737121760845184, -0.12638190388679504, -0.10539260506629944, -0.08440330624580383, -0.06341399997472763, -0.042424701154232025, -0.02143540233373642, -0.0004460960626602173, 0.020543202757835388, 0.041532501578330994, 0.0625218003988266, 0.0835110992193222, 0.10450040549039841, 0.1254897117614746, 0.14647901058197021, 0.16746830940246582, 0.18845760822296143, 0.20944690704345703, 0.23043620586395264, 0.25142550468444824, 0.27241480350494385, 0.29340410232543945, 0.31439340114593506, 0.33538269996643066, 0.35637199878692627, 0.3773612976074219, 0.3983505964279175, 0.4193398952484131, 0.4403291940689087, 0.4613184928894043, 0.4823077917098999, 0.5032970905303955, 0.5242863893508911, 0.5452756881713867, 0.5662649869918823, 0.5872542858123779, 0.6082435846328735, 0.6292328834533691, 0.6502221822738647, 0.6712114810943604, 0.692200779914856, 0.7131901383399963, 0.7341794371604919, 0.7551687359809875, 0.7761580348014832, 0.7971473336219788, 0.8181366324424744, 0.83912593126297, 0.8601152300834656, 0.8811045289039612]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 1.0, 5.0, 12.0, 21.0, 26.0, 51.0, 71.0, 170.0, 346.0, 1022.0, 4003.0, 29785.0, 756761.0, 239546.0, 13249.0, 2246.0, 658.0, 266.0, 110.0, 64.0, 34.0, 22.0, 16.0, 18.0, 12.0, 7.0, 6.0, 6.0, 8.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.373046875, -1.3336181640625, -1.294189453125, -1.2547607421875, -1.21533203125, -1.1759033203125, -1.136474609375, -1.0970458984375, -1.0576171875, -1.0181884765625, -0.978759765625, -0.9393310546875, -0.89990234375, -0.8604736328125, -0.821044921875, -0.7816162109375, -0.7421875, -0.7027587890625, -0.663330078125, -0.6239013671875, -0.58447265625, -0.5450439453125, -0.505615234375, -0.4661865234375, -0.4267578125, -0.3873291015625, -0.347900390625, -0.3084716796875, -0.26904296875, -0.2296142578125, -0.190185546875, -0.1507568359375, -0.111328125, -0.0718994140625, -0.032470703125, 0.0069580078125, 0.04638671875, 0.0858154296875, 0.125244140625, 0.1646728515625, 0.2041015625, 0.2435302734375, 0.282958984375, 0.3223876953125, 0.36181640625, 0.4012451171875, 0.440673828125, 0.4801025390625, 0.51953125, 0.5589599609375, 0.598388671875, 0.6378173828125, 0.67724609375, 0.7166748046875, 0.756103515625, 0.7955322265625, 0.8349609375, 0.8743896484375, 0.913818359375, 0.9532470703125, 0.99267578125, 1.0321044921875, 1.071533203125, 1.1109619140625, 1.150390625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 25.0, 34.0, 58.0, 90.0, 93.0, 154.0, 121.0, 120.0, 118.0, 61.0, 35.0, 23.0, 19.0, 16.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95947265625, -0.8924484252929688, -0.8254241943359375, -0.7583999633789062, -0.691375732421875, -0.6243515014648438, -0.5573272705078125, -0.49030303955078125, -0.42327880859375, -0.35625457763671875, -0.2892303466796875, -0.22220611572265625, -0.155181884765625, -0.08815765380859375, -0.0211334228515625, 0.04589080810546875, 0.1129150390625, 0.17993927001953125, 0.2469635009765625, 0.31398773193359375, 0.381011962890625, 0.44803619384765625, 0.5150604248046875, 0.5820846557617188, 0.64910888671875, 0.7161331176757812, 0.7831573486328125, 0.8501815795898438, 0.917205810546875, 0.9842300415039062, 1.0512542724609375, 1.1182785034179688, 1.185302734375, 1.2523269653320312, 1.3193511962890625, 1.3863754272460938, 1.453399658203125, 1.5204238891601562, 1.5874481201171875, 1.6544723510742188, 1.72149658203125, 1.7885208129882812, 1.8555450439453125, 1.9225692749023438, 1.989593505859375, 2.0566177368164062, 2.1236419677734375, 2.1906661987304688, 2.2576904296875, 2.3247146606445312, 2.3917388916015625, 2.4587631225585938, 2.525787353515625, 2.5928115844726562, 2.6598358154296875, 2.7268600463867188, 2.79388427734375, 2.8609085083007812, 2.9279327392578125, 2.9949569702148438, 3.061981201171875, 3.1290054321289062, 3.1960296630859375, 3.2630538940429688, 3.330078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 10.0, 18.0, 9.0, 25.0, 12.0, 22.0, 28.0, 29.0, 48.0, 61.0, 67.0, 97.0, 132.0, 227.0, 500.0, 1553.0, 7529.0, 146891.0, 857348.0, 28591.0, 3382.0, 917.0, 351.0, 180.0, 122.0, 83.0, 77.0, 49.0, 31.0, 27.0, 27.0, 21.0, 14.0, 20.0, 5.0, 8.0, 4.0, 5.0, 6.0, 4.0, 0.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.072265625, -1.0356292724609375, -0.998992919921875, -0.9623565673828125, -0.92572021484375, -0.8890838623046875, -0.852447509765625, -0.8158111572265625, -0.7791748046875, -0.7425384521484375, -0.705902099609375, -0.6692657470703125, -0.63262939453125, -0.5959930419921875, -0.559356689453125, -0.5227203369140625, -0.486083984375, -0.4494476318359375, -0.412811279296875, -0.3761749267578125, -0.33953857421875, -0.3029022216796875, -0.266265869140625, -0.2296295166015625, -0.1929931640625, -0.1563568115234375, -0.119720458984375, -0.0830841064453125, -0.04644775390625, -0.0098114013671875, 0.026824951171875, 0.0634613037109375, 0.10009765625, 0.1367340087890625, 0.173370361328125, 0.2100067138671875, 0.24664306640625, 0.2832794189453125, 0.319915771484375, 0.3565521240234375, 0.3931884765625, 0.4298248291015625, 0.466461181640625, 0.5030975341796875, 0.53973388671875, 0.5763702392578125, 0.613006591796875, 0.6496429443359375, 0.686279296875, 0.7229156494140625, 0.759552001953125, 0.7961883544921875, 0.83282470703125, 0.8694610595703125, 0.906097412109375, 0.9427337646484375, 0.9793701171875, 1.0160064697265625, 1.052642822265625, 1.0892791748046875, 1.12591552734375, 1.1625518798828125, 1.199188232421875, 1.2358245849609375, 1.2724609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 7.0, 10.0, 17.0, 12.0, 14.0, 16.0, 20.0, 28.0, 18.0, 39.0, 27.0, 32.0, 25.0, 35.0, 45.0, 37.0, 44.0, 44.0, 38.0, 51.0, 44.0, 47.0, 45.0, 38.0, 29.0, 38.0, 29.0, 24.0, 17.0, 20.0, 15.0, 21.0, 7.0, 12.0, 6.0, 3.0, 8.0, 6.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.767578125, -0.7418060302734375, -0.716033935546875, -0.6902618408203125, -0.66448974609375, -0.6387176513671875, -0.612945556640625, -0.5871734619140625, -0.5614013671875, -0.5356292724609375, -0.509857177734375, -0.4840850830078125, -0.45831298828125, -0.4325408935546875, -0.406768798828125, -0.3809967041015625, -0.355224609375, -0.3294525146484375, -0.303680419921875, -0.2779083251953125, -0.25213623046875, -0.2263641357421875, -0.200592041015625, -0.1748199462890625, -0.1490478515625, -0.1232757568359375, -0.097503662109375, -0.0717315673828125, -0.04595947265625, -0.0201873779296875, 0.005584716796875, 0.0313568115234375, 0.05712890625, 0.0829010009765625, 0.108673095703125, 0.1344451904296875, 0.16021728515625, 0.1859893798828125, 0.211761474609375, 0.2375335693359375, 0.2633056640625, 0.2890777587890625, 0.314849853515625, 0.3406219482421875, 0.36639404296875, 0.3921661376953125, 0.417938232421875, 0.4437103271484375, 0.469482421875, 0.4952545166015625, 0.521026611328125, 0.5467987060546875, 0.57257080078125, 0.5983428955078125, 0.624114990234375, 0.6498870849609375, 0.6756591796875, 0.7014312744140625, 0.727203369140625, 0.7529754638671875, 0.77874755859375, 0.8045196533203125, 0.830291748046875, 0.8560638427734375, 0.8818359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 2.0, 10.0, 14.0, 23.0, 35.0, 41.0, 72.0, 103.0, 167.0, 252.0, 443.0, 813.0, 1649.0, 3227.0, 7235.0, 18422.0, 53551.0, 194502.0, 504200.0, 181999.0, 50500.0, 17720.0, 6955.0, 3092.0, 1498.0, 828.0, 413.0, 297.0, 153.0, 98.0, 75.0, 43.0, 44.0, 19.0, 12.0, 8.0, 9.0, 6.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1246337890625, -0.12067413330078125, -0.1167144775390625, -0.11275482177734375, -0.108795166015625, -0.10483551025390625, -0.1008758544921875, -0.09691619873046875, -0.09295654296875, -0.08899688720703125, -0.0850372314453125, -0.08107757568359375, -0.077117919921875, -0.07315826416015625, -0.0691986083984375, -0.06523895263671875, -0.061279296875, -0.05731964111328125, -0.0533599853515625, -0.04940032958984375, -0.045440673828125, -0.04148101806640625, -0.0375213623046875, -0.03356170654296875, -0.02960205078125, -0.02564239501953125, -0.0216827392578125, -0.01772308349609375, -0.013763427734375, -0.00980377197265625, -0.0058441162109375, -0.00188446044921875, 0.0020751953125, 0.00603485107421875, 0.0099945068359375, 0.01395416259765625, 0.017913818359375, 0.02187347412109375, 0.0258331298828125, 0.02979278564453125, 0.03375244140625, 0.03771209716796875, 0.0416717529296875, 0.04563140869140625, 0.049591064453125, 0.05355072021484375, 0.0575103759765625, 0.06147003173828125, 0.0654296875, 0.06938934326171875, 0.0733489990234375, 0.07730865478515625, 0.081268310546875, 0.08522796630859375, 0.0891876220703125, 0.09314727783203125, 0.09710693359375, 0.10106658935546875, 0.1050262451171875, 0.10898590087890625, 0.112945556640625, 0.11690521240234375, 0.1208648681640625, 0.12482452392578125, 0.1287841796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 11.0, 6.0, 12.0, 14.0, 20.0, 26.0, 38.0, 29.0, 49.0, 59.0, 94.0, 83.0, 109.0, 104.0, 79.0, 59.0, 51.0, 41.0, 30.0, 26.0, 14.0, 7.0, 5.0, 7.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.300739288330078e-05, -2.2224150598049164e-05, -2.1440908312797546e-05, -2.065766602754593e-05, -1.987442374229431e-05, -1.9091181457042694e-05, -1.8307939171791077e-05, -1.752469688653946e-05, -1.6741454601287842e-05, -1.5958212316036224e-05, -1.5174970030784607e-05, -1.439172774553299e-05, -1.3608485460281372e-05, -1.2825243175029755e-05, -1.2042000889778137e-05, -1.125875860452652e-05, -1.0475516319274902e-05, -9.692274034023285e-06, -8.909031748771667e-06, -8.12578946352005e-06, -7.342547178268433e-06, -6.559304893016815e-06, -5.776062607765198e-06, -4.99282032251358e-06, -4.209578037261963e-06, -3.4263357520103455e-06, -2.643093466758728e-06, -1.8598511815071106e-06, -1.0766088962554932e-06, -2.9336661100387573e-07, 4.898756742477417e-07, 1.2731179594993591e-06, 2.0563602447509766e-06, 2.839602530002594e-06, 3.6228448152542114e-06, 4.406087100505829e-06, 5.189329385757446e-06, 5.972571671009064e-06, 6.755813956260681e-06, 7.539056241512299e-06, 8.322298526763916e-06, 9.105540812015533e-06, 9.888783097267151e-06, 1.0672025382518768e-05, 1.1455267667770386e-05, 1.2238509953022003e-05, 1.302175223827362e-05, 1.3804994523525238e-05, 1.4588236808776855e-05, 1.5371479094028473e-05, 1.615472137928009e-05, 1.6937963664531708e-05, 1.7721205949783325e-05, 1.8504448235034943e-05, 1.928769052028656e-05, 2.0070932805538177e-05, 2.0854175090789795e-05, 2.1637417376041412e-05, 2.242065966129303e-05, 2.3203901946544647e-05, 2.3987144231796265e-05, 2.4770386517047882e-05, 2.55536288022995e-05, 2.6336871087551117e-05, 2.7120113372802734e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 7.0, 15.0, 13.0, 31.0, 32.0, 44.0, 59.0, 118.0, 189.0, 272.0, 416.0, 746.0, 1470.0, 2739.0, 5830.0, 13833.0, 36685.0, 118906.0, 426771.0, 311079.0, 81902.0, 26790.0, 10637.0, 4692.0, 2338.0, 1199.0, 668.0, 380.0, 243.0, 138.0, 99.0, 72.0, 42.0, 32.0, 21.0, 13.0, 7.0, 11.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1302490234375, -0.12615966796875, -0.1220703125, -0.11798095703125, -0.1138916015625, -0.10980224609375, -0.105712890625, -0.10162353515625, -0.0975341796875, -0.09344482421875, -0.08935546875, -0.08526611328125, -0.0811767578125, -0.07708740234375, -0.072998046875, -0.06890869140625, -0.0648193359375, -0.06072998046875, -0.056640625, -0.05255126953125, -0.0484619140625, -0.04437255859375, -0.040283203125, -0.03619384765625, -0.0321044921875, -0.02801513671875, -0.02392578125, -0.01983642578125, -0.0157470703125, -0.01165771484375, -0.007568359375, -0.00347900390625, 0.0006103515625, 0.00469970703125, 0.0087890625, 0.01287841796875, 0.0169677734375, 0.02105712890625, 0.025146484375, 0.02923583984375, 0.0333251953125, 0.03741455078125, 0.04150390625, 0.04559326171875, 0.0496826171875, 0.05377197265625, 0.057861328125, 0.06195068359375, 0.0660400390625, 0.07012939453125, 0.07421875, 0.07830810546875, 0.0823974609375, 0.08648681640625, 0.090576171875, 0.09466552734375, 0.0987548828125, 0.10284423828125, 0.10693359375, 0.11102294921875, 0.1151123046875, 0.11920166015625, 0.123291015625, 0.12738037109375, 0.1314697265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 7.0, 9.0, 13.0, 7.0, 16.0, 11.0, 15.0, 27.0, 34.0, 36.0, 39.0, 58.0, 54.0, 82.0, 73.0, 66.0, 58.0, 62.0, 55.0, 42.0, 33.0, 27.0, 22.0, 32.0, 18.0, 22.0, 12.0, 9.0, 9.0, 10.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.050384521484375, -0.048601627349853516, -0.04681873321533203, -0.04503583908081055, -0.04325294494628906, -0.04147005081176758, -0.039687156677246094, -0.03790426254272461, -0.036121368408203125, -0.03433847427368164, -0.032555580139160156, -0.030772686004638672, -0.028989791870117188, -0.027206897735595703, -0.02542400360107422, -0.023641109466552734, -0.02185821533203125, -0.020075321197509766, -0.01829242706298828, -0.016509532928466797, -0.014726638793945312, -0.012943744659423828, -0.011160850524902344, -0.00937795639038086, -0.007595062255859375, -0.005812168121337891, -0.004029273986816406, -0.002246379852294922, -0.0004634857177734375, 0.0013194084167480469, 0.0031023025512695312, 0.004885196685791016, 0.0066680908203125, 0.008450984954833984, 0.010233879089355469, 0.012016773223876953, 0.013799667358398438, 0.015582561492919922, 0.017365455627441406, 0.01914834976196289, 0.020931243896484375, 0.02271413803100586, 0.024497032165527344, 0.026279926300048828, 0.028062820434570312, 0.029845714569091797, 0.03162860870361328, 0.033411502838134766, 0.03519439697265625, 0.036977291107177734, 0.03876018524169922, 0.0405430793762207, 0.04232597351074219, 0.04410886764526367, 0.045891761779785156, 0.04767465591430664, 0.049457550048828125, 0.05124044418334961, 0.053023338317871094, 0.05480623245239258, 0.05658912658691406, 0.05837202072143555, 0.06015491485595703, 0.061937808990478516, 0.063720703125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 6.0, 5.0, 13.0, 16.0, 37.0, 67.0, 102.0, 164.0, 185.0, 150.0, 99.0, 62.0, 40.0, 21.0, 10.0, 4.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5216164588928223, -2.448578357696533, -2.375540256500244, -2.302502155303955, -2.229464054107666, -2.156425952911377, -2.083387851715088, -2.010349750518799, -1.9373116493225098, -1.8642735481262207, -1.7912354469299316, -1.7181973457336426, -1.6451592445373535, -1.5721211433410645, -1.4990830421447754, -1.4260449409484863, -1.3530068397521973, -1.2799687385559082, -1.2069306373596191, -1.13389253616333, -1.060854434967041, -0.987816333770752, -0.9147782325744629, -0.8417401313781738, -0.7687020301818848, -0.6956639289855957, -0.6226258277893066, -0.5495877265930176, -0.4765496253967285, -0.40351152420043945, -0.3304734230041504, -0.25743532180786133, -0.18439698219299316, -0.1113588809967041, -0.03832077980041504, 0.03471732139587402, 0.10775542259216309, 0.18079352378845215, 0.2538316249847412, 0.3268697261810303, 0.39990782737731934, 0.4729459285736084, 0.5459840297698975, 0.6190221309661865, 0.6920602321624756, 0.7650983333587646, 0.8381364345550537, 0.9111745357513428, 0.9842126369476318, 1.057250738143921, 1.13028883934021, 1.203326940536499, 1.276365041732788, 1.3494031429290771, 1.4224412441253662, 1.4954793453216553, 1.5685174465179443, 1.6415555477142334, 1.7145936489105225, 1.7876317501068115, 1.8606698513031006, 1.9337079524993896, 2.0067460536956787, 2.0797841548919678, 2.152822256088257]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 10.0, 10.0, 25.0, 34.0, 42.0, 71.0, 77.0, 83.0, 89.0, 83.0, 78.0, 73.0, 82.0, 68.0, 60.0, 36.0, 26.0, 19.0, 16.0, 7.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8335562944412231, -1.7361416816711426, -1.6387271881103516, -1.541312575340271, -1.4438979625701904, -1.3464834690093994, -1.2490688562393188, -1.1516542434692383, -1.0542397499084473, -0.9568251967430115, -0.8594105839729309, -0.7619960308074951, -0.6645814180374146, -0.5671668648719788, -0.46975231170654297, -0.3723376989364624, -0.27492308616638184, -0.17750850319862366, -0.08009393513202667, 0.017320632934570312, 0.11473521590232849, 0.21214979887008667, 0.30956435203552246, 0.406978964805603, 0.5043935179710388, 0.6018080711364746, 0.6992226839065552, 0.796637237071991, 0.8940517902374268, 0.9914664030075073, 1.088881015777588, 1.186295509338379, 1.283710241317749, 1.3811248540878296, 1.4785393476486206, 1.5759539604187012, 1.6733685731887817, 1.7707831859588623, 1.8681976795196533, 1.9656122922897339, 2.0630269050598145, 2.1604413986206055, 2.2578561305999756, 2.3552706241607666, 2.4526851177215576, 2.5500998497009277, 2.6475143432617188, 2.7449288368225098, 2.842343330383301, 2.939757823944092, 3.037172555923462, 3.134587049484253, 3.232001543045044, 3.329416275024414, 3.426830768585205, 3.524245262145996, 3.621659994125366, 3.7190744876861572, 3.8164892196655273, 3.9139037132263184, 4.011318206787109, 4.1087327003479, 4.206147193908691, 4.303562164306641, 4.400976657867432]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 9.0, 11.0, 19.0, 11.0, 25.0, 38.0, 57.0, 72.0, 98.0, 163.0, 226.0, 369.0, 572.0, 900.0, 1699.0, 3198.0, 7241.0, 19009.0, 67912.0, 404439.0, 2884403.0, 668016.0, 93994.0, 24540.0, 8678.0, 3796.0, 1898.0, 1091.0, 652.0, 378.0, 246.0, 182.0, 90.0, 85.0, 56.0, 30.0, 22.0, 20.0, 16.0, 7.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.76513671875, -0.74237060546875, -0.7196044921875, -0.69683837890625, -0.674072265625, -0.65130615234375, -0.6285400390625, -0.60577392578125, -0.5830078125, -0.56024169921875, -0.5374755859375, -0.51470947265625, -0.491943359375, -0.46917724609375, -0.4464111328125, -0.42364501953125, -0.40087890625, -0.37811279296875, -0.3553466796875, -0.33258056640625, -0.309814453125, -0.28704833984375, -0.2642822265625, -0.24151611328125, -0.21875, -0.19598388671875, -0.1732177734375, -0.15045166015625, -0.127685546875, -0.10491943359375, -0.0821533203125, -0.05938720703125, -0.03662109375, -0.01385498046875, 0.0089111328125, 0.03167724609375, 0.054443359375, 0.07720947265625, 0.0999755859375, 0.12274169921875, 0.1455078125, 0.16827392578125, 0.1910400390625, 0.21380615234375, 0.236572265625, 0.25933837890625, 0.2821044921875, 0.30487060546875, 0.32763671875, 0.35040283203125, 0.3731689453125, 0.39593505859375, 0.418701171875, 0.44146728515625, 0.4642333984375, 0.48699951171875, 0.509765625, 0.53253173828125, 0.5552978515625, 0.57806396484375, 0.600830078125, 0.62359619140625, 0.6463623046875, 0.66912841796875, 0.69189453125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 8.0, 11.0, 7.0, 16.0, 13.0, 23.0, 40.0, 41.0, 42.0, 59.0, 52.0, 63.0, 69.0, 70.0, 67.0, 66.0, 56.0, 61.0, 46.0, 41.0, 33.0, 22.0, 17.0, 18.0, 10.0, 10.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.77294921875, -0.7512664794921875, -0.729583740234375, -0.7079010009765625, -0.68621826171875, -0.6645355224609375, -0.642852783203125, -0.6211700439453125, -0.5994873046875, -0.5778045654296875, -0.556121826171875, -0.5344390869140625, -0.51275634765625, -0.4910736083984375, -0.469390869140625, -0.4477081298828125, -0.426025390625, -0.4043426513671875, -0.382659912109375, -0.3609771728515625, -0.33929443359375, -0.3176116943359375, -0.295928955078125, -0.2742462158203125, -0.2525634765625, -0.2308807373046875, -0.209197998046875, -0.1875152587890625, -0.16583251953125, -0.1441497802734375, -0.122467041015625, -0.1007843017578125, -0.0791015625, -0.0574188232421875, -0.035736083984375, -0.0140533447265625, 0.00762939453125, 0.0293121337890625, 0.050994873046875, 0.0726776123046875, 0.0943603515625, 0.1160430908203125, 0.137725830078125, 0.1594085693359375, 0.18109130859375, 0.2027740478515625, 0.224456787109375, 0.2461395263671875, 0.267822265625, 0.2895050048828125, 0.311187744140625, 0.3328704833984375, 0.35455322265625, 0.3762359619140625, 0.397918701171875, 0.4196014404296875, 0.4412841796875, 0.4629669189453125, 0.484649658203125, 0.5063323974609375, 0.52801513671875, 0.5496978759765625, 0.571380615234375, 0.5930633544921875, 0.61474609375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 8.0, 16.0, 17.0, 38.0, 54.0, 121.0, 264.0, 871.0, 5237.0, 108795.0, 4022005.0, 52155.0, 3563.0, 664.0, 217.0, 98.0, 62.0, 26.0, 18.0, 10.0, 12.0, 9.0, 7.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.2282257080078125, -2.161529541015625, -2.0948333740234375, -2.02813720703125, -1.9614410400390625, -1.894744873046875, -1.8280487060546875, -1.7613525390625, -1.6946563720703125, -1.627960205078125, -1.5612640380859375, -1.49456787109375, -1.4278717041015625, -1.361175537109375, -1.2944793701171875, -1.227783203125, -1.1610870361328125, -1.094390869140625, -1.0276947021484375, -0.96099853515625, -0.8943023681640625, -0.827606201171875, -0.7609100341796875, -0.6942138671875, -0.6275177001953125, -0.560821533203125, -0.4941253662109375, -0.42742919921875, -0.3607330322265625, -0.294036865234375, -0.2273406982421875, -0.16064453125, -0.0939483642578125, -0.027252197265625, 0.0394439697265625, 0.10614013671875, 0.1728363037109375, 0.239532470703125, 0.3062286376953125, 0.3729248046875, 0.4396209716796875, 0.506317138671875, 0.5730133056640625, 0.63970947265625, 0.7064056396484375, 0.773101806640625, 0.8397979736328125, 0.906494140625, 0.9731903076171875, 1.039886474609375, 1.1065826416015625, 1.17327880859375, 1.2399749755859375, 1.306671142578125, 1.3733673095703125, 1.4400634765625, 1.5067596435546875, 1.573455810546875, 1.6401519775390625, 1.70684814453125, 1.7735443115234375, 1.840240478515625, 1.9069366455078125, 1.9736328125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 11.0, 9.0, 12.0, 11.0, 19.0, 25.0, 35.0, 52.0, 71.0, 117.0, 169.0, 317.0, 607.0, 1023.0, 651.0, 363.0, 184.0, 132.0, 79.0, 48.0, 40.0, 31.0, 12.0, 14.0, 11.0, 10.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.303466796875, -0.2956066131591797, -0.2877464294433594, -0.27988624572753906, -0.27202606201171875, -0.26416587829589844, -0.2563056945800781, -0.2484455108642578, -0.2405853271484375, -0.2327251434326172, -0.22486495971679688, -0.21700477600097656, -0.20914459228515625, -0.20128440856933594, -0.19342422485351562, -0.1855640411376953, -0.177703857421875, -0.1698436737060547, -0.16198348999023438, -0.15412330627441406, -0.14626312255859375, -0.13840293884277344, -0.13054275512695312, -0.12268257141113281, -0.1148223876953125, -0.10696220397949219, -0.09910202026367188, -0.09124183654785156, -0.08338165283203125, -0.07552146911621094, -0.06766128540039062, -0.05980110168457031, -0.05194091796875, -0.04408073425292969, -0.036220550537109375, -0.028360366821289062, -0.02050018310546875, -0.012639999389648438, -0.004779815673828125, 0.0030803680419921875, 0.0109405517578125, 0.018800735473632812, 0.026660919189453125, 0.03452110290527344, 0.04238128662109375, 0.05024147033691406, 0.058101654052734375, 0.06596183776855469, 0.073822021484375, 0.08168220520019531, 0.08954238891601562, 0.09740257263183594, 0.10526275634765625, 0.11312294006347656, 0.12098312377929688, 0.1288433074951172, 0.1367034912109375, 0.1445636749267578, 0.15242385864257812, 0.16028404235839844, 0.16814422607421875, 0.17600440979003906, 0.18386459350585938, 0.1917247772216797, 0.1995849609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 8.0, 10.0, 16.0, 20.0, 37.0, 49.0, 76.0, 128.0, 144.0, 115.0, 119.0, 89.0, 64.0, 39.0, 21.0, 15.0, 16.0, 9.0, 8.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9965784549713135, -0.9553521871566772, -0.914125919342041, -0.8728996515274048, -0.8316733837127686, -0.7904471158981323, -0.7492208480834961, -0.7079945802688599, -0.6667683124542236, -0.6255420446395874, -0.5843157768249512, -0.5430895090103149, -0.5018632411956787, -0.4606369733810425, -0.41941070556640625, -0.37818443775177, -0.3369581699371338, -0.29573190212249756, -0.25450563430786133, -0.2132793664932251, -0.17205309867858887, -0.13082683086395264, -0.0896005630493164, -0.048374295234680176, -0.007148027420043945, 0.034078240394592285, 0.07530450820922852, 0.11653077602386475, 0.15775704383850098, 0.1989833116531372, 0.24020957946777344, 0.28143584728240967, 0.3226621150970459, 0.36388838291168213, 0.40511465072631836, 0.4463409185409546, 0.4875671863555908, 0.528793454170227, 0.5700197219848633, 0.6112459897994995, 0.6524722576141357, 0.693698525428772, 0.7349247932434082, 0.7761510610580444, 0.8173773288726807, 0.8586035966873169, 0.8998298645019531, 0.9410561323165894, 0.9822824001312256, 1.0235086679458618, 1.064734935760498, 1.1059612035751343, 1.1471874713897705, 1.1884137392044067, 1.229640007019043, 1.2708662748336792, 1.3120925426483154, 1.3533188104629517, 1.394545078277588, 1.4357713460922241, 1.4769976139068604, 1.5182238817214966, 1.5594501495361328, 1.600676417350769, 1.6419026851654053]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 6.0, 3.0, 7.0, 5.0, 3.0, 9.0, 9.0, 17.0, 16.0, 17.0, 30.0, 37.0, 31.0, 29.0, 42.0, 33.0, 49.0, 68.0, 56.0, 56.0, 50.0, 52.0, 35.0, 43.0, 38.0, 44.0, 34.0, 28.0, 18.0, 29.0, 22.0, 12.0, 14.0, 7.0, 8.0, 11.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6031824946403503, -0.5844428539276123, -0.5657031536102295, -0.5469635128974915, -0.5282238721847534, -0.5094842314720154, -0.49074456095695496, -0.47200489044189453, -0.4532652497291565, -0.43452560901641846, -0.41578593850135803, -0.3970462679862976, -0.37830662727355957, -0.35956698656082153, -0.3408273160457611, -0.3220876455307007, -0.30334800481796265, -0.2846083641052246, -0.2658686935901642, -0.24712903797626495, -0.22838938236236572, -0.2096497267484665, -0.19091007113456726, -0.17217041552066803, -0.1534307599067688, -0.13469110429286957, -0.11595144867897034, -0.0972117930650711, -0.07847213745117188, -0.059732481837272644, -0.04099282622337341, -0.022253170609474182, -0.0035134553909301758, 0.015226200222969055, 0.033965855836868286, 0.05270551145076752, 0.07144516706466675, 0.09018482267856598, 0.10892447829246521, 0.12766413390636444, 0.14640378952026367, 0.1651434451341629, 0.18388310074806213, 0.20262275636196136, 0.2213624119758606, 0.24010206758975983, 0.25884172320365906, 0.2775813937187195, 0.2963210344314575, 0.31506067514419556, 0.333800345659256, 0.3525400161743164, 0.37127965688705444, 0.3900192975997925, 0.4087589681148529, 0.42749863862991333, 0.44623827934265137, 0.4649779200553894, 0.48371759057044983, 0.5024572610855103, 0.5211969017982483, 0.5399365425109863, 0.5586762428283691, 0.5774158835411072, 0.5961555242538452]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 3.0, 10.0, 24.0, 22.0, 28.0, 52.0, 60.0, 104.0, 172.0, 262.0, 393.0, 682.0, 1094.0, 1848.0, 3374.0, 6428.0, 13543.0, 32840.0, 123183.0, 615980.0, 175779.0, 40603.0, 15528.0, 7441.0, 3790.0, 2072.0, 1225.0, 724.0, 433.0, 288.0, 172.0, 116.0, 92.0, 37.0, 43.0, 27.0, 23.0, 17.0, 11.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2105712890625, -0.20411109924316406, -0.19765090942382812, -0.1911907196044922, -0.18473052978515625, -0.1782703399658203, -0.17181015014648438, -0.16534996032714844, -0.1588897705078125, -0.15242958068847656, -0.14596939086914062, -0.1395092010498047, -0.13304901123046875, -0.1265888214111328, -0.12012863159179688, -0.11366844177246094, -0.107208251953125, -0.10074806213378906, -0.09428787231445312, -0.08782768249511719, -0.08136749267578125, -0.07490730285644531, -0.06844711303710938, -0.06198692321777344, -0.0555267333984375, -0.04906654357910156, -0.042606353759765625, -0.03614616394042969, -0.02968597412109375, -0.023225784301757812, -0.016765594482421875, -0.010305404663085938, -0.00384521484375, 0.0026149749755859375, 0.009075164794921875, 0.015535354614257812, 0.02199554443359375, 0.028455734252929688, 0.034915924072265625, 0.04137611389160156, 0.0478363037109375, 0.05429649353027344, 0.060756683349609375, 0.06721687316894531, 0.07367706298828125, 0.08013725280761719, 0.08659744262695312, 0.09305763244628906, 0.099517822265625, 0.10597801208496094, 0.11243820190429688, 0.11889839172363281, 0.12535858154296875, 0.1318187713623047, 0.13827896118164062, 0.14473915100097656, 0.1511993408203125, 0.15765953063964844, 0.16411972045898438, 0.1705799102783203, 0.17704010009765625, 0.1835002899169922, 0.18996047973632812, 0.19642066955566406, 0.202880859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 9.0, 7.0, 9.0, 8.0, 7.0, 21.0, 18.0, 32.0, 37.0, 54.0, 39.0, 68.0, 66.0, 86.0, 63.0, 70.0, 72.0, 50.0, 61.0, 48.0, 40.0, 30.0, 22.0, 19.0, 20.0, 8.0, 8.0, 11.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.481689453125, -0.4642295837402344, -0.44676971435546875, -0.4293098449707031, -0.4118499755859375, -0.3943901062011719, -0.37693023681640625, -0.3594703674316406, -0.342010498046875, -0.3245506286621094, -0.30709075927734375, -0.2896308898925781, -0.2721710205078125, -0.2547111511230469, -0.23725128173828125, -0.21979141235351562, -0.20233154296875, -0.18487167358398438, -0.16741180419921875, -0.14995193481445312, -0.1324920654296875, -0.11503219604492188, -0.09757232666015625, -0.08011245727539062, -0.062652587890625, -0.045192718505859375, -0.02773284912109375, -0.010272979736328125, 0.0071868896484375, 0.024646759033203125, 0.04210662841796875, 0.059566497802734375, 0.0770263671875, 0.09448623657226562, 0.11194610595703125, 0.12940597534179688, 0.1468658447265625, 0.16432571411132812, 0.18178558349609375, 0.19924545288085938, 0.216705322265625, 0.23416519165039062, 0.25162506103515625, 0.2690849304199219, 0.2865447998046875, 0.3040046691894531, 0.32146453857421875, 0.3389244079589844, 0.35638427734375, 0.3738441467285156, 0.39130401611328125, 0.4087638854980469, 0.4262237548828125, 0.4436836242675781, 0.46114349365234375, 0.4786033630371094, 0.496063232421875, 0.5135231018066406, 0.5309829711914062, 0.5484428405761719, 0.5659027099609375, 0.5833625793457031, 0.6008224487304688, 0.6182823181152344, 0.6357421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 5.0, 7.0, 8.0, 5.0, 4.0, 14.0, 9.0, 9.0, 20.0, 30.0, 35.0, 52.0, 69.0, 127.0, 184.0, 320.0, 625.0, 1163.0, 2484.0, 6066.0, 18653.0, 93241.0, 682731.0, 198798.0, 28933.0, 8511.0, 3231.0, 1461.0, 711.0, 358.0, 222.0, 149.0, 105.0, 64.0, 38.0, 31.0, 16.0, 18.0, 13.0, 10.0, 7.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.16881370544433594, -0.16196823120117188, -0.1551227569580078, -0.14827728271484375, -0.1414318084716797, -0.13458633422851562, -0.12774085998535156, -0.1208953857421875, -0.11404991149902344, -0.10720443725585938, -0.10035896301269531, -0.09351348876953125, -0.08666801452636719, -0.07982254028320312, -0.07297706604003906, -0.066131591796875, -0.05928611755371094, -0.052440643310546875, -0.04559516906738281, -0.03874969482421875, -0.03190422058105469, -0.025058746337890625, -0.018213272094726562, -0.0113677978515625, -0.0045223236083984375, 0.002323150634765625, 0.009168624877929688, 0.01601409912109375, 0.022859573364257812, 0.029705047607421875, 0.03655052185058594, 0.04339599609375, 0.05024147033691406, 0.057086944580078125, 0.06393241882324219, 0.07077789306640625, 0.07762336730957031, 0.08446884155273438, 0.09131431579589844, 0.0981597900390625, 0.10500526428222656, 0.11185073852539062, 0.11869621276855469, 0.12554168701171875, 0.1323871612548828, 0.13923263549804688, 0.14607810974121094, 0.152923583984375, 0.15976905822753906, 0.16661453247070312, 0.1734600067138672, 0.18030548095703125, 0.1871509552001953, 0.19399642944335938, 0.20084190368652344, 0.2076873779296875, 0.21453285217285156, 0.22137832641601562, 0.2282238006591797, 0.23506927490234375, 0.2419147491455078, 0.24876022338867188, 0.25560569763183594, 0.262451171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 10.0, 8.0, 3.0, 7.0, 14.0, 12.0, 7.0, 23.0, 17.0, 26.0, 26.0, 28.0, 47.0, 36.0, 52.0, 54.0, 58.0, 44.0, 49.0, 49.0, 35.0, 49.0, 45.0, 47.0, 46.0, 44.0, 36.0, 21.0, 27.0, 10.0, 19.0, 11.0, 8.0, 11.0, 8.0, 4.0, 4.0, 2.0, 3.0, 6.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84814453125, -0.8212203979492188, -0.7942962646484375, -0.7673721313476562, -0.740447998046875, -0.7135238647460938, -0.6865997314453125, -0.6596755981445312, -0.63275146484375, -0.6058273315429688, -0.5789031982421875, -0.5519790649414062, -0.525054931640625, -0.49813079833984375, -0.4712066650390625, -0.44428253173828125, -0.4173583984375, -0.39043426513671875, -0.3635101318359375, -0.33658599853515625, -0.309661865234375, -0.28273773193359375, -0.2558135986328125, -0.22888946533203125, -0.20196533203125, -0.17504119873046875, -0.1481170654296875, -0.12119293212890625, -0.094268798828125, -0.06734466552734375, -0.0404205322265625, -0.01349639892578125, 0.013427734375, 0.04035186767578125, 0.0672760009765625, 0.09420013427734375, 0.121124267578125, 0.14804840087890625, 0.1749725341796875, 0.20189666748046875, 0.22882080078125, 0.25574493408203125, 0.2826690673828125, 0.30959320068359375, 0.336517333984375, 0.36344146728515625, 0.3903656005859375, 0.41728973388671875, 0.4442138671875, 0.47113800048828125, 0.4980621337890625, 0.5249862670898438, 0.551910400390625, 0.5788345336914062, 0.6057586669921875, 0.6326828002929688, 0.65960693359375, 0.6865310668945312, 0.7134552001953125, 0.7403793334960938, 0.767303466796875, 0.7942276000976562, 0.8211517333984375, 0.8480758666992188, 0.875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 0.0, 5.0, 8.0, 8.0, 19.0, 21.0, 22.0, 64.0, 84.0, 158.0, 247.0, 450.0, 880.0, 1886.0, 4508.0, 13778.0, 81713.0, 830321.0, 90887.0, 14715.0, 4735.0, 2021.0, 934.0, 447.0, 250.0, 139.0, 98.0, 56.0, 31.0, 20.0, 12.0, 13.0, 12.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1717529296875, -0.16717529296875, -0.16259765625, -0.15802001953125, -0.1534423828125, -0.14886474609375, -0.144287109375, -0.13970947265625, -0.1351318359375, -0.13055419921875, -0.1259765625, -0.12139892578125, -0.1168212890625, -0.11224365234375, -0.107666015625, -0.10308837890625, -0.0985107421875, -0.09393310546875, -0.08935546875, -0.08477783203125, -0.0802001953125, -0.07562255859375, -0.071044921875, -0.06646728515625, -0.0618896484375, -0.05731201171875, -0.052734375, -0.04815673828125, -0.0435791015625, -0.03900146484375, -0.034423828125, -0.02984619140625, -0.0252685546875, -0.02069091796875, -0.01611328125, -0.01153564453125, -0.0069580078125, -0.00238037109375, 0.002197265625, 0.00677490234375, 0.0113525390625, 0.01593017578125, 0.0205078125, 0.02508544921875, 0.0296630859375, 0.03424072265625, 0.038818359375, 0.04339599609375, 0.0479736328125, 0.05255126953125, 0.05712890625, 0.06170654296875, 0.0662841796875, 0.07086181640625, 0.075439453125, 0.08001708984375, 0.0845947265625, 0.08917236328125, 0.09375, 0.09832763671875, 0.1029052734375, 0.10748291015625, 0.112060546875, 0.11663818359375, 0.1212158203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 3.0, 11.0, 4.0, 16.0, 27.0, 37.0, 68.0, 87.0, 153.0, 205.0, 151.0, 88.0, 57.0, 25.0, 21.0, 14.0, 1.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.511543273925781e-05, -8.277781307697296e-05, -8.044019341468811e-05, -7.810257375240326e-05, -7.576495409011841e-05, -7.342733442783356e-05, -7.10897147655487e-05, -6.875209510326385e-05, -6.6414475440979e-05, -6.407685577869415e-05, -6.17392361164093e-05, -5.940161645412445e-05, -5.70639967918396e-05, -5.472637712955475e-05, -5.23887574672699e-05, -5.0051137804985046e-05, -4.7713518142700195e-05, -4.5375898480415344e-05, -4.303827881813049e-05, -4.070065915584564e-05, -3.836303949356079e-05, -3.602541983127594e-05, -3.368780016899109e-05, -3.135018050670624e-05, -2.9012560844421387e-05, -2.6674941182136536e-05, -2.4337321519851685e-05, -2.1999701857566833e-05, -1.9662082195281982e-05, -1.732446253299713e-05, -1.498684287071228e-05, -1.264922320842743e-05, -1.0311603546142578e-05, -7.973983883857727e-06, -5.636364221572876e-06, -3.298744559288025e-06, -9.611248970031738e-07, 1.3764947652816772e-06, 3.7141144275665283e-06, 6.051734089851379e-06, 8.38935375213623e-06, 1.0726973414421082e-05, 1.3064593076705933e-05, 1.5402212738990784e-05, 1.7739832401275635e-05, 2.0077452063560486e-05, 2.2415071725845337e-05, 2.4752691388130188e-05, 2.709031105041504e-05, 2.942793071269989e-05, 3.176555037498474e-05, 3.410317003726959e-05, 3.644078969955444e-05, 3.8778409361839294e-05, 4.1116029024124146e-05, 4.3453648686408997e-05, 4.579126834869385e-05, 4.81288880109787e-05, 5.046650767326355e-05, 5.28041273355484e-05, 5.514174699783325e-05, 5.74793666601181e-05, 5.9816986322402954e-05, 6.21546059846878e-05, 6.449222564697266e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 0.0, 6.0, 7.0, 8.0, 12.0, 22.0, 40.0, 51.0, 95.0, 143.0, 238.0, 447.0, 817.0, 1711.0, 3899.0, 9490.0, 32878.0, 345629.0, 587621.0, 44746.0, 11823.0, 4593.0, 2105.0, 973.0, 510.0, 263.0, 143.0, 96.0, 73.0, 23.0, 22.0, 13.0, 11.0, 9.0, 16.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.14306640625, -0.13898944854736328, -0.13491249084472656, -0.13083553314208984, -0.12675857543945312, -0.1226816177368164, -0.11860466003417969, -0.11452770233154297, -0.11045074462890625, -0.10637378692626953, -0.10229682922363281, -0.0982198715209961, -0.09414291381835938, -0.09006595611572266, -0.08598899841308594, -0.08191204071044922, -0.0778350830078125, -0.07375812530517578, -0.06968116760253906, -0.06560420989990234, -0.061527252197265625, -0.057450294494628906, -0.05337333679199219, -0.04929637908935547, -0.04521942138671875, -0.04114246368408203, -0.03706550598144531, -0.032988548278808594, -0.028911590576171875, -0.024834632873535156, -0.020757675170898438, -0.01668071746826172, -0.012603759765625, -0.008526802062988281, -0.0044498443603515625, -0.00037288665771484375, 0.003704071044921875, 0.007781028747558594, 0.011857986450195312, 0.01593494415283203, 0.02001190185546875, 0.02408885955810547, 0.028165817260742188, 0.032242774963378906, 0.036319732666015625, 0.040396690368652344, 0.04447364807128906, 0.04855060577392578, 0.0526275634765625, 0.05670452117919922, 0.06078147888183594, 0.06485843658447266, 0.06893539428710938, 0.0730123519897461, 0.07708930969238281, 0.08116626739501953, 0.08524322509765625, 0.08932018280029297, 0.09339714050292969, 0.0974740982055664, 0.10155105590820312, 0.10562801361083984, 0.10970497131347656, 0.11378192901611328, 0.11785888671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 3.0, 9.0, 10.0, 14.0, 16.0, 34.0, 40.0, 79.0, 111.0, 156.0, 154.0, 110.0, 71.0, 57.0, 33.0, 24.0, 12.0, 15.0, 10.0, 6.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023895263671875, -0.022979259490966797, -0.022063255310058594, -0.02114725112915039, -0.020231246948242188, -0.019315242767333984, -0.01839923858642578, -0.017483234405517578, -0.016567230224609375, -0.015651226043701172, -0.014735221862792969, -0.013819217681884766, -0.012903213500976562, -0.01198720932006836, -0.011071205139160156, -0.010155200958251953, -0.00923919677734375, -0.008323192596435547, -0.007407188415527344, -0.006491184234619141, -0.0055751800537109375, -0.004659175872802734, -0.0037431716918945312, -0.002827167510986328, -0.001911163330078125, -0.0009951591491699219, -7.915496826171875e-05, 0.0008368492126464844, 0.0017528533935546875, 0.0026688575744628906, 0.0035848617553710938, 0.004500865936279297, 0.0054168701171875, 0.006332874298095703, 0.007248878479003906, 0.00816488265991211, 0.009080886840820312, 0.009996891021728516, 0.010912895202636719, 0.011828899383544922, 0.012744903564453125, 0.013660907745361328, 0.014576911926269531, 0.015492916107177734, 0.016408920288085938, 0.01732492446899414, 0.018240928649902344, 0.019156932830810547, 0.02007293701171875, 0.020988941192626953, 0.021904945373535156, 0.02282094955444336, 0.023736953735351562, 0.024652957916259766, 0.02556896209716797, 0.026484966278076172, 0.027400970458984375, 0.028316974639892578, 0.02923297882080078, 0.030148983001708984, 0.031064987182617188, 0.03198099136352539, 0.032896995544433594, 0.0338129997253418, 0.03472900390625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 11.0, 13.0, 22.0, 48.0, 71.0, 119.0, 163.0, 183.0, 142.0, 90.0, 42.0, 25.0, 14.0, 17.0, 10.0, 7.0, 7.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8666658401489258, -0.8335991501808167, -0.8005324602127075, -0.7674657702445984, -0.7343990802764893, -0.7013323307037354, -0.6682656407356262, -0.6351989507675171, -0.602132260799408, -0.5690655708312988, -0.5359988808631897, -0.5029321908950806, -0.46986547112464905, -0.4367987811565399, -0.4037320613861084, -0.37066537141799927, -0.33759868144989014, -0.304531991481781, -0.2714653015136719, -0.23839858174324036, -0.20533189177513123, -0.1722652018070221, -0.13919849693775177, -0.10613179206848145, -0.07306510210037231, -0.03999840468168259, -0.006931707262992859, 0.02613499015569687, 0.0592016875743866, 0.09226837754249573, 0.12533508241176605, 0.15840178728103638, 0.1914684772491455, 0.22453516721725464, 0.25760185718536377, 0.2906685769557953, 0.3237352669239044, 0.35680195689201355, 0.38986867666244507, 0.4229353666305542, 0.45600205659866333, 0.48906874656677246, 0.5221354365348816, 0.5552021265029907, 0.5882688760757446, 0.621335506439209, 0.6544022560119629, 0.687468945980072, 0.7205356359481812, 0.7536023259162903, 0.7866690158843994, 0.8197357058525085, 0.8528023958206177, 0.8858691453933716, 0.9189358353614807, 0.9520025253295898, 0.985069215297699, 1.018135905265808, 1.051202654838562, 1.0842692852020264, 1.1173360347747803, 1.1504026651382446, 1.1834694147109985, 1.216536045074463, 1.2496027946472168]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 6.0, 3.0, 8.0, 7.0, 13.0, 16.0, 25.0, 26.0, 27.0, 47.0, 40.0, 55.0, 54.0, 60.0, 72.0, 80.0, 57.0, 49.0, 57.0, 49.0, 41.0, 32.0, 33.0, 25.0, 26.0, 14.0, 12.0, 13.0, 14.0, 3.0, 7.0, 7.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4369208514690399, -0.42228955030441284, -0.4076582193374634, -0.3930269181728363, -0.37839561700820923, -0.36376428604125977, -0.3491329848766327, -0.3345016837120056, -0.31987035274505615, -0.3052390515804291, -0.2906077206134796, -0.27597641944885254, -0.2613450884819031, -0.246713787317276, -0.23208248615264893, -0.21745117008686066, -0.2028198540210724, -0.18818853795528412, -0.17355722188949585, -0.15892592072486877, -0.1442946046590805, -0.12966328859329224, -0.11503197997808456, -0.10040067136287689, -0.08576935529708862, -0.07113803923130035, -0.05650673061609268, -0.04187541827559471, -0.02724410593509674, -0.012612789869308472, 0.0020185187458992004, 0.016649827361106873, 0.031281113624572754, 0.045912425965070724, 0.060543738305568695, 0.07517504692077637, 0.08980636298656464, 0.1044376790523529, 0.11906898766756058, 0.13370029628276825, 0.14833161234855652, 0.1629629284143448, 0.17759424448013306, 0.19222554564476013, 0.2068568617105484, 0.22148817777633667, 0.23611947894096375, 0.2507507801055908, 0.2653821110725403, 0.28001341223716736, 0.2946447432041168, 0.3092760443687439, 0.32390737533569336, 0.33853867650032043, 0.3531699776649475, 0.367801308631897, 0.38243260979652405, 0.3970639109611511, 0.4116952419281006, 0.42632654309272766, 0.44095784425735474, 0.4555891752243042, 0.4702204763889313, 0.48485177755355835, 0.4994831085205078]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 9.0, 11.0, 24.0, 41.0, 72.0, 167.0, 477.0, 1439.0, 5063.0, 21775.0, 153691.0, 751909.0, 92917.0, 15365.0, 3699.0, 1180.0, 377.0, 142.0, 70.0, 33.0, 22.0, 11.0, 9.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.80859375, -0.78363037109375, -0.7586669921875, -0.73370361328125, -0.708740234375, -0.68377685546875, -0.6588134765625, -0.63385009765625, -0.60888671875, -0.58392333984375, -0.5589599609375, -0.53399658203125, -0.509033203125, -0.48406982421875, -0.4591064453125, -0.43414306640625, -0.4091796875, -0.38421630859375, -0.3592529296875, -0.33428955078125, -0.309326171875, -0.28436279296875, -0.2593994140625, -0.23443603515625, -0.20947265625, -0.18450927734375, -0.1595458984375, -0.13458251953125, -0.109619140625, -0.08465576171875, -0.0596923828125, -0.03472900390625, -0.009765625, 0.01519775390625, 0.0401611328125, 0.06512451171875, 0.090087890625, 0.11505126953125, 0.1400146484375, 0.16497802734375, 0.18994140625, 0.21490478515625, 0.2398681640625, 0.26483154296875, 0.289794921875, 0.31475830078125, 0.3397216796875, 0.36468505859375, 0.3896484375, 0.41461181640625, 0.4395751953125, 0.46453857421875, 0.489501953125, 0.51446533203125, 0.5394287109375, 0.56439208984375, 0.58935546875, 0.61431884765625, 0.6392822265625, 0.66424560546875, 0.689208984375, 0.71417236328125, 0.7391357421875, 0.76409912109375, 0.7890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 17.0, 23.0, 41.0, 74.0, 101.0, 126.0, 167.0, 136.0, 118.0, 65.0, 43.0, 28.0, 24.0, 12.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -0.9563446044921875, -0.880462646484375, -0.8045806884765625, -0.72869873046875, -0.6528167724609375, -0.576934814453125, -0.5010528564453125, -0.4251708984375, -0.3492889404296875, -0.273406982421875, -0.1975250244140625, -0.12164306640625, -0.0457611083984375, 0.030120849609375, 0.1060028076171875, 0.181884765625, 0.2577667236328125, 0.333648681640625, 0.4095306396484375, 0.48541259765625, 0.5612945556640625, 0.637176513671875, 0.7130584716796875, 0.7889404296875, 0.8648223876953125, 0.940704345703125, 1.0165863037109375, 1.09246826171875, 1.1683502197265625, 1.244232177734375, 1.3201141357421875, 1.39599609375, 1.4718780517578125, 1.547760009765625, 1.6236419677734375, 1.69952392578125, 1.7754058837890625, 1.851287841796875, 1.9271697998046875, 2.0030517578125, 2.0789337158203125, 2.154815673828125, 2.2306976318359375, 2.30657958984375, 2.3824615478515625, 2.458343505859375, 2.5342254638671875, 2.610107421875, 2.6859893798828125, 2.761871337890625, 2.8377532958984375, 2.91363525390625, 2.9895172119140625, 3.065399169921875, 3.1412811279296875, 3.2171630859375, 3.2930450439453125, 3.368927001953125, 3.4448089599609375, 3.52069091796875, 3.5965728759765625, 3.672454833984375, 3.7483367919921875, 3.82421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 9.0, 8.0, 14.0, 11.0, 20.0, 27.0, 25.0, 54.0, 58.0, 70.0, 111.0, 150.0, 266.0, 508.0, 990.0, 2578.0, 7229.0, 26607.0, 141281.0, 681608.0, 146684.0, 27633.0, 7589.0, 2573.0, 1065.0, 506.0, 313.0, 159.0, 98.0, 80.0, 67.0, 32.0, 34.0, 19.0, 17.0, 10.0, 9.0, 8.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.49169921875, -0.4770240783691406, -0.46234893798828125, -0.4476737976074219, -0.4329986572265625, -0.4183235168457031, -0.40364837646484375, -0.3889732360839844, -0.374298095703125, -0.3596229553222656, -0.34494781494140625, -0.3302726745605469, -0.3155975341796875, -0.3009223937988281, -0.28624725341796875, -0.2715721130371094, -0.25689697265625, -0.24222183227539062, -0.22754669189453125, -0.21287155151367188, -0.1981964111328125, -0.18352127075195312, -0.16884613037109375, -0.15417098999023438, -0.139495849609375, -0.12482070922851562, -0.11014556884765625, -0.09547042846679688, -0.0807952880859375, -0.06612014770507812, -0.05144500732421875, -0.036769866943359375, -0.0220947265625, -0.007419586181640625, 0.00725555419921875, 0.021930694580078125, 0.0366058349609375, 0.051280975341796875, 0.06595611572265625, 0.08063125610351562, 0.095306396484375, 0.10998153686523438, 0.12465667724609375, 0.13933181762695312, 0.1540069580078125, 0.16868209838867188, 0.18335723876953125, 0.19803237915039062, 0.21270751953125, 0.22738265991210938, 0.24205780029296875, 0.2567329406738281, 0.2714080810546875, 0.2860832214355469, 0.30075836181640625, 0.3154335021972656, 0.330108642578125, 0.3447837829589844, 0.35945892333984375, 0.3741340637207031, 0.3888092041015625, 0.4034843444824219, 0.41815948486328125, 0.4328346252441406, 0.447509765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 8.0, 10.0, 5.0, 4.0, 8.0, 20.0, 11.0, 11.0, 21.0, 15.0, 29.0, 29.0, 32.0, 35.0, 27.0, 39.0, 41.0, 45.0, 48.0, 47.0, 49.0, 53.0, 41.0, 43.0, 28.0, 28.0, 35.0, 42.0, 32.0, 31.0, 20.0, 16.0, 19.0, 14.0, 14.0, 11.0, 11.0, 5.0, 7.0, 3.0, 8.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -1.0006637573242188, -0.9691009521484375, -0.9375381469726562, -0.905975341796875, -0.8744125366210938, -0.8428497314453125, -0.8112869262695312, -0.77972412109375, -0.7481613159179688, -0.7165985107421875, -0.6850357055664062, -0.653472900390625, -0.6219100952148438, -0.5903472900390625, -0.5587844848632812, -0.5272216796875, -0.49565887451171875, -0.4640960693359375, -0.43253326416015625, -0.400970458984375, -0.36940765380859375, -0.3378448486328125, -0.30628204345703125, -0.27471923828125, -0.24315643310546875, -0.2115936279296875, -0.18003082275390625, -0.148468017578125, -0.11690521240234375, -0.0853424072265625, -0.05377960205078125, -0.022216796875, 0.00934600830078125, 0.0409088134765625, 0.07247161865234375, 0.104034423828125, 0.13559722900390625, 0.1671600341796875, 0.19872283935546875, 0.23028564453125, 0.26184844970703125, 0.2934112548828125, 0.32497406005859375, 0.356536865234375, 0.38809967041015625, 0.4196624755859375, 0.45122528076171875, 0.4827880859375, 0.5143508911132812, 0.5459136962890625, 0.5774765014648438, 0.609039306640625, 0.6406021118164062, 0.6721649169921875, 0.7037277221679688, 0.73529052734375, 0.7668533325195312, 0.7984161376953125, 0.8299789428710938, 0.861541748046875, 0.8931045532226562, 0.9246673583984375, 0.9562301635742188, 0.98779296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 3.0, 4.0, 4.0, 10.0, 18.0, 22.0, 40.0, 62.0, 101.0, 179.0, 341.0, 684.0, 1568.0, 4593.0, 15899.0, 92898.0, 765449.0, 137357.0, 20337.0, 5413.0, 1913.0, 776.0, 398.0, 207.0, 118.0, 51.0, 29.0, 34.0, 15.0, 13.0, 12.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19446754455566406, -0.18715286254882812, -0.1798381805419922, -0.17252349853515625, -0.1652088165283203, -0.15789413452148438, -0.15057945251464844, -0.1432647705078125, -0.13595008850097656, -0.12863540649414062, -0.12132072448730469, -0.11400604248046875, -0.10669136047363281, -0.09937667846679688, -0.09206199645996094, -0.084747314453125, -0.07743263244628906, -0.07011795043945312, -0.06280326843261719, -0.05548858642578125, -0.04817390441894531, -0.040859222412109375, -0.03354454040527344, -0.0262298583984375, -0.018915176391601562, -0.011600494384765625, -0.0042858123779296875, 0.00302886962890625, 0.010343551635742188, 0.017658233642578125, 0.024972915649414062, 0.03228759765625, 0.03960227966308594, 0.046916961669921875, 0.05423164367675781, 0.06154632568359375, 0.06886100769042969, 0.07617568969726562, 0.08349037170410156, 0.0908050537109375, 0.09811973571777344, 0.10543441772460938, 0.11274909973144531, 0.12006378173828125, 0.1273784637451172, 0.13469314575195312, 0.14200782775878906, 0.149322509765625, 0.15663719177246094, 0.16395187377929688, 0.1712665557861328, 0.17858123779296875, 0.1858959197998047, 0.19321060180664062, 0.20052528381347656, 0.2078399658203125, 0.21515464782714844, 0.22246932983398438, 0.2297840118408203, 0.23709869384765625, 0.2444133758544922, 0.2517280578613281, 0.25904273986816406, 0.266357421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 9.0, 17.0, 19.0, 22.0, 52.0, 64.0, 108.0, 185.0, 174.0, 100.0, 66.0, 55.0, 35.0, 21.0, 15.0, 11.0, 11.0, 2.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.14984130859375e-05, -5.0212256610393524e-05, -4.892610013484955e-05, -4.763994365930557e-05, -4.63537871837616e-05, -4.506763070821762e-05, -4.3781474232673645e-05, -4.249531775712967e-05, -4.120916128158569e-05, -3.992300480604172e-05, -3.863684833049774e-05, -3.7350691854953766e-05, -3.606453537940979e-05, -3.4778378903865814e-05, -3.349222242832184e-05, -3.220606595277786e-05, -3.091990947723389e-05, -2.963375300168991e-05, -2.8347596526145935e-05, -2.706144005060196e-05, -2.5775283575057983e-05, -2.4489127099514008e-05, -2.3202970623970032e-05, -2.1916814148426056e-05, -2.063065767288208e-05, -1.9344501197338104e-05, -1.805834472179413e-05, -1.6772188246250153e-05, -1.5486031770706177e-05, -1.4199875295162201e-05, -1.2913718819618225e-05, -1.162756234407425e-05, -1.0341405868530273e-05, -9.055249392986298e-06, -7.769092917442322e-06, -6.482936441898346e-06, -5.19677996635437e-06, -3.910623490810394e-06, -2.6244670152664185e-06, -1.3383105397224426e-06, -5.21540641784668e-08, 1.234002411365509e-06, 2.520158886909485e-06, 3.8063153624534607e-06, 5.0924718379974365e-06, 6.378628313541412e-06, 7.664784789085388e-06, 8.950941264629364e-06, 1.023709774017334e-05, 1.1523254215717316e-05, 1.2809410691261292e-05, 1.4095567166805267e-05, 1.5381723642349243e-05, 1.666788011789322e-05, 1.7954036593437195e-05, 1.924019306898117e-05, 2.0526349544525146e-05, 2.1812506020069122e-05, 2.3098662495613098e-05, 2.4384818971157074e-05, 2.567097544670105e-05, 2.6957131922245026e-05, 2.8243288397789e-05, 2.9529444873332977e-05, 3.081560134887695e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 4.0, 15.0, 20.0, 21.0, 36.0, 45.0, 61.0, 90.0, 135.0, 233.0, 382.0, 732.0, 1360.0, 2654.0, 5972.0, 16109.0, 55539.0, 421764.0, 455298.0, 58688.0, 16824.0, 6452.0, 2797.0, 1440.0, 703.0, 387.0, 280.0, 169.0, 109.0, 71.0, 42.0, 28.0, 26.0, 17.0, 10.0, 7.0, 4.0, 2.0, 4.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.2064208984375, -0.20068931579589844, -0.19495773315429688, -0.1892261505126953, -0.18349456787109375, -0.1777629852294922, -0.17203140258789062, -0.16629981994628906, -0.1605682373046875, -0.15483665466308594, -0.14910507202148438, -0.1433734893798828, -0.13764190673828125, -0.1319103240966797, -0.12617874145507812, -0.12044715881347656, -0.114715576171875, -0.10898399353027344, -0.10325241088867188, -0.09752082824707031, -0.09178924560546875, -0.08605766296386719, -0.08032608032226562, -0.07459449768066406, -0.0688629150390625, -0.06313133239746094, -0.057399749755859375, -0.05166816711425781, -0.04593658447265625, -0.04020500183105469, -0.034473419189453125, -0.028741836547851562, -0.02301025390625, -0.017278671264648438, -0.011547088623046875, -0.0058155059814453125, -8.392333984375e-05, 0.0056476593017578125, 0.011379241943359375, 0.017110824584960938, 0.0228424072265625, 0.028573989868164062, 0.034305572509765625, 0.04003715515136719, 0.04576873779296875, 0.05150032043457031, 0.057231903076171875, 0.06296348571777344, 0.068695068359375, 0.07442665100097656, 0.08015823364257812, 0.08588981628417969, 0.09162139892578125, 0.09735298156738281, 0.10308456420898438, 0.10881614685058594, 0.1145477294921875, 0.12027931213378906, 0.12601089477539062, 0.1317424774169922, 0.13747406005859375, 0.1432056427001953, 0.14893722534179688, 0.15466880798339844, 0.160400390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 9.0, 14.0, 20.0, 19.0, 30.0, 44.0, 64.0, 104.0, 170.0, 165.0, 111.0, 61.0, 41.0, 42.0, 24.0, 19.0, 11.0, 10.0, 10.0, 5.0, 5.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09783935546875, -0.09422016143798828, -0.09060096740722656, -0.08698177337646484, -0.08336257934570312, -0.0797433853149414, -0.07612419128417969, -0.07250499725341797, -0.06888580322265625, -0.06526660919189453, -0.06164741516113281, -0.058028221130371094, -0.054409027099609375, -0.050789833068847656, -0.04717063903808594, -0.04355144500732422, -0.0399322509765625, -0.03631305694580078, -0.03269386291503906, -0.029074668884277344, -0.025455474853515625, -0.021836280822753906, -0.018217086791992188, -0.014597892761230469, -0.01097869873046875, -0.007359504699707031, -0.0037403106689453125, -0.00012111663818359375, 0.003498077392578125, 0.007117271423339844, 0.010736465454101562, 0.014355659484863281, 0.017974853515625, 0.02159404754638672, 0.025213241577148438, 0.028832435607910156, 0.032451629638671875, 0.036070823669433594, 0.03969001770019531, 0.04330921173095703, 0.04692840576171875, 0.05054759979248047, 0.05416679382324219, 0.057785987854003906, 0.061405181884765625, 0.06502437591552734, 0.06864356994628906, 0.07226276397705078, 0.0758819580078125, 0.07950115203857422, 0.08312034606933594, 0.08673954010009766, 0.09035873413085938, 0.0939779281616211, 0.09759712219238281, 0.10121631622314453, 0.10483551025390625, 0.10845470428466797, 0.11207389831542969, 0.1156930923461914, 0.11931228637695312, 0.12293148040771484, 0.12655067443847656, 0.13016986846923828, 0.1337890625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 16.0, 20.0, 54.0, 149.0, 277.0, 260.0, 127.0, 40.0, 30.0, 17.0, 3.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.733736276626587, -2.619910478591919, -2.506084680557251, -2.392258882522583, -2.278433084487915, -2.164607286453247, -2.05078125, -1.9369555711746216, -1.8231297731399536, -1.7093039751052856, -1.5954781770706177, -1.4816522598266602, -1.3678264617919922, -1.2540006637573242, -1.1401748657226562, -1.0263490676879883, -0.9125232696533203, -0.7986974716186523, -0.6848716735839844, -0.5710458159446716, -0.45722001791000366, -0.3433942198753357, -0.22956836223602295, -0.11574256420135498, -0.0019167661666870117, 0.11190904676914215, 0.2257348597049713, 0.33956068754196167, 0.45338648557662964, 0.5672122836112976, 0.6810381412506104, 0.7948639392852783, 0.9086899757385254, 1.0225157737731934, 1.1363415718078613, 1.2501673698425293, 1.3639931678771973, 1.4778189659118652, 1.5916448831558228, 1.7054706811904907, 1.8192964792251587, 1.9331222772598267, 2.046948194503784, 2.160773992538452, 2.27459979057312, 2.388425588607788, 2.502251386642456, 2.616077184677124, 2.729902982711792, 2.84372878074646, 2.957554578781128, 3.071380376815796, 3.185206174850464, 3.299031972885132, 3.412858009338379, 3.526683807373047, 3.640509605407715, 3.754335403442383, 3.868161201477051, 3.9819869995117188, 4.095812797546387, 4.209638595581055, 4.323464393615723, 4.437290191650391, 4.551115989685059]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 8.0, 4.0, 8.0, 9.0, 22.0, 24.0, 21.0, 25.0, 39.0, 43.0, 50.0, 58.0, 50.0, 60.0, 69.0, 71.0, 66.0, 58.0, 45.0, 53.0, 43.0, 24.0, 35.0, 27.0, 24.0, 18.0, 9.0, 15.0, 5.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9182522296905518, -1.840989112854004, -1.7637261152267456, -1.6864629983901978, -1.60919988155365, -1.5319368839263916, -1.4546737670898438, -1.377410650253296, -1.300147533416748, -1.2228844165802002, -1.145621418952942, -1.068358302116394, -0.9910951852798462, -0.9138321280479431, -0.83656907081604, -0.7593059539794922, -0.6820429563522339, -0.6047798991203308, -0.527516782283783, -0.4502537250518799, -0.3729906380176544, -0.29572755098342896, -0.21846449375152588, -0.14120137691497803, -0.06393831968307495, 0.013324759900569916, 0.09058783948421478, 0.16785091161727905, 0.24511399865150452, 0.32237708568573, 0.39964014291763306, 0.4769032597541809, 0.554166316986084, 0.6314293742179871, 0.7086924910545349, 0.785955548286438, 0.8632186651229858, 0.9404817223548889, 1.017744779586792, 1.0950078964233398, 1.1722710132598877, 1.2495341300964355, 1.3267971277236938, 1.4040602445602417, 1.4813233613967896, 1.5585863590240479, 1.6358494758605957, 1.7131125926971436, 1.7903755903244019, 1.8676387071609497, 1.944901704788208, 2.022164821624756, 2.0994279384613037, 2.1766910552978516, 2.2539539337158203, 2.3312172889709473, 2.408480167388916, 2.485743284225464, 2.5630064010620117, 2.6402692794799805, 2.7175323963165283, 2.794795513153076, 2.872058629989624, 2.949321746826172, 3.0265848636627197]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 2.0, 9.0, 19.0, 16.0, 17.0, 41.0, 35.0, 62.0, 119.0, 199.0, 291.0, 501.0, 917.0, 1849.0, 4175.0, 11469.0, 45690.0, 338695.0, 3172135.0, 530992.0, 62498.0, 14934.0, 5159.0, 2139.0, 1004.0, 538.0, 295.0, 174.0, 105.0, 68.0, 48.0, 30.0, 17.0, 11.0, 10.0, 10.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64794921875, -0.6215896606445312, -0.5952301025390625, -0.5688705444335938, -0.542510986328125, -0.5161514282226562, -0.4897918701171875, -0.46343231201171875, -0.43707275390625, -0.41071319580078125, -0.3843536376953125, -0.35799407958984375, -0.331634521484375, -0.30527496337890625, -0.2789154052734375, -0.25255584716796875, -0.2261962890625, -0.19983673095703125, -0.1734771728515625, -0.14711761474609375, -0.120758056640625, -0.09439849853515625, -0.0680389404296875, -0.04167938232421875, -0.01531982421875, 0.01103973388671875, 0.0373992919921875, 0.06375885009765625, 0.090118408203125, 0.11647796630859375, 0.1428375244140625, 0.16919708251953125, 0.195556640625, 0.22191619873046875, 0.2482757568359375, 0.27463531494140625, 0.300994873046875, 0.32735443115234375, 0.3537139892578125, 0.38007354736328125, 0.40643310546875, 0.43279266357421875, 0.4591522216796875, 0.48551177978515625, 0.511871337890625, 0.5382308959960938, 0.5645904541015625, 0.5909500122070312, 0.6173095703125, 0.6436691284179688, 0.6700286865234375, 0.6963882446289062, 0.722747802734375, 0.7491073608398438, 0.7754669189453125, 0.8018264770507812, 0.82818603515625, 0.8545455932617188, 0.8809051513671875, 0.9072647094726562, 0.933624267578125, 0.9599838256835938, 0.9863433837890625, 1.0127029418945312, 1.0390625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 8.0, 5.0, 17.0, 16.0, 29.0, 25.0, 34.0, 28.0, 55.0, 56.0, 65.0, 62.0, 85.0, 81.0, 66.0, 59.0, 52.0, 50.0, 43.0, 26.0, 21.0, 25.0, 16.0, 8.0, 12.0, 4.0, 4.0, 9.0, 8.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64404296875, -0.6239471435546875, -0.603851318359375, -0.5837554931640625, -0.56365966796875, -0.5435638427734375, -0.523468017578125, -0.5033721923828125, -0.4832763671875, -0.4631805419921875, -0.443084716796875, -0.4229888916015625, -0.40289306640625, -0.3827972412109375, -0.362701416015625, -0.3426055908203125, -0.322509765625, -0.3024139404296875, -0.282318115234375, -0.2622222900390625, -0.24212646484375, -0.2220306396484375, -0.201934814453125, -0.1818389892578125, -0.1617431640625, -0.1416473388671875, -0.121551513671875, -0.1014556884765625, -0.08135986328125, -0.0612640380859375, -0.041168212890625, -0.0210723876953125, -0.0009765625, 0.0191192626953125, 0.039215087890625, 0.0593109130859375, 0.07940673828125, 0.0995025634765625, 0.119598388671875, 0.1396942138671875, 0.1597900390625, 0.1798858642578125, 0.199981689453125, 0.2200775146484375, 0.24017333984375, 0.2602691650390625, 0.280364990234375, 0.3004608154296875, 0.320556640625, 0.3406524658203125, 0.360748291015625, 0.3808441162109375, 0.40093994140625, 0.4210357666015625, 0.441131591796875, 0.4612274169921875, 0.4813232421875, 0.5014190673828125, 0.521514892578125, 0.5416107177734375, 0.56170654296875, 0.5818023681640625, 0.601898193359375, 0.6219940185546875, 0.64208984375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 9.0, 14.0, 27.0, 31.0, 55.0, 112.0, 228.0, 398.0, 964.0, 2900.0, 10511.0, 69673.0, 3268452.0, 794746.0, 35887.0, 6767.0, 2042.0, 745.0, 314.0, 171.0, 94.0, 44.0, 36.0, 20.0, 11.0, 6.0, 9.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.388671875, -1.3529281616210938, -1.3171844482421875, -1.2814407348632812, -1.245697021484375, -1.2099533081054688, -1.1742095947265625, -1.1384658813476562, -1.10272216796875, -1.0669784545898438, -1.0312347412109375, -0.9954910278320312, -0.959747314453125, -0.9240036010742188, -0.8882598876953125, -0.8525161743164062, -0.8167724609375, -0.7810287475585938, -0.7452850341796875, -0.7095413208007812, -0.673797607421875, -0.6380538940429688, -0.6023101806640625, -0.5665664672851562, -0.53082275390625, -0.49507904052734375, -0.4593353271484375, -0.42359161376953125, -0.387847900390625, -0.35210418701171875, -0.3163604736328125, -0.28061676025390625, -0.244873046875, -0.20912933349609375, -0.1733856201171875, -0.13764190673828125, -0.101898193359375, -0.06615447998046875, -0.0304107666015625, 0.00533294677734375, 0.04107666015625, 0.07682037353515625, 0.1125640869140625, 0.14830780029296875, 0.184051513671875, 0.21979522705078125, 0.2555389404296875, 0.29128265380859375, 0.3270263671875, 0.36277008056640625, 0.3985137939453125, 0.43425750732421875, 0.470001220703125, 0.5057449340820312, 0.5414886474609375, 0.5772323608398438, 0.61297607421875, 0.6487197875976562, 0.6844635009765625, 0.7202072143554688, 0.755950927734375, 0.7916946411132812, 0.8274383544921875, 0.8631820678710938, 0.89892578125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 7.0, 15.0, 21.0, 20.0, 32.0, 56.0, 89.0, 146.0, 274.0, 546.0, 986.0, 887.0, 438.0, 201.0, 116.0, 83.0, 33.0, 30.0, 24.0, 16.0, 13.0, 14.0, 5.0, 2.0, 2.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.234375, -0.22564315795898438, -0.21691131591796875, -0.20817947387695312, -0.1994476318359375, -0.19071578979492188, -0.18198394775390625, -0.17325210571289062, -0.164520263671875, -0.15578842163085938, -0.14705657958984375, -0.13832473754882812, -0.1295928955078125, -0.12086105346679688, -0.11212921142578125, -0.10339736938476562, -0.09466552734375, -0.08593368530273438, -0.07720184326171875, -0.06847000122070312, -0.0597381591796875, -0.051006317138671875, -0.04227447509765625, -0.033542633056640625, -0.024810791015625, -0.016078948974609375, -0.00734710693359375, 0.001384735107421875, 0.0101165771484375, 0.018848419189453125, 0.02758026123046875, 0.036312103271484375, 0.0450439453125, 0.053775787353515625, 0.06250762939453125, 0.07123947143554688, 0.0799713134765625, 0.08870315551757812, 0.09743499755859375, 0.10616683959960938, 0.114898681640625, 0.12363052368164062, 0.13236236572265625, 0.14109420776367188, 0.1498260498046875, 0.15855789184570312, 0.16728973388671875, 0.17602157592773438, 0.18475341796875, 0.19348526000976562, 0.20221710205078125, 0.21094894409179688, 0.2196807861328125, 0.22841262817382812, 0.23714447021484375, 0.24587631225585938, 0.254608154296875, 0.2633399963378906, 0.27207183837890625, 0.2808036804199219, 0.2895355224609375, 0.2982673645019531, 0.30699920654296875, 0.3157310485839844, 0.324462890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 10.0, 8.0, 14.0, 19.0, 34.0, 37.0, 70.0, 107.0, 121.0, 148.0, 111.0, 89.0, 73.0, 48.0, 35.0, 19.0, 11.0, 8.0, 7.0, 3.0, 9.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3823992013931274, -1.3455817699432373, -1.3087643384933472, -1.271946907043457, -1.235129475593567, -1.1983120441436768, -1.161494493484497, -1.124677062034607, -1.0878596305847168, -1.0510421991348267, -1.0142247676849365, -0.9774073362350464, -0.9405898451805115, -0.9037724137306213, -0.8669549822807312, -0.8301374912261963, -0.7933201193809509, -0.7565026879310608, -0.7196852564811707, -0.6828677654266357, -0.6460503339767456, -0.6092329025268555, -0.5724154710769653, -0.5355980396270752, -0.49878057837486267, -0.46196314692497253, -0.42514568567276, -0.3883282542228699, -0.35151082277297974, -0.3146933615207672, -0.2778759300708771, -0.24105846881866455, -0.20424097776412964, -0.1674235314130783, -0.13060608506202698, -0.09378865361213684, -0.05697120726108551, -0.02015376091003418, 0.016663670539855957, 0.05348113179206848, 0.09029856324195862, 0.12711600959300995, 0.16393345594406128, 0.20075088739395142, 0.23756833374500275, 0.2743857800960541, 0.3112032115459442, 0.34802067279815674, 0.3848381042480469, 0.421655535697937, 0.45847299695014954, 0.4952904284000397, 0.5321078896522522, 0.5689253211021423, 0.6057427525520325, 0.6425602436065674, 0.6793776750564575, 0.7161951065063477, 0.7530125379562378, 0.7898299694061279, 0.8266474604606628, 0.863464891910553, 0.9002823233604431, 0.937099814414978, 0.9739171862602234]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 8.0, 5.0, 6.0, 8.0, 13.0, 3.0, 16.0, 14.0, 21.0, 28.0, 32.0, 35.0, 53.0, 56.0, 60.0, 54.0, 56.0, 59.0, 65.0, 66.0, 45.0, 42.0, 40.0, 44.0, 25.0, 25.0, 26.0, 26.0, 17.0, 8.0, 6.0, 10.0, 8.0, 2.0, 5.0, 3.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.631807267665863, -0.612474262714386, -0.5931412577629089, -0.5738082528114319, -0.5544752478599548, -0.5351423025131226, -0.5158092975616455, -0.49647629261016846, -0.4771432876586914, -0.45781028270721436, -0.4384772777557373, -0.41914427280426025, -0.3998112976551056, -0.38047829270362854, -0.3611452877521515, -0.3418123126029968, -0.3224792778491974, -0.30314627289772034, -0.2838132679462433, -0.2644802927970886, -0.24514728784561157, -0.22581428289413452, -0.20648127794265747, -0.1871482878923416, -0.16781528294086456, -0.1484822779893875, -0.12914928793907166, -0.1098162829875946, -0.09048328548669815, -0.0711502879858017, -0.051817283034324646, -0.03248429298400879, -0.013151288032531738, 0.006181711331009865, 0.025514710694551468, 0.04484771192073822, 0.06418070942163467, 0.08351370692253113, 0.10284671187400818, 0.12217970192432404, 0.1415127068758011, 0.16084571182727814, 0.180178701877594, 0.19951170682907104, 0.2188447117805481, 0.23817770183086395, 0.2575107216835022, 0.27684369683265686, 0.2961767017841339, 0.31550970673561096, 0.334842711687088, 0.3541756868362427, 0.3735086917877197, 0.3928416967391968, 0.41217470169067383, 0.4315077066421509, 0.45084071159362793, 0.470173716545105, 0.48950672149658203, 0.5088397264480591, 0.5281727313995361, 0.5475057363510132, 0.5668387413024902, 0.5861716866493225, 0.6055046916007996]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 8.0, 4.0, 8.0, 10.0, 17.0, 33.0, 26.0, 50.0, 54.0, 89.0, 134.0, 174.0, 278.0, 413.0, 673.0, 995.0, 1754.0, 3150.0, 5881.0, 12147.0, 27211.0, 71436.0, 230319.0, 415436.0, 176507.0, 56894.0, 22633.0, 10192.0, 5104.0, 2697.0, 1510.0, 923.0, 606.0, 362.0, 265.0, 150.0, 125.0, 78.0, 57.0, 45.0, 37.0, 16.0, 17.0, 8.0, 5.0, 7.0, 9.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.09930419921875, -0.09641647338867188, -0.09352874755859375, -0.09064102172851562, -0.0877532958984375, -0.08486557006835938, -0.08197784423828125, -0.07909011840820312, -0.076202392578125, -0.07331466674804688, -0.07042694091796875, -0.06753921508789062, -0.0646514892578125, -0.061763763427734375, -0.05887603759765625, -0.055988311767578125, -0.0531005859375, -0.050212860107421875, -0.04732513427734375, -0.044437408447265625, -0.0415496826171875, -0.038661956787109375, -0.03577423095703125, -0.032886505126953125, -0.029998779296875, -0.027111053466796875, -0.02422332763671875, -0.021335601806640625, -0.0184478759765625, -0.015560150146484375, -0.01267242431640625, -0.009784698486328125, -0.00689697265625, -0.004009246826171875, -0.00112152099609375, 0.001766204833984375, 0.0046539306640625, 0.007541656494140625, 0.01042938232421875, 0.013317108154296875, 0.016204833984375, 0.019092559814453125, 0.02198028564453125, 0.024868011474609375, 0.0277557373046875, 0.030643463134765625, 0.03353118896484375, 0.036418914794921875, 0.039306640625, 0.042194366455078125, 0.04508209228515625, 0.047969818115234375, 0.0508575439453125, 0.053745269775390625, 0.05663299560546875, 0.059520721435546875, 0.062408447265625, 0.06529617309570312, 0.06818389892578125, 0.07107162475585938, 0.0739593505859375, 0.07684707641601562, 0.07973480224609375, 0.08262252807617188, 0.08551025390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 8.0, 14.0, 9.0, 17.0, 17.0, 28.0, 21.0, 41.0, 52.0, 59.0, 53.0, 67.0, 59.0, 54.0, 73.0, 64.0, 53.0, 43.0, 43.0, 38.0, 32.0, 27.0, 27.0, 21.0, 15.0, 10.0, 7.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.416259765625, -0.4026756286621094, -0.38909149169921875, -0.3755073547363281, -0.3619232177734375, -0.3483390808105469, -0.33475494384765625, -0.3211708068847656, -0.307586669921875, -0.2940025329589844, -0.28041839599609375, -0.2668342590332031, -0.2532501220703125, -0.23966598510742188, -0.22608184814453125, -0.21249771118164062, -0.19891357421875, -0.18532943725585938, -0.17174530029296875, -0.15816116333007812, -0.1445770263671875, -0.13099288940429688, -0.11740875244140625, -0.10382461547851562, -0.090240478515625, -0.07665634155273438, -0.06307220458984375, -0.049488067626953125, -0.0359039306640625, -0.022319793701171875, -0.00873565673828125, 0.004848480224609375, 0.0184326171875, 0.032016754150390625, 0.04560089111328125, 0.059185028076171875, 0.0727691650390625, 0.08635330200195312, 0.09993743896484375, 0.11352157592773438, 0.127105712890625, 0.14068984985351562, 0.15427398681640625, 0.16785812377929688, 0.1814422607421875, 0.19502639770507812, 0.20861053466796875, 0.22219467163085938, 0.23577880859375, 0.24936294555664062, 0.26294708251953125, 0.2765312194824219, 0.2901153564453125, 0.3036994934082031, 0.31728363037109375, 0.3308677673339844, 0.344451904296875, 0.3580360412597656, 0.37162017822265625, 0.3852043151855469, 0.3987884521484375, 0.4123725891113281, 0.42595672607421875, 0.4395408630371094, 0.453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 2.0, 4.0, 9.0, 13.0, 17.0, 18.0, 19.0, 27.0, 64.0, 106.0, 210.0, 377.0, 760.0, 2228.0, 8085.0, 52065.0, 598575.0, 348275.0, 29578.0, 5297.0, 1585.0, 570.0, 263.0, 151.0, 83.0, 54.0, 37.0, 21.0, 19.0, 8.0, 5.0, 5.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1773681640625, -0.17162132263183594, -0.16587448120117188, -0.1601276397705078, -0.15438079833984375, -0.1486339569091797, -0.14288711547851562, -0.13714027404785156, -0.1313934326171875, -0.12564659118652344, -0.11989974975585938, -0.11415290832519531, -0.10840606689453125, -0.10265922546386719, -0.09691238403320312, -0.09116554260253906, -0.085418701171875, -0.07967185974121094, -0.07392501831054688, -0.06817817687988281, -0.06243133544921875, -0.05668449401855469, -0.050937652587890625, -0.04519081115722656, -0.0394439697265625, -0.03369712829589844, -0.027950286865234375, -0.022203445434570312, -0.01645660400390625, -0.010709762573242188, -0.004962921142578125, 0.0007839202880859375, 0.00653076171875, 0.012277603149414062, 0.018024444580078125, 0.023771286010742188, 0.02951812744140625, 0.03526496887207031, 0.041011810302734375, 0.04675865173339844, 0.0525054931640625, 0.05825233459472656, 0.06399917602539062, 0.06974601745605469, 0.07549285888671875, 0.08123970031738281, 0.08698654174804688, 0.09273338317871094, 0.098480224609375, 0.10422706604003906, 0.10997390747070312, 0.11572074890136719, 0.12146759033203125, 0.1272144317626953, 0.13296127319335938, 0.13870811462402344, 0.1444549560546875, 0.15020179748535156, 0.15594863891601562, 0.1616954803466797, 0.16744232177734375, 0.1731891632080078, 0.17893600463867188, 0.18468284606933594, 0.1904296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 5.0, 10.0, 5.0, 13.0, 19.0, 20.0, 21.0, 26.0, 38.0, 35.0, 45.0, 41.0, 44.0, 55.0, 49.0, 43.0, 50.0, 62.0, 46.0, 38.0, 49.0, 47.0, 45.0, 26.0, 33.0, 30.0, 29.0, 11.0, 16.0, 13.0, 9.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87548828125, -0.8513031005859375, -0.827117919921875, -0.8029327392578125, -0.77874755859375, -0.7545623779296875, -0.730377197265625, -0.7061920166015625, -0.6820068359375, -0.6578216552734375, -0.633636474609375, -0.6094512939453125, -0.58526611328125, -0.5610809326171875, -0.536895751953125, -0.5127105712890625, -0.488525390625, -0.4643402099609375, -0.440155029296875, -0.4159698486328125, -0.39178466796875, -0.3675994873046875, -0.343414306640625, -0.3192291259765625, -0.2950439453125, -0.2708587646484375, -0.246673583984375, -0.2224884033203125, -0.19830322265625, -0.1741180419921875, -0.149932861328125, -0.1257476806640625, -0.1015625, -0.0773773193359375, -0.053192138671875, -0.0290069580078125, -0.00482177734375, 0.0193634033203125, 0.043548583984375, 0.0677337646484375, 0.0919189453125, 0.1161041259765625, 0.140289306640625, 0.1644744873046875, 0.18865966796875, 0.2128448486328125, 0.237030029296875, 0.2612152099609375, 0.285400390625, 0.3095855712890625, 0.333770751953125, 0.3579559326171875, 0.38214111328125, 0.4063262939453125, 0.430511474609375, 0.4546966552734375, 0.4788818359375, 0.5030670166015625, 0.527252197265625, 0.5514373779296875, 0.57562255859375, 0.5998077392578125, 0.623992919921875, 0.6481781005859375, 0.67236328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 6.0, 14.0, 22.0, 26.0, 55.0, 71.0, 158.0, 314.0, 615.0, 1652.0, 5985.0, 35530.0, 561015.0, 408028.0, 27236.0, 5156.0, 1455.0, 597.0, 265.0, 137.0, 82.0, 45.0, 21.0, 18.0, 12.0, 6.0, 3.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.09014892578125, -0.0877084732055664, -0.08526802062988281, -0.08282756805419922, -0.08038711547851562, -0.07794666290283203, -0.07550621032714844, -0.07306575775146484, -0.07062530517578125, -0.06818485260009766, -0.06574440002441406, -0.06330394744873047, -0.060863494873046875, -0.05842304229736328, -0.05598258972167969, -0.053542137145996094, -0.0511016845703125, -0.048661231994628906, -0.04622077941894531, -0.04378032684326172, -0.041339874267578125, -0.03889942169189453, -0.03645896911621094, -0.034018516540527344, -0.03157806396484375, -0.029137611389160156, -0.026697158813476562, -0.02425670623779297, -0.021816253662109375, -0.01937580108642578, -0.016935348510742188, -0.014494895935058594, -0.012054443359375, -0.009613990783691406, -0.0071735382080078125, -0.004733085632324219, -0.002292633056640625, 0.00014781951904296875, 0.0025882720947265625, 0.005028724670410156, 0.00746917724609375, 0.009909629821777344, 0.012350082397460938, 0.014790534973144531, 0.017230987548828125, 0.01967144012451172, 0.022111892700195312, 0.024552345275878906, 0.0269927978515625, 0.029433250427246094, 0.03187370300292969, 0.03431415557861328, 0.036754608154296875, 0.03919506072998047, 0.04163551330566406, 0.044075965881347656, 0.04651641845703125, 0.048956871032714844, 0.05139732360839844, 0.05383777618408203, 0.056278228759765625, 0.05871868133544922, 0.06115913391113281, 0.0635995864868164, 0.0660400390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 8.0, 8.0, 25.0, 35.0, 40.0, 62.0, 73.0, 96.0, 85.0, 118.0, 102.0, 92.0, 70.0, 48.0, 28.0, 22.0, 19.0, 16.0, 8.0, 4.0, 5.0, 7.0, 9.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2232532501220703e-05, -2.1447427570819855e-05, -2.0662322640419006e-05, -1.9877217710018158e-05, -1.909211277961731e-05, -1.830700784921646e-05, -1.7521902918815613e-05, -1.6736797988414764e-05, -1.5951693058013916e-05, -1.5166588127613068e-05, -1.438148319721222e-05, -1.3596378266811371e-05, -1.2811273336410522e-05, -1.2026168406009674e-05, -1.1241063475608826e-05, -1.0455958545207977e-05, -9.670853614807129e-06, -8.88574868440628e-06, -8.100643754005432e-06, -7.315538823604584e-06, -6.530433893203735e-06, -5.745328962802887e-06, -4.9602240324020386e-06, -4.17511910200119e-06, -3.390014171600342e-06, -2.6049092411994934e-06, -1.819804310798645e-06, -1.0346993803977966e-06, -2.4959444999694824e-07, 5.355104804039001e-07, 1.3206154108047485e-06, 2.105720341205597e-06, 2.8908252716064453e-06, 3.6759302020072937e-06, 4.461035132408142e-06, 5.2461400628089905e-06, 6.031244993209839e-06, 6.816349923610687e-06, 7.601454854011536e-06, 8.386559784412384e-06, 9.171664714813232e-06, 9.95676964521408e-06, 1.074187457561493e-05, 1.1526979506015778e-05, 1.2312084436416626e-05, 1.3097189366817474e-05, 1.3882294297218323e-05, 1.4667399227619171e-05, 1.545250415802002e-05, 1.6237609088420868e-05, 1.7022714018821716e-05, 1.7807818949222565e-05, 1.8592923879623413e-05, 1.937802881002426e-05, 2.016313374042511e-05, 2.0948238670825958e-05, 2.1733343601226807e-05, 2.2518448531627655e-05, 2.3303553462028503e-05, 2.4088658392429352e-05, 2.48737633228302e-05, 2.565886825323105e-05, 2.6443973183631897e-05, 2.7229078114032745e-05, 2.8014183044433594e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 12.0, 12.0, 13.0, 12.0, 32.0, 37.0, 71.0, 91.0, 155.0, 213.0, 399.0, 723.0, 1404.0, 3170.0, 7749.0, 21102.0, 69984.0, 286146.0, 463992.0, 135503.0, 36359.0, 12181.0, 4718.0, 2077.0, 1006.0, 534.0, 296.0, 184.0, 123.0, 73.0, 44.0, 26.0, 19.0, 20.0, 18.0, 11.0, 8.0, 10.0, 4.0, 5.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04132080078125, -0.03999805450439453, -0.03867530822753906, -0.037352561950683594, -0.036029815673828125, -0.034707069396972656, -0.03338432312011719, -0.03206157684326172, -0.03073883056640625, -0.02941608428955078, -0.028093338012695312, -0.026770591735839844, -0.025447845458984375, -0.024125099182128906, -0.022802352905273438, -0.02147960662841797, -0.0201568603515625, -0.01883411407470703, -0.017511367797851562, -0.016188621520996094, -0.014865875244140625, -0.013543128967285156, -0.012220382690429688, -0.010897636413574219, -0.00957489013671875, -0.008252143859863281, -0.0069293975830078125, -0.005606651306152344, -0.004283905029296875, -0.0029611587524414062, -0.0016384124755859375, -0.00031566619873046875, 0.001007080078125, 0.0023298263549804688, 0.0036525726318359375, 0.004975318908691406, 0.006298065185546875, 0.007620811462402344, 0.008943557739257812, 0.010266304016113281, 0.01158905029296875, 0.012911796569824219, 0.014234542846679688, 0.015557289123535156, 0.016880035400390625, 0.018202781677246094, 0.019525527954101562, 0.02084827423095703, 0.0221710205078125, 0.02349376678466797, 0.024816513061523438, 0.026139259338378906, 0.027462005615234375, 0.028784751892089844, 0.030107498168945312, 0.03143024444580078, 0.03275299072265625, 0.03407573699951172, 0.03539848327636719, 0.036721229553222656, 0.038043975830078125, 0.039366722106933594, 0.04068946838378906, 0.04201221466064453, 0.0433349609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 12.0, 12.0, 10.0, 21.0, 23.0, 30.0, 40.0, 61.0, 71.0, 122.0, 110.0, 98.0, 104.0, 70.0, 53.0, 41.0, 27.0, 16.0, 20.0, 18.0, 14.0, 7.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01129913330078125, -0.01082456111907959, -0.01034998893737793, -0.00987541675567627, -0.00940084457397461, -0.00892627239227295, -0.008451700210571289, -0.007977128028869629, -0.007502555847167969, -0.007027983665466309, -0.0065534114837646484, -0.006078839302062988, -0.005604267120361328, -0.005129694938659668, -0.004655122756958008, -0.004180550575256348, -0.0037059783935546875, -0.0032314062118530273, -0.002756834030151367, -0.002282261848449707, -0.0018076896667480469, -0.0013331174850463867, -0.0008585453033447266, -0.0003839731216430664, 9.059906005859375e-05, 0.0005651712417602539, 0.001039743423461914, 0.0015143156051635742, 0.0019888877868652344, 0.0024634599685668945, 0.0029380321502685547, 0.003412604331970215, 0.003887176513671875, 0.004361748695373535, 0.004836320877075195, 0.0053108930587768555, 0.005785465240478516, 0.006260037422180176, 0.006734609603881836, 0.007209181785583496, 0.007683753967285156, 0.008158326148986816, 0.008632898330688477, 0.009107470512390137, 0.009582042694091797, 0.010056614875793457, 0.010531187057495117, 0.011005759239196777, 0.011480331420898438, 0.011954903602600098, 0.012429475784301758, 0.012904047966003418, 0.013378620147705078, 0.013853192329406738, 0.014327764511108398, 0.014802336692810059, 0.015276908874511719, 0.01575148105621338, 0.01622605323791504, 0.0167006254196167, 0.01717519760131836, 0.01764976978302002, 0.01812434196472168, 0.01859891414642334, 0.019073486328125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 11.0, 12.0, 23.0, 29.0, 70.0, 132.0, 177.0, 215.0, 124.0, 87.0, 42.0, 23.0, 19.0, 9.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0850715637207031, -1.052314043045044, -1.0195565223693848, -0.9867991209030151, -0.954041600227356, -0.9212840795516968, -0.8885266184806824, -0.855769157409668, -0.8230116367340088, -0.7902541160583496, -0.7574966549873352, -0.7247391939163208, -0.6919816732406616, -0.6592241525650024, -0.626466691493988, -0.5937092304229736, -0.5609517097473145, -0.5281941890716553, -0.49543672800064087, -0.4626792371273041, -0.4299217462539673, -0.3971642553806305, -0.3644067645072937, -0.3316492736339569, -0.2988917827606201, -0.2661342918872833, -0.23337680101394653, -0.20061931014060974, -0.16786181926727295, -0.13510432839393616, -0.10234683752059937, -0.06958934664726257, -0.03683185577392578, -0.004074364900588989, 0.028683125972747803, 0.061440616846084595, 0.09419810771942139, 0.12695559859275818, 0.15971308946609497, 0.19247058033943176, 0.22522807121276855, 0.25798556208610535, 0.29074305295944214, 0.32350054383277893, 0.3562580347061157, 0.3890155255794525, 0.4217730164527893, 0.4545305073261261, 0.4872879981994629, 0.5200455188751221, 0.5528029799461365, 0.5855604410171509, 0.6183179616928101, 0.6510754823684692, 0.6838329434394836, 0.716590404510498, 0.7493479251861572, 0.7821054458618164, 0.8148629069328308, 0.8476203680038452, 0.8803778886795044, 0.9131354093551636, 0.945892870426178, 0.9786503314971924, 1.0114078521728516]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 6.0, 5.0, 10.0, 5.0, 8.0, 17.0, 8.0, 20.0, 36.0, 34.0, 39.0, 63.0, 67.0, 69.0, 73.0, 62.0, 67.0, 71.0, 52.0, 53.0, 53.0, 34.0, 20.0, 28.0, 29.0, 18.0, 8.0, 6.0, 11.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.4573909044265747, -0.44344955682754517, -0.429508239030838, -0.41556689143180847, -0.40162554383277893, -0.3876842260360718, -0.37374287843704224, -0.3598015308380127, -0.34586021304130554, -0.331918865442276, -0.31797754764556885, -0.3040362000465393, -0.29009485244750977, -0.2761535346508026, -0.26221218705177307, -0.24827085435390472, -0.23432950675487518, -0.22038817405700684, -0.2064468264579773, -0.19250549376010895, -0.1785641610622406, -0.16462281346321106, -0.1506814807653427, -0.13674014806747437, -0.12279880791902542, -0.10885746777057648, -0.09491613507270813, -0.08097479492425919, -0.06703345477581024, -0.053092122077941895, -0.03915078192949295, -0.025209449231624603, -0.01126810908317566, 0.002673228271305561, 0.01661456562578678, 0.030555903911590576, 0.04449724033474922, 0.05843857675790787, 0.07237991690635681, 0.08632124960422516, 0.1002625897526741, 0.11420392990112305, 0.1281452625989914, 0.14208659529685974, 0.15602794289588928, 0.16996927559375763, 0.18391060829162598, 0.19785195589065552, 0.21179328858852386, 0.2257346212863922, 0.23967596888542175, 0.2536172866821289, 0.26755863428115845, 0.281499981880188, 0.29544132947921753, 0.3093826472759247, 0.3233239948749542, 0.33726534247398376, 0.3512066602706909, 0.36514800786972046, 0.37908935546875, 0.39303067326545715, 0.4069720208644867, 0.42091333866119385, 0.4348546862602234]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 7.0, 9.0, 24.0, 23.0, 41.0, 62.0, 96.0, 177.0, 320.0, 537.0, 1203.0, 2500.0, 5946.0, 15385.0, 47213.0, 210176.0, 575753.0, 133941.0, 34315.0, 11868.0, 4718.0, 2114.0, 987.0, 477.0, 259.0, 145.0, 83.0, 57.0, 36.0, 22.0, 15.0, 10.0, 19.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.50244140625, -0.4873847961425781, -0.47232818603515625, -0.4572715759277344, -0.4422149658203125, -0.4271583557128906, -0.41210174560546875, -0.3970451354980469, -0.381988525390625, -0.3669319152832031, -0.35187530517578125, -0.3368186950683594, -0.3217620849609375, -0.3067054748535156, -0.29164886474609375, -0.2765922546386719, -0.26153564453125, -0.24647903442382812, -0.23142242431640625, -0.21636581420898438, -0.2013092041015625, -0.18625259399414062, -0.17119598388671875, -0.15613937377929688, -0.141082763671875, -0.12602615356445312, -0.11096954345703125, -0.09591293334960938, -0.0808563232421875, -0.06579971313476562, -0.05074310302734375, -0.035686492919921875, -0.0206298828125, -0.005573272705078125, 0.00948333740234375, 0.024539947509765625, 0.0395965576171875, 0.054653167724609375, 0.06970977783203125, 0.08476638793945312, 0.099822998046875, 0.11487960815429688, 0.12993621826171875, 0.14499282836914062, 0.1600494384765625, 0.17510604858398438, 0.19016265869140625, 0.20521926879882812, 0.22027587890625, 0.23533248901367188, 0.25038909912109375, 0.2654457092285156, 0.2805023193359375, 0.2955589294433594, 0.31061553955078125, 0.3256721496582031, 0.340728759765625, 0.3557853698730469, 0.37084197998046875, 0.3858985900878906, 0.4009552001953125, 0.4160118103027344, 0.43106842041015625, 0.4461250305175781, 0.461181640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 6.0, 8.0, 9.0, 5.0, 11.0, 24.0, 20.0, 31.0, 42.0, 40.0, 43.0, 52.0, 56.0, 55.0, 69.0, 67.0, 62.0, 62.0, 47.0, 45.0, 36.0, 42.0, 34.0, 24.0, 24.0, 14.0, 15.0, 9.0, 6.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.97119140625, -0.94097900390625, -0.9107666015625, -0.88055419921875, -0.850341796875, -0.82012939453125, -0.7899169921875, -0.75970458984375, -0.7294921875, -0.69927978515625, -0.6690673828125, -0.63885498046875, -0.608642578125, -0.57843017578125, -0.5482177734375, -0.51800537109375, -0.48779296875, -0.45758056640625, -0.4273681640625, -0.39715576171875, -0.366943359375, -0.33673095703125, -0.3065185546875, -0.27630615234375, -0.24609375, -0.21588134765625, -0.1856689453125, -0.15545654296875, -0.125244140625, -0.09503173828125, -0.0648193359375, -0.03460693359375, -0.00439453125, 0.02581787109375, 0.0560302734375, 0.08624267578125, 0.116455078125, 0.14666748046875, 0.1768798828125, 0.20709228515625, 0.2373046875, 0.26751708984375, 0.2977294921875, 0.32794189453125, 0.358154296875, 0.38836669921875, 0.4185791015625, 0.44879150390625, 0.47900390625, 0.50921630859375, 0.5394287109375, 0.56964111328125, 0.599853515625, 0.63006591796875, 0.6602783203125, 0.69049072265625, 0.720703125, 0.75091552734375, 0.7811279296875, 0.81134033203125, 0.841552734375, 0.87176513671875, 0.9019775390625, 0.93218994140625, 0.96240234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 6.0, 9.0, 17.0, 19.0, 29.0, 27.0, 23.0, 32.0, 59.0, 66.0, 98.0, 177.0, 230.0, 401.0, 629.0, 1235.0, 2748.0, 7066.0, 22403.0, 98055.0, 588388.0, 261147.0, 44751.0, 12539.0, 4301.0, 1798.0, 877.0, 443.0, 285.0, 196.0, 131.0, 108.0, 52.0, 56.0, 44.0, 35.0, 18.0, 14.0, 9.0, 4.0, 8.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40869140625, -0.39582061767578125, -0.3829498291015625, -0.37007904052734375, -0.357208251953125, -0.34433746337890625, -0.3314666748046875, -0.31859588623046875, -0.30572509765625, -0.29285430908203125, -0.2799835205078125, -0.26711273193359375, -0.254241943359375, -0.24137115478515625, -0.2285003662109375, -0.21562957763671875, -0.2027587890625, -0.18988800048828125, -0.1770172119140625, -0.16414642333984375, -0.151275634765625, -0.13840484619140625, -0.1255340576171875, -0.11266326904296875, -0.09979248046875, -0.08692169189453125, -0.0740509033203125, -0.06118011474609375, -0.048309326171875, -0.03543853759765625, -0.0225677490234375, -0.00969696044921875, 0.003173828125, 0.01604461669921875, 0.0289154052734375, 0.04178619384765625, 0.054656982421875, 0.06752777099609375, 0.0803985595703125, 0.09326934814453125, 0.10614013671875, 0.11901092529296875, 0.1318817138671875, 0.14475250244140625, 0.157623291015625, 0.17049407958984375, 0.1833648681640625, 0.19623565673828125, 0.2091064453125, 0.22197723388671875, 0.2348480224609375, 0.24771881103515625, 0.260589599609375, 0.27346038818359375, 0.2863311767578125, 0.29920196533203125, 0.31207275390625, 0.32494354248046875, 0.3378143310546875, 0.35068511962890625, 0.363555908203125, 0.37642669677734375, 0.3892974853515625, 0.40216827392578125, 0.4150390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 6.0, 8.0, 8.0, 6.0, 9.0, 12.0, 27.0, 20.0, 21.0, 30.0, 30.0, 38.0, 33.0, 38.0, 40.0, 45.0, 36.0, 48.0, 56.0, 47.0, 42.0, 45.0, 38.0, 50.0, 46.0, 38.0, 27.0, 19.0, 29.0, 19.0, 11.0, 21.0, 12.0, 10.0, 12.0, 8.0, 7.0, 1.0, 4.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0451278686523438, -1.0150604248046875, -0.9849929809570312, -0.954925537109375, -0.9248580932617188, -0.8947906494140625, -0.8647232055664062, -0.83465576171875, -0.8045883178710938, -0.7745208740234375, -0.7444534301757812, -0.714385986328125, -0.6843185424804688, -0.6542510986328125, -0.6241836547851562, -0.5941162109375, -0.5640487670898438, -0.5339813232421875, -0.5039138793945312, -0.473846435546875, -0.44377899169921875, -0.4137115478515625, -0.38364410400390625, -0.35357666015625, -0.32350921630859375, -0.2934417724609375, -0.26337432861328125, -0.233306884765625, -0.20323944091796875, -0.1731719970703125, -0.14310455322265625, -0.113037109375, -0.08296966552734375, -0.0529022216796875, -0.02283477783203125, 0.007232666015625, 0.03730010986328125, 0.0673675537109375, 0.09743499755859375, 0.12750244140625, 0.15756988525390625, 0.1876373291015625, 0.21770477294921875, 0.247772216796875, 0.27783966064453125, 0.3079071044921875, 0.33797454833984375, 0.3680419921875, 0.39810943603515625, 0.4281768798828125, 0.45824432373046875, 0.488311767578125, 0.5183792114257812, 0.5484466552734375, 0.5785140991210938, 0.60858154296875, 0.6386489868164062, 0.6687164306640625, 0.6987838745117188, 0.728851318359375, 0.7589187622070312, 0.7889862060546875, 0.8190536499023438, 0.84912109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 12.0, 9.0, 13.0, 13.0, 33.0, 50.0, 63.0, 90.0, 170.0, 326.0, 600.0, 1349.0, 3766.0, 15681.0, 100572.0, 705225.0, 187045.0, 24805.0, 5418.0, 1765.0, 712.0, 327.0, 190.0, 108.0, 60.0, 49.0, 30.0, 19.0, 19.0, 6.0, 9.0, 7.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1937255859375, -0.18740272521972656, -0.18107986450195312, -0.1747570037841797, -0.16843414306640625, -0.1621112823486328, -0.15578842163085938, -0.14946556091308594, -0.1431427001953125, -0.13681983947753906, -0.13049697875976562, -0.12417411804199219, -0.11785125732421875, -0.11152839660644531, -0.10520553588867188, -0.09888267517089844, -0.092559814453125, -0.08623695373535156, -0.07991409301757812, -0.07359123229980469, -0.06726837158203125, -0.06094551086425781, -0.054622650146484375, -0.04829978942871094, -0.0419769287109375, -0.03565406799316406, -0.029331207275390625, -0.023008346557617188, -0.01668548583984375, -0.010362625122070312, -0.004039764404296875, 0.0022830963134765625, 0.00860595703125, 0.014928817749023438, 0.021251678466796875, 0.027574539184570312, 0.03389739990234375, 0.04022026062011719, 0.046543121337890625, 0.05286598205566406, 0.0591888427734375, 0.06551170349121094, 0.07183456420898438, 0.07815742492675781, 0.08448028564453125, 0.09080314636230469, 0.09712600708007812, 0.10344886779785156, 0.109771728515625, 0.11609458923339844, 0.12241744995117188, 0.1287403106689453, 0.13506317138671875, 0.1413860321044922, 0.14770889282226562, 0.15403175354003906, 0.1603546142578125, 0.16667747497558594, 0.17300033569335938, 0.1793231964111328, 0.18564605712890625, 0.1919689178466797, 0.19829177856445312, 0.20461463928222656, 0.2109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 20.0, 16.0, 27.0, 26.0, 48.0, 78.0, 105.0, 153.0, 148.0, 114.0, 80.0, 51.0, 33.0, 28.0, 11.0, 20.0, 12.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.315376281738281e-05, -4.189833998680115e-05, -4.064291715621948e-05, -3.938749432563782e-05, -3.813207149505615e-05, -3.687664866447449e-05, -3.562122583389282e-05, -3.436580300331116e-05, -3.311038017272949e-05, -3.185495734214783e-05, -3.059953451156616e-05, -2.9344111680984497e-05, -2.8088688850402832e-05, -2.6833266019821167e-05, -2.5577843189239502e-05, -2.4322420358657837e-05, -2.3066997528076172e-05, -2.1811574697494507e-05, -2.0556151866912842e-05, -1.9300729036331177e-05, -1.8045306205749512e-05, -1.6789883375167847e-05, -1.553446054458618e-05, -1.4279037714004517e-05, -1.3023614883422852e-05, -1.1768192052841187e-05, -1.0512769222259521e-05, -9.257346391677856e-06, -8.001923561096191e-06, -6.746500730514526e-06, -5.491077899932861e-06, -4.235655069351196e-06, -2.9802322387695312e-06, -1.7248094081878662e-06, -4.6938657760620117e-07, 7.860362529754639e-07, 2.041459083557129e-06, 3.296881914138794e-06, 4.552304744720459e-06, 5.807727575302124e-06, 7.063150405883789e-06, 8.318573236465454e-06, 9.573996067047119e-06, 1.0829418897628784e-05, 1.208484172821045e-05, 1.3340264558792114e-05, 1.459568738937378e-05, 1.5851110219955444e-05, 1.710653305053711e-05, 1.8361955881118774e-05, 1.961737871170044e-05, 2.0872801542282104e-05, 2.212822437286377e-05, 2.3383647203445435e-05, 2.46390700340271e-05, 2.5894492864608765e-05, 2.714991569519043e-05, 2.8405338525772095e-05, 2.966076135635376e-05, 3.0916184186935425e-05, 3.217160701751709e-05, 3.3427029848098755e-05, 3.468245267868042e-05, 3.5937875509262085e-05, 3.719329833984375e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 9.0, 10.0, 10.0, 19.0, 17.0, 45.0, 40.0, 73.0, 110.0, 196.0, 299.0, 573.0, 933.0, 2031.0, 4291.0, 10943.0, 32237.0, 124765.0, 556415.0, 235372.0, 52420.0, 16053.0, 6121.0, 2563.0, 1314.0, 673.0, 405.0, 217.0, 116.0, 80.0, 52.0, 39.0, 38.0, 21.0, 14.0, 9.0, 8.0, 6.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.121337890625, -0.11710929870605469, -0.11288070678710938, -0.10865211486816406, -0.10442352294921875, -0.10019493103027344, -0.09596633911132812, -0.09173774719238281, -0.0875091552734375, -0.08328056335449219, -0.07905197143554688, -0.07482337951660156, -0.07059478759765625, -0.06636619567871094, -0.062137603759765625, -0.05790901184082031, -0.053680419921875, -0.04945182800292969, -0.045223236083984375, -0.04099464416503906, -0.03676605224609375, -0.03253746032714844, -0.028308868408203125, -0.024080276489257812, -0.0198516845703125, -0.015623092651367188, -0.011394500732421875, -0.0071659088134765625, -0.00293731689453125, 0.0012912750244140625, 0.005519866943359375, 0.009748458862304688, 0.01397705078125, 0.018205642700195312, 0.022434234619140625, 0.026662826538085938, 0.03089141845703125, 0.03512001037597656, 0.039348602294921875, 0.04357719421386719, 0.0478057861328125, 0.05203437805175781, 0.056262969970703125, 0.06049156188964844, 0.06472015380859375, 0.06894874572753906, 0.07317733764648438, 0.07740592956542969, 0.081634521484375, 0.08586311340332031, 0.09009170532226562, 0.09432029724121094, 0.09854888916015625, 0.10277748107910156, 0.10700607299804688, 0.11123466491699219, 0.1154632568359375, 0.11969184875488281, 0.12392044067382812, 0.12814903259277344, 0.13237762451171875, 0.13660621643066406, 0.14083480834960938, 0.1450634002685547, 0.1492919921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 6.0, 10.0, 8.0, 7.0, 11.0, 24.0, 24.0, 34.0, 38.0, 44.0, 71.0, 83.0, 112.0, 120.0, 85.0, 61.0, 56.0, 42.0, 44.0, 29.0, 18.0, 19.0, 21.0, 7.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07562255859375, -0.07302379608154297, -0.07042503356933594, -0.0678262710571289, -0.06522750854492188, -0.06262874603271484, -0.06002998352050781, -0.05743122100830078, -0.05483245849609375, -0.05223369598388672, -0.04963493347167969, -0.047036170959472656, -0.044437408447265625, -0.041838645935058594, -0.03923988342285156, -0.03664112091064453, -0.0340423583984375, -0.03144359588623047, -0.028844833374023438, -0.026246070861816406, -0.023647308349609375, -0.021048545837402344, -0.018449783325195312, -0.01585102081298828, -0.01325225830078125, -0.010653495788574219, -0.008054733276367188, -0.005455970764160156, -0.002857208251953125, -0.00025844573974609375, 0.0023403167724609375, 0.004939079284667969, 0.007537841796875, 0.010136604309082031, 0.012735366821289062, 0.015334129333496094, 0.017932891845703125, 0.020531654357910156, 0.023130416870117188, 0.02572917938232422, 0.02832794189453125, 0.03092670440673828, 0.03352546691894531, 0.036124229431152344, 0.038722991943359375, 0.041321754455566406, 0.04392051696777344, 0.04651927947998047, 0.0491180419921875, 0.05171680450439453, 0.05431556701660156, 0.056914329528808594, 0.059513092041015625, 0.062111854553222656, 0.06471061706542969, 0.06730937957763672, 0.06990814208984375, 0.07250690460205078, 0.07510566711425781, 0.07770442962646484, 0.08030319213867188, 0.0829019546508789, 0.08550071716308594, 0.08809947967529297, 0.0906982421875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 12.0, 22.0, 36.0, 78.0, 196.0, 278.0, 192.0, 101.0, 35.0, 27.0, 7.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8401881456375122, -1.7460123300552368, -1.6518365144729614, -1.557660698890686, -1.4634848833084106, -1.3693090677261353, -1.2751331329345703, -1.180957317352295, -1.0867815017700195, -0.9926056861877441, -0.8984298706054688, -0.8042540550231934, -0.710078239440918, -0.6159024238586426, -0.5217265486717224, -0.427550733089447, -0.3333749771118164, -0.23919916152954102, -0.14502333104610443, -0.05084750056266785, 0.043328315019607544, 0.13750413060188293, 0.2316799759864807, 0.3258557915687561, 0.4200316071510315, 0.5142074227333069, 0.6083832383155823, 0.7025591135025024, 0.7967349290847778, 0.8909107446670532, 0.9850865602493286, 1.079262375831604, 1.173438310623169, 1.2676141262054443, 1.3617899417877197, 1.4559657573699951, 1.5501415729522705, 1.644317388534546, 1.7384932041168213, 1.8326690196990967, 1.926844835281372, 2.0210206508636475, 2.115196466445923, 2.2093722820281982, 2.3035480976104736, 2.397723913192749, 2.4918997287750244, 2.5860755443573, 2.6802515983581543, 2.7744274139404297, 2.868603229522705, 2.9627790451049805, 3.056954860687256, 3.1511306762695312, 3.2453064918518066, 3.339482307434082, 3.4336581230163574, 3.527833938598633, 3.622009754180908, 3.7161855697631836, 3.810361385345459, 3.9045372009277344, 3.9987130165100098, 4.092888832092285, 4.1870646476745605]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 16.0, 16.0, 18.0, 23.0, 14.0, 37.0, 22.0, 23.0, 35.0, 36.0, 43.0, 47.0, 51.0, 51.0, 47.0, 53.0, 60.0, 48.0, 53.0, 39.0, 38.0, 33.0, 32.0, 30.0, 26.0, 27.0, 12.0, 10.0, 15.0, 11.0, 6.0, 7.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1416618824005127, -2.082296848297119, -2.0229318141937256, -1.963566780090332, -1.9042017459869385, -1.844836711883545, -1.7854716777801514, -1.7261066436767578, -1.6667416095733643, -1.6073765754699707, -1.5480115413665771, -1.4886465072631836, -1.42928147315979, -1.3699164390563965, -1.310551404953003, -1.2511863708496094, -1.1918213367462158, -1.1324563026428223, -1.0730912685394287, -1.0137262344360352, -0.9543612003326416, -0.894996166229248, -0.8356311321258545, -0.7762660980224609, -0.7169011831283569, -0.6575361490249634, -0.5981711149215698, -0.5388060808181763, -0.4794410467147827, -0.42007604241371155, -0.360711008310318, -0.30134597420692444, -0.2419809103012085, -0.18261587619781494, -0.12325084954500198, -0.06388582289218903, -0.004520788788795471, 0.05484423041343689, 0.11420926451683044, 0.173574298620224, 0.23293933272361755, 0.2923043668270111, 0.35166940093040466, 0.41103440523147583, 0.4703994393348694, 0.5297644734382629, 0.5891295075416565, 0.64849454164505, 0.7078595757484436, 0.7672246098518372, 0.8265896439552307, 0.8859546780586243, 0.9453197121620178, 1.0046846866607666, 1.0640497207641602, 1.1234147548675537, 1.1827797889709473, 1.2421448230743408, 1.3015098571777344, 1.360874891281128, 1.4202399253845215, 1.479604959487915, 1.5389699935913086, 1.5983350276947021, 1.6577000617980957]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 8.0, 10.0, 28.0, 25.0, 55.0, 82.0, 155.0, 250.0, 466.0, 944.0, 1803.0, 4075.0, 11230.0, 46526.0, 418437.0, 3333933.0, 318048.0, 40709.0, 10204.0, 3697.0, 1714.0, 825.0, 424.0, 250.0, 148.0, 97.0, 59.0, 37.0, 25.0, 12.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6289443969726562, -0.6021270751953125, -0.5753097534179688, -0.548492431640625, -0.5216751098632812, -0.4948577880859375, -0.46804046630859375, -0.44122314453125, -0.41440582275390625, -0.3875885009765625, -0.36077117919921875, -0.333953857421875, -0.30713653564453125, -0.2803192138671875, -0.25350189208984375, -0.2266845703125, -0.19986724853515625, -0.1730499267578125, -0.14623260498046875, -0.119415283203125, -0.09259796142578125, -0.0657806396484375, -0.03896331787109375, -0.01214599609375, 0.01467132568359375, 0.0414886474609375, 0.06830596923828125, 0.095123291015625, 0.12194061279296875, 0.1487579345703125, 0.17557525634765625, 0.202392578125, 0.22920989990234375, 0.2560272216796875, 0.28284454345703125, 0.309661865234375, 0.33647918701171875, 0.3632965087890625, 0.39011383056640625, 0.41693115234375, 0.44374847412109375, 0.4705657958984375, 0.49738311767578125, 0.524200439453125, 0.5510177612304688, 0.5778350830078125, 0.6046524047851562, 0.6314697265625, 0.6582870483398438, 0.6851043701171875, 0.7119216918945312, 0.738739013671875, 0.7655563354492188, 0.7923736572265625, 0.8191909790039062, 0.84600830078125, 0.8728256225585938, 0.8996429443359375, 0.9264602661132812, 0.953277587890625, 0.9800949096679688, 1.0069122314453125, 1.0337295532226562, 1.060546875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 13.0, 15.0, 10.0, 14.0, 19.0, 37.0, 37.0, 57.0, 64.0, 69.0, 62.0, 97.0, 78.0, 89.0, 62.0, 58.0, 46.0, 34.0, 26.0, 16.0, 15.0, 21.0, 10.0, 9.0, 8.0, 2.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6675872802734375, -0.647186279296875, -0.6267852783203125, -0.60638427734375, -0.5859832763671875, -0.565582275390625, -0.5451812744140625, -0.5247802734375, -0.5043792724609375, -0.483978271484375, -0.4635772705078125, -0.44317626953125, -0.4227752685546875, -0.402374267578125, -0.3819732666015625, -0.361572265625, -0.3411712646484375, -0.320770263671875, -0.3003692626953125, -0.27996826171875, -0.2595672607421875, -0.239166259765625, -0.2187652587890625, -0.1983642578125, -0.1779632568359375, -0.157562255859375, -0.1371612548828125, -0.11676025390625, -0.0963592529296875, -0.075958251953125, -0.0555572509765625, -0.03515625, -0.0147552490234375, 0.005645751953125, 0.0260467529296875, 0.04644775390625, 0.0668487548828125, 0.087249755859375, 0.1076507568359375, 0.1280517578125, 0.1484527587890625, 0.168853759765625, 0.1892547607421875, 0.20965576171875, 0.2300567626953125, 0.250457763671875, 0.2708587646484375, 0.291259765625, 0.3116607666015625, 0.332061767578125, 0.3524627685546875, 0.37286376953125, 0.3932647705078125, 0.413665771484375, 0.4340667724609375, 0.4544677734375, 0.4748687744140625, 0.495269775390625, 0.5156707763671875, 0.53607177734375, 0.5564727783203125, 0.576873779296875, 0.5972747802734375, 0.61767578125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 2.0, 0.0, 7.0, 6.0, 6.0, 9.0, 15.0, 21.0, 23.0, 54.0, 60.0, 105.0, 193.0, 425.0, 927.0, 2481.0, 8566.0, 49330.0, 1263304.0, 2784622.0, 68354.0, 10685.0, 2977.0, 1100.0, 455.0, 221.0, 133.0, 68.0, 50.0, 33.0, 21.0, 10.0, 6.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72314453125, -0.6918106079101562, -0.6604766845703125, -0.6291427612304688, -0.597808837890625, -0.5664749145507812, -0.5351409912109375, -0.5038070678710938, -0.47247314453125, -0.44113922119140625, -0.4098052978515625, -0.37847137451171875, -0.347137451171875, -0.31580352783203125, -0.2844696044921875, -0.25313568115234375, -0.2218017578125, -0.19046783447265625, -0.1591339111328125, -0.12779998779296875, -0.096466064453125, -0.06513214111328125, -0.0337982177734375, -0.00246429443359375, 0.02886962890625, 0.06020355224609375, 0.0915374755859375, 0.12287139892578125, 0.154205322265625, 0.18553924560546875, 0.2168731689453125, 0.24820709228515625, 0.279541015625, 0.31087493896484375, 0.3422088623046875, 0.37354278564453125, 0.404876708984375, 0.43621063232421875, 0.4675445556640625, 0.49887847900390625, 0.53021240234375, 0.5615463256835938, 0.5928802490234375, 0.6242141723632812, 0.655548095703125, 0.6868820190429688, 0.7182159423828125, 0.7495498657226562, 0.7808837890625, 0.8122177124023438, 0.8435516357421875, 0.8748855590820312, 0.906219482421875, 0.9375534057617188, 0.9688873291015625, 1.0002212524414062, 1.03155517578125, 1.0628890991210938, 1.0942230224609375, 1.1255569458007812, 1.156890869140625, 1.1882247924804688, 1.2195587158203125, 1.2508926391601562, 1.2822265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 10.0, 5.0, 13.0, 34.0, 40.0, 60.0, 102.0, 130.0, 244.0, 481.0, 922.0, 873.0, 503.0, 234.0, 153.0, 81.0, 50.0, 34.0, 28.0, 17.0, 12.0, 12.0, 12.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259033203125, -0.2511730194091797, -0.24331283569335938, -0.23545265197753906, -0.22759246826171875, -0.21973228454589844, -0.21187210083007812, -0.2040119171142578, -0.1961517333984375, -0.1882915496826172, -0.18043136596679688, -0.17257118225097656, -0.16471099853515625, -0.15685081481933594, -0.14899063110351562, -0.1411304473876953, -0.133270263671875, -0.1254100799560547, -0.11754989624023438, -0.10968971252441406, -0.10182952880859375, -0.09396934509277344, -0.08610916137695312, -0.07824897766113281, -0.0703887939453125, -0.06252861022949219, -0.054668426513671875, -0.04680824279785156, -0.03894805908203125, -0.031087875366210938, -0.023227691650390625, -0.015367507934570312, -0.00750732421875, 0.0003528594970703125, 0.008213043212890625, 0.016073226928710938, 0.02393341064453125, 0.03179359436035156, 0.039653778076171875, 0.04751396179199219, 0.0553741455078125, 0.06323432922363281, 0.07109451293945312, 0.07895469665527344, 0.08681488037109375, 0.09467506408691406, 0.10253524780273438, 0.11039543151855469, 0.118255615234375, 0.1261157989501953, 0.13397598266601562, 0.14183616638183594, 0.14969635009765625, 0.15755653381347656, 0.16541671752929688, 0.1732769012451172, 0.1811370849609375, 0.1889972686767578, 0.19685745239257812, 0.20471763610839844, 0.21257781982421875, 0.22043800354003906, 0.22829818725585938, 0.2361583709716797, 0.2440185546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 11.0, 7.0, 31.0, 29.0, 55.0, 83.0, 126.0, 156.0, 150.0, 135.0, 72.0, 46.0, 33.0, 13.0, 13.0, 9.0, 5.0, 5.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4888819456100464, -1.4494564533233643, -1.4100308418273926, -1.3706053495407104, -1.3311798572540283, -1.2917542457580566, -1.2523287534713745, -1.2129032611846924, -1.1734776496887207, -1.1340521574020386, -1.094626545906067, -1.0552010536193848, -1.0157755613327026, -0.9763500094413757, -0.9369244575500488, -0.8974989652633667, -0.8580734729766846, -0.8186479210853577, -0.7792224287986755, -0.7397968769073486, -0.7003713846206665, -0.6609458327293396, -0.6215202808380127, -0.5820947885513306, -0.5426692366600037, -0.5032436847686768, -0.46381819248199463, -0.4243926405906677, -0.3849671185016632, -0.3455415964126587, -0.3061160445213318, -0.26669052243232727, -0.2272651195526123, -0.1878395974636078, -0.14841406047344208, -0.10898853093385696, -0.06956300139427185, -0.030137479305267334, 0.009288057684898376, 0.04871359467506409, 0.0881391167640686, 0.12756463885307312, 0.16699017584323883, 0.20641571283340454, 0.24584123492240906, 0.2852667570114136, 0.3246923089027405, 0.364117830991745, 0.4035433530807495, 0.44296887516975403, 0.48239439725875854, 0.5218199491500854, 0.5612454414367676, 0.6006709933280945, 0.6400965452194214, 0.6795220375061035, 0.7189475893974304, 0.7583731412887573, 0.7977986335754395, 0.8372241854667664, 0.8766497373580933, 0.9160752296447754, 0.9555007815361023, 0.9949263334274292, 1.0343518257141113]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 2.0, 8.0, 10.0, 12.0, 11.0, 16.0, 30.0, 25.0, 31.0, 41.0, 38.0, 54.0, 64.0, 61.0, 63.0, 74.0, 66.0, 59.0, 57.0, 42.0, 41.0, 38.0, 34.0, 28.0, 17.0, 17.0, 12.0, 7.0, 10.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6819748282432556, -0.6619782447814941, -0.6419816017150879, -0.6219850182533264, -0.6019884347915649, -0.5819917917251587, -0.5619952082633972, -0.5419986248016357, -0.5220019817352295, -0.502005398273468, -0.48200878500938416, -0.4620121717453003, -0.4420155882835388, -0.42201897501945496, -0.4020223617553711, -0.3820257782936096, -0.36202919483184814, -0.3420325815677643, -0.3220359981060028, -0.30203938484191895, -0.28204280138015747, -0.2620461881160736, -0.24204957485198975, -0.22205297648906708, -0.2020563781261444, -0.18205977976322174, -0.16206318140029907, -0.1420665681362152, -0.12206996977329254, -0.10207337141036987, -0.08207676559686661, -0.06208015978336334, -0.04208362102508545, -0.022087018936872482, -0.0020904168486595154, 0.01790618523955345, 0.03790278732776642, 0.05789938569068909, 0.07789599150419235, 0.09789259731769562, 0.11788919568061829, 0.13788579404354095, 0.15788239240646362, 0.17787900567054749, 0.19787560403347015, 0.21787220239639282, 0.23786881566047668, 0.25786542892456055, 0.277862012386322, 0.2978586256504059, 0.31785520911216736, 0.3378518223762512, 0.3578484058380127, 0.37784501910209656, 0.3978416323661804, 0.4178382158279419, 0.43783482909202576, 0.4578314423561096, 0.4778280258178711, 0.49782463908195496, 0.5178212523460388, 0.5378178358078003, 0.5578144192695618, 0.577811062335968, 0.5978076457977295]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 11.0, 10.0, 16.0, 27.0, 62.0, 79.0, 131.0, 172.0, 318.0, 499.0, 871.0, 1604.0, 3170.0, 6411.0, 15378.0, 39835.0, 125077.0, 369207.0, 324075.0, 102771.0, 33806.0, 13221.0, 5653.0, 2627.0, 1463.0, 832.0, 497.0, 265.0, 139.0, 94.0, 67.0, 51.0, 26.0, 16.0, 18.0, 11.0, 12.0, 8.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1009521484375, -0.0979757308959961, -0.09499931335449219, -0.09202289581298828, -0.08904647827148438, -0.08607006072998047, -0.08309364318847656, -0.08011722564697266, -0.07714080810546875, -0.07416439056396484, -0.07118797302246094, -0.06821155548095703, -0.06523513793945312, -0.06225872039794922, -0.05928230285644531, -0.056305885314941406, -0.0533294677734375, -0.050353050231933594, -0.04737663269042969, -0.04440021514892578, -0.041423797607421875, -0.03844738006591797, -0.03547096252441406, -0.032494544982910156, -0.02951812744140625, -0.026541709899902344, -0.023565292358398438, -0.02058887481689453, -0.017612457275390625, -0.014636039733886719, -0.011659622192382812, -0.008683204650878906, -0.005706787109375, -0.0027303695678710938, 0.0002460479736328125, 0.0032224655151367188, 0.006198883056640625, 0.009175300598144531, 0.012151718139648438, 0.015128135681152344, 0.01810455322265625, 0.021080970764160156, 0.024057388305664062, 0.02703380584716797, 0.030010223388671875, 0.03298664093017578, 0.03596305847167969, 0.038939476013183594, 0.0419158935546875, 0.044892311096191406, 0.04786872863769531, 0.05084514617919922, 0.053821563720703125, 0.05679798126220703, 0.05977439880371094, 0.06275081634521484, 0.06572723388671875, 0.06870365142822266, 0.07168006896972656, 0.07465648651123047, 0.07763290405273438, 0.08060932159423828, 0.08358573913574219, 0.0865621566772461, 0.08953857421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 6.0, 9.0, 11.0, 10.0, 12.0, 11.0, 30.0, 40.0, 39.0, 53.0, 63.0, 84.0, 89.0, 78.0, 78.0, 77.0, 77.0, 52.0, 52.0, 29.0, 32.0, 20.0, 13.0, 10.0, 5.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6181640625, -0.6002120971679688, -0.5822601318359375, -0.5643081665039062, -0.546356201171875, -0.5284042358398438, -0.5104522705078125, -0.49250030517578125, -0.47454833984375, -0.45659637451171875, -0.4386444091796875, -0.42069244384765625, -0.402740478515625, -0.38478851318359375, -0.3668365478515625, -0.34888458251953125, -0.3309326171875, -0.31298065185546875, -0.2950286865234375, -0.27707672119140625, -0.259124755859375, -0.24117279052734375, -0.2232208251953125, -0.20526885986328125, -0.18731689453125, -0.16936492919921875, -0.1514129638671875, -0.13346099853515625, -0.115509033203125, -0.09755706787109375, -0.0796051025390625, -0.06165313720703125, -0.043701171875, -0.02574920654296875, -0.0077972412109375, 0.01015472412109375, 0.028106689453125, 0.04605865478515625, 0.0640106201171875, 0.08196258544921875, 0.09991455078125, 0.11786651611328125, 0.1358184814453125, 0.15377044677734375, 0.171722412109375, 0.18967437744140625, 0.2076263427734375, 0.22557830810546875, 0.2435302734375, 0.26148223876953125, 0.2794342041015625, 0.29738616943359375, 0.315338134765625, 0.33329010009765625, 0.3512420654296875, 0.36919403076171875, 0.38714599609375, 0.40509796142578125, 0.4230499267578125, 0.44100189208984375, 0.458953857421875, 0.47690582275390625, 0.4948577880859375, 0.5128097534179688, 0.53076171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 5.0, 7.0, 10.0, 3.0, 16.0, 9.0, 10.0, 14.0, 30.0, 40.0, 43.0, 67.0, 71.0, 120.0, 187.0, 239.0, 423.0, 741.0, 1355.0, 2850.0, 7076.0, 20028.0, 70396.0, 284454.0, 450341.0, 151772.0, 37681.0, 11554.0, 4429.0, 1956.0, 1001.0, 514.0, 360.0, 229.0, 135.0, 107.0, 61.0, 38.0, 33.0, 26.0, 18.0, 15.0, 15.0, 12.0, 13.0, 6.0, 11.0, 9.0, 4.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.088623046875, -0.08587646484375, -0.0831298828125, -0.08038330078125, -0.07763671875, -0.07489013671875, -0.0721435546875, -0.06939697265625, -0.066650390625, -0.06390380859375, -0.0611572265625, -0.05841064453125, -0.0556640625, -0.05291748046875, -0.0501708984375, -0.04742431640625, -0.044677734375, -0.04193115234375, -0.0391845703125, -0.03643798828125, -0.03369140625, -0.03094482421875, -0.0281982421875, -0.02545166015625, -0.022705078125, -0.01995849609375, -0.0172119140625, -0.01446533203125, -0.01171875, -0.00897216796875, -0.0062255859375, -0.00347900390625, -0.000732421875, 0.00201416015625, 0.0047607421875, 0.00750732421875, 0.01025390625, 0.01300048828125, 0.0157470703125, 0.01849365234375, 0.021240234375, 0.02398681640625, 0.0267333984375, 0.02947998046875, 0.0322265625, 0.03497314453125, 0.0377197265625, 0.04046630859375, 0.043212890625, 0.04595947265625, 0.0487060546875, 0.05145263671875, 0.05419921875, 0.05694580078125, 0.0596923828125, 0.06243896484375, 0.065185546875, 0.06793212890625, 0.0706787109375, 0.07342529296875, 0.076171875, 0.07891845703125, 0.0816650390625, 0.08441162109375, 0.087158203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 2.0, 6.0, 9.0, 7.0, 5.0, 10.0, 12.0, 4.0, 10.0, 21.0, 23.0, 29.0, 27.0, 22.0, 32.0, 35.0, 31.0, 43.0, 35.0, 45.0, 43.0, 53.0, 58.0, 42.0, 35.0, 36.0, 40.0, 30.0, 34.0, 33.0, 29.0, 25.0, 25.0, 13.0, 23.0, 11.0, 10.0, 17.0, 8.0, 7.0, 3.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.71240234375, -0.6925582885742188, -0.6727142333984375, -0.6528701782226562, -0.633026123046875, -0.6131820678710938, -0.5933380126953125, -0.5734939575195312, -0.55364990234375, -0.5338058471679688, -0.5139617919921875, -0.49411773681640625, -0.474273681640625, -0.45442962646484375, -0.4345855712890625, -0.41474151611328125, -0.3948974609375, -0.37505340576171875, -0.3552093505859375, -0.33536529541015625, -0.315521240234375, -0.29567718505859375, -0.2758331298828125, -0.25598907470703125, -0.23614501953125, -0.21630096435546875, -0.1964569091796875, -0.17661285400390625, -0.156768798828125, -0.13692474365234375, -0.1170806884765625, -0.09723663330078125, -0.077392578125, -0.05754852294921875, -0.0377044677734375, -0.01786041259765625, 0.001983642578125, 0.02182769775390625, 0.0416717529296875, 0.06151580810546875, 0.08135986328125, 0.10120391845703125, 0.1210479736328125, 0.14089202880859375, 0.160736083984375, 0.18058013916015625, 0.2004241943359375, 0.22026824951171875, 0.2401123046875, 0.25995635986328125, 0.2798004150390625, 0.29964447021484375, 0.319488525390625, 0.33933258056640625, 0.3591766357421875, 0.37902069091796875, 0.39886474609375, 0.41870880126953125, 0.4385528564453125, 0.45839691162109375, 0.478240966796875, 0.49808502197265625, 0.5179290771484375, 0.5377731323242188, 0.5576171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 9.0, 15.0, 14.0, 31.0, 46.0, 57.0, 99.0, 156.0, 218.0, 367.0, 628.0, 1294.0, 2753.0, 6882.0, 23394.0, 118454.0, 599176.0, 238740.0, 38731.0, 10176.0, 3768.0, 1578.0, 814.0, 401.0, 254.0, 156.0, 100.0, 61.0, 51.0, 25.0, 20.0, 26.0, 7.0, 9.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044219970703125, -0.04277849197387695, -0.041337013244628906, -0.03989553451538086, -0.03845405578613281, -0.037012577056884766, -0.03557109832763672, -0.03412961959838867, -0.032688140869140625, -0.031246662139892578, -0.02980518341064453, -0.028363704681396484, -0.026922225952148438, -0.02548074722290039, -0.024039268493652344, -0.022597789764404297, -0.02115631103515625, -0.019714832305908203, -0.018273353576660156, -0.01683187484741211, -0.015390396118164062, -0.013948917388916016, -0.012507438659667969, -0.011065959930419922, -0.009624481201171875, -0.008183002471923828, -0.006741523742675781, -0.005300045013427734, -0.0038585662841796875, -0.0024170875549316406, -0.0009756088256835938, 0.0004658699035644531, 0.0019073486328125, 0.003348827362060547, 0.004790306091308594, 0.006231784820556641, 0.0076732635498046875, 0.009114742279052734, 0.010556221008300781, 0.011997699737548828, 0.013439178466796875, 0.014880657196044922, 0.01632213592529297, 0.017763614654541016, 0.019205093383789062, 0.02064657211303711, 0.022088050842285156, 0.023529529571533203, 0.02497100830078125, 0.026412487030029297, 0.027853965759277344, 0.02929544448852539, 0.030736923217773438, 0.032178401947021484, 0.03361988067626953, 0.03506135940551758, 0.036502838134765625, 0.03794431686401367, 0.03938579559326172, 0.040827274322509766, 0.04226875305175781, 0.04371023178100586, 0.045151710510253906, 0.04659318923950195, 0.04803466796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 4.0, 20.0, 21.0, 48.0, 50.0, 75.0, 81.0, 115.0, 104.0, 106.0, 96.0, 82.0, 49.0, 50.0, 34.0, 16.0, 10.0, 11.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6404857635498047e-05, -2.557411789894104e-05, -2.4743378162384033e-05, -2.3912638425827026e-05, -2.308189868927002e-05, -2.2251158952713013e-05, -2.1420419216156006e-05, -2.0589679479599e-05, -1.9758939743041992e-05, -1.8928200006484985e-05, -1.809746026992798e-05, -1.726672053337097e-05, -1.6435980796813965e-05, -1.5605241060256958e-05, -1.4774501323699951e-05, -1.3943761587142944e-05, -1.3113021850585938e-05, -1.228228211402893e-05, -1.1451542377471924e-05, -1.0620802640914917e-05, -9.79006290435791e-06, -8.959323167800903e-06, -8.128583431243896e-06, -7.29784369468689e-06, -6.467103958129883e-06, -5.636364221572876e-06, -4.805624485015869e-06, -3.974884748458862e-06, -3.1441450119018555e-06, -2.3134052753448486e-06, -1.4826655387878418e-06, -6.51925802230835e-07, 1.7881393432617188e-07, 1.0095536708831787e-06, 1.8402934074401855e-06, 2.6710331439971924e-06, 3.5017728805541992e-06, 4.332512617111206e-06, 5.163252353668213e-06, 5.99399209022522e-06, 6.8247318267822266e-06, 7.655471563339233e-06, 8.48621129989624e-06, 9.316951036453247e-06, 1.0147690773010254e-05, 1.097843050956726e-05, 1.1809170246124268e-05, 1.2639909982681274e-05, 1.3470649719238281e-05, 1.4301389455795288e-05, 1.5132129192352295e-05, 1.5962868928909302e-05, 1.679360866546631e-05, 1.7624348402023315e-05, 1.8455088138580322e-05, 1.928582787513733e-05, 2.0116567611694336e-05, 2.0947307348251343e-05, 2.177804708480835e-05, 2.2608786821365356e-05, 2.3439526557922363e-05, 2.427026629447937e-05, 2.5101006031036377e-05, 2.5931745767593384e-05, 2.676248550415039e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 7.0, 3.0, 5.0, 7.0, 16.0, 19.0, 24.0, 37.0, 54.0, 89.0, 110.0, 198.0, 371.0, 748.0, 1432.0, 3269.0, 8653.0, 26381.0, 97631.0, 372681.0, 388951.0, 103929.0, 27993.0, 9305.0, 3429.0, 1508.0, 695.0, 395.0, 208.0, 133.0, 96.0, 54.0, 32.0, 35.0, 20.0, 8.0, 5.0, 8.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.04296875, -0.041808128356933594, -0.04064750671386719, -0.03948688507080078, -0.038326263427734375, -0.03716564178466797, -0.03600502014160156, -0.034844398498535156, -0.03368377685546875, -0.032523155212402344, -0.03136253356933594, -0.03020191192626953, -0.029041290283203125, -0.02788066864013672, -0.026720046997070312, -0.025559425354003906, -0.0243988037109375, -0.023238182067871094, -0.022077560424804688, -0.02091693878173828, -0.019756317138671875, -0.01859569549560547, -0.017435073852539062, -0.016274452209472656, -0.01511383056640625, -0.013953208923339844, -0.012792587280273438, -0.011631965637207031, -0.010471343994140625, -0.009310722351074219, -0.008150100708007812, -0.006989479064941406, -0.005828857421875, -0.004668235778808594, -0.0035076141357421875, -0.0023469924926757812, -0.001186370849609375, -2.574920654296875e-05, 0.0011348724365234375, 0.0022954940795898438, 0.00345611572265625, 0.004616737365722656, 0.0057773590087890625, 0.006937980651855469, 0.008098602294921875, 0.009259223937988281, 0.010419845581054688, 0.011580467224121094, 0.0127410888671875, 0.013901710510253906, 0.015062332153320312, 0.01622295379638672, 0.017383575439453125, 0.01854419708251953, 0.019704818725585938, 0.020865440368652344, 0.02202606201171875, 0.023186683654785156, 0.024347305297851562, 0.02550792694091797, 0.026668548583984375, 0.02782917022705078, 0.028989791870117188, 0.030150413513183594, 0.03131103515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 7.0, 8.0, 7.0, 10.0, 12.0, 17.0, 27.0, 23.0, 40.0, 45.0, 63.0, 70.0, 83.0, 87.0, 86.0, 99.0, 62.0, 51.0, 50.0, 35.0, 25.0, 28.0, 12.0, 14.0, 9.0, 9.0, 10.0, 2.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00753021240234375, -0.007199764251708984, -0.006869316101074219, -0.006538867950439453, -0.0062084197998046875, -0.005877971649169922, -0.005547523498535156, -0.005217075347900391, -0.004886627197265625, -0.004556179046630859, -0.004225730895996094, -0.003895282745361328, -0.0035648345947265625, -0.003234386444091797, -0.0029039382934570312, -0.0025734901428222656, -0.0022430419921875, -0.0019125938415527344, -0.0015821456909179688, -0.0012516975402832031, -0.0009212493896484375, -0.0005908012390136719, -0.00026035308837890625, 7.009506225585938e-05, 0.000400543212890625, 0.0007309913635253906, 0.0010614395141601562, 0.0013918876647949219, 0.0017223358154296875, 0.002052783966064453, 0.0023832321166992188, 0.0027136802673339844, 0.00304412841796875, 0.0033745765686035156, 0.0037050247192382812, 0.004035472869873047, 0.0043659210205078125, 0.004696369171142578, 0.005026817321777344, 0.005357265472412109, 0.005687713623046875, 0.006018161773681641, 0.006348609924316406, 0.006679058074951172, 0.0070095062255859375, 0.007339954376220703, 0.007670402526855469, 0.008000850677490234, 0.008331298828125, 0.008661746978759766, 0.008992195129394531, 0.009322643280029297, 0.009653091430664062, 0.009983539581298828, 0.010313987731933594, 0.01064443588256836, 0.010974884033203125, 0.01130533218383789, 0.011635780334472656, 0.011966228485107422, 0.012296676635742188, 0.012627124786376953, 0.012957572937011719, 0.013288021087646484, 0.01361846923828125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 7.0, 15.0, 23.0, 41.0, 73.0, 133.0, 202.0, 218.0, 129.0, 56.0, 42.0, 21.0, 14.0, 5.0, 8.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3471403121948242, -1.3125070333480835, -1.2778738737106323, -1.2432405948638916, -1.2086074352264404, -1.1739741563796997, -1.139340877532959, -1.1047077178955078, -1.070074439048767, -1.0354411602020264, -1.0008080005645752, -0.9661747217178345, -0.9315415024757385, -0.8969082832336426, -0.8622750639915466, -0.8276418447494507, -0.7930086255073547, -0.7583754062652588, -0.7237421870231628, -0.6891089677810669, -0.6544756889343262, -0.6198424696922302, -0.5852092504501343, -0.5505760312080383, -0.5159428119659424, -0.48130959272384644, -0.4466763436794281, -0.41204312443733215, -0.3774098753929138, -0.34277665615081787, -0.3081434369087219, -0.273510217666626, -0.23887693881988525, -0.2042437046766281, -0.16961047053337097, -0.13497725129127502, -0.10034401714801788, -0.06571078300476074, -0.031077563762664795, 0.003555670380592346, 0.03818890452384949, 0.07282213866710663, 0.10745536535978317, 0.14208859205245972, 0.17672182619571686, 0.211355060338974, 0.24598827958106995, 0.2806215286254883, 0.31525474786758423, 0.3498879671096802, 0.3845212161540985, 0.41915443539619446, 0.4537876844406128, 0.48842090368270874, 0.5230541229248047, 0.5576873421669006, 0.5923205614089966, 0.6269537806510925, 0.6615869998931885, 0.6962202787399292, 0.7308534979820251, 0.7654867172241211, 0.800119936466217, 0.834753155708313, 0.8693864345550537]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 0.0, 5.0, 3.0, 4.0, 4.0, 4.0, 15.0, 9.0, 16.0, 13.0, 35.0, 27.0, 33.0, 40.0, 57.0, 67.0, 70.0, 72.0, 72.0, 80.0, 59.0, 66.0, 39.0, 46.0, 41.0, 31.0, 18.0, 19.0, 10.0, 11.0, 11.0, 5.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5037251710891724, -0.48898470401763916, -0.47424423694610596, -0.45950376987457275, -0.44476330280303955, -0.43002283573150635, -0.41528236865997314, -0.40054190158843994, -0.38580143451690674, -0.37106096744537354, -0.35632050037384033, -0.34158003330230713, -0.3268395662307739, -0.3120990991592407, -0.2973586320877075, -0.2826181650161743, -0.2678777277469635, -0.2531372606754303, -0.2383967936038971, -0.2236563265323639, -0.2089158594608307, -0.19417539238929749, -0.17943494021892548, -0.16469447314739227, -0.14995400607585907, -0.13521353900432587, -0.12047307193279266, -0.10573261231184006, -0.09099214524030685, -0.07625167816877365, -0.061511218547821045, -0.04677075147628784, -0.032030314207077026, -0.017289848998188972, -0.0025493837893009186, 0.012191079556941986, 0.02693154662847519, 0.04167201370000839, 0.056412473320961, 0.0711529403924942, 0.0858934074640274, 0.10063387453556061, 0.11537434160709381, 0.13011479377746582, 0.14485526084899902, 0.15959572792053223, 0.17433619499206543, 0.18907666206359863, 0.20381712913513184, 0.21855759620666504, 0.23329806327819824, 0.24803853034973145, 0.26277899742126465, 0.27751946449279785, 0.29225993156433105, 0.30700039863586426, 0.32174086570739746, 0.33648133277893066, 0.35122179985046387, 0.36596226692199707, 0.3807027339935303, 0.3954432010650635, 0.4101836681365967, 0.4249241352081299, 0.4396645724773407]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 9.0, 11.0, 22.0, 17.0, 33.0, 54.0, 58.0, 100.0, 139.0, 236.0, 394.0, 615.0, 1141.0, 2125.0, 4639.0, 11531.0, 43122.0, 463978.0, 456573.0, 42600.0, 11532.0, 4487.0, 2192.0, 1135.0, 671.0, 421.0, 245.0, 157.0, 119.0, 63.0, 32.0, 31.0, 21.0, 13.0, 15.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.5859375, -0.5687026977539062, -0.5514678955078125, -0.5342330932617188, -0.516998291015625, -0.49976348876953125, -0.4825286865234375, -0.46529388427734375, -0.44805908203125, -0.43082427978515625, -0.4135894775390625, -0.39635467529296875, -0.379119873046875, -0.36188507080078125, -0.3446502685546875, -0.32741546630859375, -0.3101806640625, -0.29294586181640625, -0.2757110595703125, -0.25847625732421875, -0.241241455078125, -0.22400665283203125, -0.2067718505859375, -0.18953704833984375, -0.17230224609375, -0.15506744384765625, -0.1378326416015625, -0.12059783935546875, -0.103363037109375, -0.08612823486328125, -0.0688934326171875, -0.05165863037109375, -0.034423828125, -0.01718902587890625, 4.57763671875e-05, 0.01728057861328125, 0.034515380859375, 0.05175018310546875, 0.0689849853515625, 0.08621978759765625, 0.10345458984375, 0.12068939208984375, 0.1379241943359375, 0.15515899658203125, 0.172393798828125, 0.18962860107421875, 0.2068634033203125, 0.22409820556640625, 0.2413330078125, 0.25856781005859375, 0.2758026123046875, 0.29303741455078125, 0.310272216796875, 0.32750701904296875, 0.3447418212890625, 0.36197662353515625, 0.37921142578125, 0.39644622802734375, 0.4136810302734375, 0.43091583251953125, 0.448150634765625, 0.46538543701171875, 0.4826202392578125, 0.49985504150390625, 0.51708984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 5.0, 9.0, 19.0, 15.0, 30.0, 16.0, 26.0, 25.0, 50.0, 56.0, 74.0, 77.0, 81.0, 80.0, 77.0, 70.0, 64.0, 45.0, 39.0, 33.0, 26.0, 14.0, 16.0, 8.0, 7.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.2021484375, -1.168548583984375, -1.13494873046875, -1.101348876953125, -1.0677490234375, -1.034149169921875, -1.00054931640625, -0.966949462890625, -0.933349609375, -0.899749755859375, -0.86614990234375, -0.832550048828125, -0.7989501953125, -0.765350341796875, -0.73175048828125, -0.698150634765625, -0.66455078125, -0.630950927734375, -0.59735107421875, -0.563751220703125, -0.5301513671875, -0.496551513671875, -0.46295166015625, -0.429351806640625, -0.395751953125, -0.362152099609375, -0.32855224609375, -0.294952392578125, -0.2613525390625, -0.227752685546875, -0.19415283203125, -0.160552978515625, -0.126953125, -0.093353271484375, -0.05975341796875, -0.026153564453125, 0.0074462890625, 0.041046142578125, 0.07464599609375, 0.108245849609375, 0.141845703125, 0.175445556640625, 0.20904541015625, 0.242645263671875, 0.2762451171875, 0.309844970703125, 0.34344482421875, 0.377044677734375, 0.41064453125, 0.444244384765625, 0.47784423828125, 0.511444091796875, 0.5450439453125, 0.578643798828125, 0.61224365234375, 0.645843505859375, 0.679443359375, 0.713043212890625, 0.74664306640625, 0.780242919921875, 0.8138427734375, 0.847442626953125, 0.88104248046875, 0.914642333984375, 0.9482421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 4.0, 9.0, 27.0, 28.0, 41.0, 39.0, 90.0, 94.0, 190.0, 330.0, 509.0, 1006.0, 1979.0, 4515.0, 12906.0, 67973.0, 761098.0, 164654.0, 21171.0, 6438.0, 2517.0, 1204.0, 623.0, 390.0, 244.0, 171.0, 91.0, 65.0, 37.0, 35.0, 20.0, 11.0, 9.0, 5.0, 5.0, 1.0, 2.0, 6.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.515625, -0.5003128051757812, -0.4850006103515625, -0.46968841552734375, -0.454376220703125, -0.43906402587890625, -0.4237518310546875, -0.40843963623046875, -0.39312744140625, -0.37781524658203125, -0.3625030517578125, -0.34719085693359375, -0.331878662109375, -0.31656646728515625, -0.3012542724609375, -0.28594207763671875, -0.2706298828125, -0.25531768798828125, -0.2400054931640625, -0.22469329833984375, -0.209381103515625, -0.19406890869140625, -0.1787567138671875, -0.16344451904296875, -0.14813232421875, -0.13282012939453125, -0.1175079345703125, -0.10219573974609375, -0.086883544921875, -0.07157135009765625, -0.0562591552734375, -0.04094696044921875, -0.025634765625, -0.01032257080078125, 0.0049896240234375, 0.02030181884765625, 0.035614013671875, 0.05092620849609375, 0.0662384033203125, 0.08155059814453125, 0.09686279296875, 0.11217498779296875, 0.1274871826171875, 0.14279937744140625, 0.158111572265625, 0.17342376708984375, 0.1887359619140625, 0.20404815673828125, 0.2193603515625, 0.23467254638671875, 0.2499847412109375, 0.26529693603515625, 0.280609130859375, 0.29592132568359375, 0.3112335205078125, 0.32654571533203125, 0.34185791015625, 0.35717010498046875, 0.3724822998046875, 0.38779449462890625, 0.403106689453125, 0.41841888427734375, 0.4337310791015625, 0.44904327392578125, 0.46435546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 7.0, 5.0, 2.0, 3.0, 11.0, 7.0, 18.0, 13.0, 11.0, 17.0, 32.0, 30.0, 32.0, 39.0, 45.0, 35.0, 46.0, 54.0, 48.0, 71.0, 43.0, 53.0, 30.0, 46.0, 47.0, 49.0, 32.0, 42.0, 26.0, 22.0, 15.0, 11.0, 9.0, 21.0, 14.0, 6.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1328125, -1.10101318359375, -1.0692138671875, -1.03741455078125, -1.005615234375, -0.97381591796875, -0.9420166015625, -0.91021728515625, -0.87841796875, -0.84661865234375, -0.8148193359375, -0.78302001953125, -0.751220703125, -0.71942138671875, -0.6876220703125, -0.65582275390625, -0.6240234375, -0.59222412109375, -0.5604248046875, -0.52862548828125, -0.496826171875, -0.46502685546875, -0.4332275390625, -0.40142822265625, -0.36962890625, -0.33782958984375, -0.3060302734375, -0.27423095703125, -0.242431640625, -0.21063232421875, -0.1788330078125, -0.14703369140625, -0.115234375, -0.08343505859375, -0.0516357421875, -0.01983642578125, 0.011962890625, 0.04376220703125, 0.0755615234375, 0.10736083984375, 0.13916015625, 0.17095947265625, 0.2027587890625, 0.23455810546875, 0.266357421875, 0.29815673828125, 0.3299560546875, 0.36175537109375, 0.3935546875, 0.42535400390625, 0.4571533203125, 0.48895263671875, 0.520751953125, 0.55255126953125, 0.5843505859375, 0.61614990234375, 0.64794921875, 0.67974853515625, 0.7115478515625, 0.74334716796875, 0.775146484375, 0.80694580078125, 0.8387451171875, 0.87054443359375, 0.90234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 8.0, 10.0, 2.0, 12.0, 13.0, 24.0, 42.0, 84.0, 110.0, 239.0, 489.0, 1160.0, 3376.0, 15690.0, 150773.0, 803528.0, 60459.0, 8637.0, 2275.0, 796.0, 400.0, 170.0, 120.0, 62.0, 27.0, 14.0, 16.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.192138671875, -0.18558692932128906, -0.17903518676757812, -0.1724834442138672, -0.16593170166015625, -0.1593799591064453, -0.15282821655273438, -0.14627647399902344, -0.1397247314453125, -0.13317298889160156, -0.12662124633789062, -0.12006950378417969, -0.11351776123046875, -0.10696601867675781, -0.10041427612304688, -0.09386253356933594, -0.087310791015625, -0.08075904846191406, -0.07420730590820312, -0.06765556335449219, -0.06110382080078125, -0.05455207824707031, -0.048000335693359375, -0.04144859313964844, -0.0348968505859375, -0.028345108032226562, -0.021793365478515625, -0.015241622924804688, -0.00868988037109375, -0.0021381378173828125, 0.004413604736328125, 0.010965347290039062, 0.01751708984375, 0.024068832397460938, 0.030620574951171875, 0.03717231750488281, 0.04372406005859375, 0.05027580261230469, 0.056827545166015625, 0.06337928771972656, 0.0699310302734375, 0.07648277282714844, 0.08303451538085938, 0.08958625793457031, 0.09613800048828125, 0.10268974304199219, 0.10924148559570312, 0.11579322814941406, 0.122344970703125, 0.12889671325683594, 0.13544845581054688, 0.1420001983642578, 0.14855194091796875, 0.1551036834716797, 0.16165542602539062, 0.16820716857910156, 0.1747589111328125, 0.18131065368652344, 0.18786239624023438, 0.1944141387939453, 0.20096588134765625, 0.2075176239013672, 0.21406936645507812, 0.22062110900878906, 0.2271728515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 4.0, 13.0, 14.0, 8.0, 16.0, 29.0, 40.0, 58.0, 88.0, 126.0, 215.0, 122.0, 96.0, 50.0, 27.0, 24.0, 22.0, 20.0, 6.0, 7.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.165006637573242e-05, -3.082677721977234e-05, -3.0003488063812256e-05, -2.9180198907852173e-05, -2.835690975189209e-05, -2.7533620595932007e-05, -2.6710331439971924e-05, -2.588704228401184e-05, -2.5063753128051758e-05, -2.4240463972091675e-05, -2.3417174816131592e-05, -2.259388566017151e-05, -2.1770596504211426e-05, -2.0947307348251343e-05, -2.012401819229126e-05, -1.9300729036331177e-05, -1.8477439880371094e-05, -1.765415072441101e-05, -1.6830861568450928e-05, -1.6007572412490845e-05, -1.5184283256530762e-05, -1.4360994100570679e-05, -1.3537704944610596e-05, -1.2714415788650513e-05, -1.189112663269043e-05, -1.1067837476730347e-05, -1.0244548320770264e-05, -9.42125916481018e-06, -8.597970008850098e-06, -7.774680852890015e-06, -6.951391696929932e-06, -6.128102540969849e-06, -5.304813385009766e-06, -4.481524229049683e-06, -3.6582350730895996e-06, -2.8349459171295166e-06, -2.0116567611694336e-06, -1.1883676052093506e-06, -3.650784492492676e-07, 4.5821070671081543e-07, 1.2814998626708984e-06, 2.1047890186309814e-06, 2.9280781745910645e-06, 3.7513673305511475e-06, 4.5746564865112305e-06, 5.3979456424713135e-06, 6.2212347984313965e-06, 7.0445239543914795e-06, 7.867813110351562e-06, 8.691102266311646e-06, 9.514391422271729e-06, 1.0337680578231812e-05, 1.1160969734191895e-05, 1.1984258890151978e-05, 1.280754804611206e-05, 1.3630837202072144e-05, 1.4454126358032227e-05, 1.527741551399231e-05, 1.6100704669952393e-05, 1.6923993825912476e-05, 1.774728298187256e-05, 1.857057213783264e-05, 1.9393861293792725e-05, 2.0217150449752808e-05, 2.104043960571289e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 7.0, 11.0, 22.0, 17.0, 38.0, 53.0, 71.0, 127.0, 229.0, 334.0, 572.0, 1160.0, 2622.0, 6130.0, 17579.0, 65156.0, 461409.0, 402836.0, 61971.0, 17118.0, 6008.0, 2496.0, 1136.0, 550.0, 306.0, 196.0, 146.0, 77.0, 45.0, 30.0, 26.0, 12.0, 21.0, 8.0, 11.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1439208984375, -0.13980674743652344, -0.13569259643554688, -0.1315784454345703, -0.12746429443359375, -0.12335014343261719, -0.11923599243164062, -0.11512184143066406, -0.1110076904296875, -0.10689353942871094, -0.10277938842773438, -0.09866523742675781, -0.09455108642578125, -0.09043693542480469, -0.08632278442382812, -0.08220863342285156, -0.078094482421875, -0.07398033142089844, -0.06986618041992188, -0.06575202941894531, -0.06163787841796875, -0.05752372741699219, -0.053409576416015625, -0.04929542541503906, -0.0451812744140625, -0.04106712341308594, -0.036952972412109375, -0.03283882141113281, -0.02872467041015625, -0.024610519409179688, -0.020496368408203125, -0.016382217407226562, -0.01226806640625, -0.008153915405273438, -0.004039764404296875, 7.43865966796875e-05, 0.00418853759765625, 0.008302688598632812, 0.012416839599609375, 0.016530990600585938, 0.0206451416015625, 0.024759292602539062, 0.028873443603515625, 0.03298759460449219, 0.03710174560546875, 0.04121589660644531, 0.045330047607421875, 0.04944419860839844, 0.053558349609375, 0.05767250061035156, 0.061786651611328125, 0.06590080261230469, 0.07001495361328125, 0.07412910461425781, 0.07824325561523438, 0.08235740661621094, 0.0864715576171875, 0.09058570861816406, 0.09469985961914062, 0.09881401062011719, 0.10292816162109375, 0.10704231262207031, 0.11115646362304688, 0.11527061462402344, 0.119384765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 8.0, 3.0, 7.0, 9.0, 11.0, 16.0, 10.0, 14.0, 18.0, 25.0, 27.0, 35.0, 48.0, 76.0, 139.0, 196.0, 94.0, 76.0, 35.0, 35.0, 19.0, 25.0, 20.0, 10.0, 8.0, 11.0, 6.0, 4.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05780029296875, -0.055675506591796875, -0.05355072021484375, -0.051425933837890625, -0.0493011474609375, -0.047176361083984375, -0.04505157470703125, -0.042926788330078125, -0.040802001953125, -0.038677215576171875, -0.03655242919921875, -0.034427642822265625, -0.0323028564453125, -0.030178070068359375, -0.02805328369140625, -0.025928497314453125, -0.0238037109375, -0.021678924560546875, -0.01955413818359375, -0.017429351806640625, -0.0153045654296875, -0.013179779052734375, -0.01105499267578125, -0.008930206298828125, -0.006805419921875, -0.004680633544921875, -0.00255584716796875, -0.000431060791015625, 0.0016937255859375, 0.003818511962890625, 0.00594329833984375, 0.008068084716796875, 0.01019287109375, 0.012317657470703125, 0.01444244384765625, 0.016567230224609375, 0.0186920166015625, 0.020816802978515625, 0.02294158935546875, 0.025066375732421875, 0.027191162109375, 0.029315948486328125, 0.03144073486328125, 0.033565521240234375, 0.0356903076171875, 0.037815093994140625, 0.03993988037109375, 0.042064666748046875, 0.044189453125, 0.046314239501953125, 0.04843902587890625, 0.050563812255859375, 0.0526885986328125, 0.054813385009765625, 0.05693817138671875, 0.059062957763671875, 0.061187744140625, 0.06331253051757812, 0.06543731689453125, 0.06756210327148438, 0.0696868896484375, 0.07181167602539062, 0.07393646240234375, 0.07606124877929688, 0.07818603515625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 6.0, 11.0, 41.0, 72.0, 234.0, 335.0, 184.0, 55.0, 27.0, 22.0, 9.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8225148916244507, -1.7111507654190063, -1.599786639213562, -1.4884226322174072, -1.377058506011963, -1.2656943798065186, -1.1543302536010742, -1.0429661273956299, -0.9316020011901855, -0.8202378749847412, -0.7088737487792969, -0.5975096821784973, -0.486145555973053, -0.37478142976760864, -0.2634173631668091, -0.15205323696136475, -0.04068911075592041, 0.07067500054836273, 0.18203911185264587, 0.2934032082557678, 0.40476733446121216, 0.5161314606666565, 0.627495527267456, 0.7388596534729004, 0.8502237796783447, 0.9615879058837891, 1.0729520320892334, 1.1843161582946777, 1.295680284500122, 1.4070444107055664, 1.5184084177017212, 1.6297725439071655, 1.7411365509033203, 1.8525006771087646, 1.963864803314209, 2.0752289295196533, 2.1865930557250977, 2.297957181930542, 2.4093213081359863, 2.5206851959228516, 2.632049560546875, 2.7434136867523193, 2.8547778129577637, 2.966141939163208, 3.0775060653686523, 3.1888701915740967, 3.300234317779541, 3.4115982055664062, 3.5229623317718506, 3.634326457977295, 3.7456905841827393, 3.8570547103881836, 3.968418836593628, 4.079782962799072, 4.1911468505859375, 4.302511215209961, 4.413875102996826, 4.525238990783691, 4.636603355407715, 4.74796724319458, 4.8593316078186035, 4.970695495605469, 5.082059860229492, 5.193423748016357, 5.304788112640381]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 10.0, 10.0, 1.0, 9.0, 20.0, 17.0, 8.0, 24.0, 19.0, 29.0, 37.0, 30.0, 36.0, 29.0, 37.0, 39.0, 52.0, 56.0, 38.0, 56.0, 44.0, 46.0, 51.0, 31.0, 43.0, 27.0, 27.0, 22.0, 27.0, 19.0, 16.0, 19.0, 12.0, 18.0, 14.0, 11.0, 6.0, 6.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5644503831863403, -1.5151917934417725, -1.4659332036972046, -1.4166746139526367, -1.3674159049987793, -1.3181573152542114, -1.2688987255096436, -1.2196401357650757, -1.1703815460205078, -1.12112295627594, -1.071864366531372, -1.0226056575775146, -0.9733470678329468, -0.9240884780883789, -0.874829888343811, -0.8255712985992432, -0.7763125896453857, -0.7270539999008179, -0.6777953505516052, -0.6285367608070374, -0.5792781114578247, -0.5300195217132568, -0.48076093196868896, -0.4315023124217987, -0.38224369287490845, -0.3329850733280182, -0.28372645378112793, -0.23446786403656006, -0.1852092444896698, -0.13595062494277954, -0.08669203519821167, -0.03743341565132141, 0.011825084686279297, 0.06108369678258896, 0.11034230887889862, 0.15960091352462769, 0.20885953307151794, 0.2581181526184082, 0.3073767423629761, 0.35663536190986633, 0.4058939814567566, 0.45515260100364685, 0.5044112205505371, 0.553669810295105, 0.6029284000396729, 0.6521870493888855, 0.7014456391334534, 0.750704288482666, 0.7999628782272339, 0.8492214679718018, 0.8984801173210144, 0.9477387070655823, 0.9969973564147949, 1.0462559461593628, 1.0955145359039307, 1.1447731256484985, 1.1940317153930664, 1.2432903051376343, 1.2925488948822021, 1.3418076038360596, 1.3910661935806274, 1.4403247833251953, 1.4895833730697632, 1.538841962814331, 1.5881006717681885]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 9.0, 5.0, 8.0, 14.0, 21.0, 31.0, 41.0, 58.0, 90.0, 114.0, 181.0, 297.0, 562.0, 1007.0, 2047.0, 5116.0, 17855.0, 110753.0, 2679100.0, 1279506.0, 74409.0, 14292.0, 4563.0, 1954.0, 935.0, 490.0, 292.0, 179.0, 133.0, 71.0, 51.0, 32.0, 30.0, 13.0, 8.0, 8.0, 1.0, 7.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97900390625, -0.9501266479492188, -0.9212493896484375, -0.8923721313476562, -0.863494873046875, -0.8346176147460938, -0.8057403564453125, -0.7768630981445312, -0.74798583984375, -0.7191085815429688, -0.6902313232421875, -0.6613540649414062, -0.632476806640625, -0.6035995483398438, -0.5747222900390625, -0.5458450317382812, -0.5169677734375, -0.48809051513671875, -0.4592132568359375, -0.43033599853515625, -0.401458740234375, -0.37258148193359375, -0.3437042236328125, -0.31482696533203125, -0.28594970703125, -0.25707244873046875, -0.2281951904296875, -0.19931793212890625, -0.170440673828125, -0.14156341552734375, -0.1126861572265625, -0.08380889892578125, -0.054931640625, -0.02605438232421875, 0.0028228759765625, 0.03170013427734375, 0.060577392578125, 0.08945465087890625, 0.1183319091796875, 0.14720916748046875, 0.17608642578125, 0.20496368408203125, 0.2338409423828125, 0.26271820068359375, 0.291595458984375, 0.32047271728515625, 0.3493499755859375, 0.37822723388671875, 0.4071044921875, 0.43598175048828125, 0.4648590087890625, 0.49373626708984375, 0.522613525390625, 0.5514907836914062, 0.5803680419921875, 0.6092453002929688, 0.63812255859375, 0.6669998168945312, 0.6958770751953125, 0.7247543334960938, 0.753631591796875, 0.7825088500976562, 0.8113861083984375, 0.8402633666992188, 0.869140625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 10.0, 19.0, 20.0, 24.0, 35.0, 52.0, 56.0, 86.0, 70.0, 94.0, 76.0, 90.0, 74.0, 57.0, 54.0, 39.0, 37.0, 22.0, 16.0, 19.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81298828125, -0.7915878295898438, -0.7701873779296875, -0.7487869262695312, -0.727386474609375, -0.7059860229492188, -0.6845855712890625, -0.6631851196289062, -0.64178466796875, -0.6203842163085938, -0.5989837646484375, -0.5775833129882812, -0.556182861328125, -0.5347824096679688, -0.5133819580078125, -0.49198150634765625, -0.4705810546875, -0.44918060302734375, -0.4277801513671875, -0.40637969970703125, -0.384979248046875, -0.36357879638671875, -0.3421783447265625, -0.32077789306640625, -0.29937744140625, -0.27797698974609375, -0.2565765380859375, -0.23517608642578125, -0.213775634765625, -0.19237518310546875, -0.1709747314453125, -0.14957427978515625, -0.128173828125, -0.10677337646484375, -0.0853729248046875, -0.06397247314453125, -0.042572021484375, -0.02117156982421875, 0.0002288818359375, 0.02162933349609375, 0.04302978515625, 0.06443023681640625, 0.0858306884765625, 0.10723114013671875, 0.128631591796875, 0.15003204345703125, 0.1714324951171875, 0.19283294677734375, 0.2142333984375, 0.23563385009765625, 0.2570343017578125, 0.27843475341796875, 0.299835205078125, 0.32123565673828125, 0.3426361083984375, 0.36403656005859375, 0.38543701171875, 0.40683746337890625, 0.4282379150390625, 0.44963836669921875, 0.471038818359375, 0.49243927001953125, 0.5138397216796875, 0.5352401733398438, 0.556640625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 6.0, 10.0, 5.0, 17.0, 18.0, 40.0, 76.0, 138.0, 236.0, 536.0, 1410.0, 4386.0, 21096.0, 233023.0, 3762302.0, 148513.0, 16556.0, 3725.0, 1209.0, 459.0, 217.0, 121.0, 60.0, 35.0, 22.0, 14.0, 14.0, 10.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95361328125, -0.9188461303710938, -0.8840789794921875, -0.8493118286132812, -0.814544677734375, -0.7797775268554688, -0.7450103759765625, -0.7102432250976562, -0.67547607421875, -0.6407089233398438, -0.6059417724609375, -0.5711746215820312, -0.536407470703125, -0.5016403198242188, -0.4668731689453125, -0.43210601806640625, -0.3973388671875, -0.36257171630859375, -0.3278045654296875, -0.29303741455078125, -0.258270263671875, -0.22350311279296875, -0.1887359619140625, -0.15396881103515625, -0.11920166015625, -0.08443450927734375, -0.0496673583984375, -0.01490020751953125, 0.019866943359375, 0.05463409423828125, 0.0894012451171875, 0.12416839599609375, 0.158935546875, 0.19370269775390625, 0.2284698486328125, 0.26323699951171875, 0.298004150390625, 0.33277130126953125, 0.3675384521484375, 0.40230560302734375, 0.43707275390625, 0.47183990478515625, 0.5066070556640625, 0.5413742065429688, 0.576141357421875, 0.6109085083007812, 0.6456756591796875, 0.6804428100585938, 0.7152099609375, 0.7499771118164062, 0.7847442626953125, 0.8195114135742188, 0.854278564453125, 0.8890457153320312, 0.9238128662109375, 0.9585800170898438, 0.99334716796875, 1.0281143188476562, 1.0628814697265625, 1.0976486206054688, 1.132415771484375, 1.1671829223632812, 1.2019500732421875, 1.2367172241210938, 1.271484375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 7.0, 7.0, 15.0, 11.0, 16.0, 20.0, 31.0, 51.0, 83.0, 94.0, 157.0, 269.0, 516.0, 935.0, 778.0, 435.0, 226.0, 139.0, 85.0, 53.0, 35.0, 29.0, 19.0, 13.0, 12.0, 9.0, 8.0, 8.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2688312530517578, -0.2615394592285156, -0.25424766540527344, -0.24695587158203125, -0.23966407775878906, -0.23237228393554688, -0.2250804901123047, -0.2177886962890625, -0.2104969024658203, -0.20320510864257812, -0.19591331481933594, -0.18862152099609375, -0.18132972717285156, -0.17403793334960938, -0.1667461395263672, -0.159454345703125, -0.1521625518798828, -0.14487075805664062, -0.13757896423339844, -0.13028717041015625, -0.12299537658691406, -0.11570358276367188, -0.10841178894042969, -0.1011199951171875, -0.09382820129394531, -0.08653640747070312, -0.07924461364746094, -0.07195281982421875, -0.06466102600097656, -0.057369232177734375, -0.05007743835449219, -0.04278564453125, -0.03549385070800781, -0.028202056884765625, -0.020910263061523438, -0.01361846923828125, -0.0063266754150390625, 0.000965118408203125, 0.008256912231445312, 0.0155487060546875, 0.022840499877929688, 0.030132293701171875, 0.03742408752441406, 0.04471588134765625, 0.05200767517089844, 0.059299468994140625, 0.06659126281738281, 0.073883056640625, 0.08117485046386719, 0.08846664428710938, 0.09575843811035156, 0.10305023193359375, 0.11034202575683594, 0.11763381958007812, 0.12492561340332031, 0.1322174072265625, 0.1395092010498047, 0.14680099487304688, 0.15409278869628906, 0.16138458251953125, 0.16867637634277344, 0.17596817016601562, 0.1832599639892578, 0.1905517578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 10.0, 13.0, 15.0, 35.0, 56.0, 70.0, 94.0, 122.0, 126.0, 154.0, 89.0, 67.0, 49.0, 19.0, 22.0, 9.0, 12.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1374131441116333, -1.1022365093231201, -1.067059874534607, -1.0318832397460938, -0.9967066049575806, -0.9615299701690674, -0.9263532757759094, -0.8911766409873962, -0.8560000061988831, -0.8208233714103699, -0.7856467366218567, -0.7504701018333435, -0.7152934074401855, -0.6801167726516724, -0.6449401378631592, -0.609763503074646, -0.5745868682861328, -0.5394102334976196, -0.5042335987091064, -0.4690569341182709, -0.4338802993297577, -0.3987036645412445, -0.36352699995040894, -0.32835036516189575, -0.29317373037338257, -0.2579970955848694, -0.222820445895195, -0.18764379620552063, -0.15246716141700745, -0.11729052662849426, -0.08211387693881989, -0.04693722724914551, -0.011760711669921875, 0.023415930569171906, 0.058592572808265686, 0.09376921504735947, 0.12894585728645325, 0.16412249207496643, 0.1992991417646408, 0.23447579145431519, 0.26965242624282837, 0.30482906103134155, 0.34000569581985474, 0.3751823604106903, 0.4103589951992035, 0.4455356299877167, 0.48071229457855225, 0.5158889293670654, 0.5510655641555786, 0.5862421989440918, 0.621418833732605, 0.6565954685211182, 0.6917721033096313, 0.7269487380981445, 0.7621254324913025, 0.7973020672798157, 0.8324787020683289, 0.867655336856842, 0.9028319716453552, 0.9380086064338684, 0.9731853008270264, 1.0083619356155396, 1.0435385704040527, 1.078715205192566, 1.113891839981079]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 0.0, 4.0, 6.0, 3.0, 5.0, 9.0, 15.0, 8.0, 30.0, 16.0, 23.0, 39.0, 41.0, 49.0, 53.0, 55.0, 56.0, 51.0, 48.0, 67.0, 62.0, 52.0, 47.0, 47.0, 40.0, 40.0, 31.0, 20.0, 14.0, 13.0, 14.0, 8.0, 8.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6562923192977905, -0.6367194652557373, -0.6171466708183289, -0.5975738167762756, -0.5780009627342224, -0.558428168296814, -0.5388553142547607, -0.5192824602127075, -0.4997096359729767, -0.48013681173324585, -0.4605639576911926, -0.4409911334514618, -0.42141830921173096, -0.40184545516967773, -0.3822726309299469, -0.36269980669021606, -0.34312695264816284, -0.323554128408432, -0.3039812743663788, -0.28440845012664795, -0.2648355960845947, -0.2452627718448639, -0.22568994760513306, -0.20611710846424103, -0.186544269323349, -0.16697143018245697, -0.14739859104156494, -0.1278257668018341, -0.10825292766094208, -0.08868008852005005, -0.06910725682973862, -0.049534425139427185, -0.02996164560317993, -0.010388810187578201, 0.009184025228023529, 0.02875686064362526, 0.04832969605922699, 0.06790253520011902, 0.08747536689043045, 0.10704819858074188, 0.1266210377216339, 0.14619387686252594, 0.16576671600341797, 0.1853395402431488, 0.20491237938404083, 0.22448521852493286, 0.2440580427646637, 0.26363086700439453, 0.28320372104644775, 0.3027765452861786, 0.3223493993282318, 0.34192222356796265, 0.36149507761001587, 0.3810679018497467, 0.40064072608947754, 0.42021358013153076, 0.4397864043712616, 0.45935922861099243, 0.47893208265304565, 0.4985049068927765, 0.5180777311325073, 0.5376505851745605, 0.5572234392166138, 0.5767962336540222, 0.5963690876960754]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 13.0, 7.0, 26.0, 38.0, 57.0, 92.0, 152.0, 277.0, 446.0, 869.0, 1815.0, 3884.0, 10529.0, 37396.0, 227221.0, 595862.0, 130936.0, 24891.0, 7756.0, 3089.0, 1476.0, 733.0, 391.0, 226.0, 142.0, 78.0, 56.0, 27.0, 24.0, 13.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.149169921875, -0.14441299438476562, -0.13965606689453125, -0.13489913940429688, -0.1301422119140625, -0.12538528442382812, -0.12062835693359375, -0.11587142944335938, -0.111114501953125, -0.10635757446289062, -0.10160064697265625, -0.09684371948242188, -0.0920867919921875, -0.08732986450195312, -0.08257293701171875, -0.07781600952148438, -0.07305908203125, -0.06830215454101562, -0.06354522705078125, -0.058788299560546875, -0.0540313720703125, -0.049274444580078125, -0.04451751708984375, -0.039760589599609375, -0.035003662109375, -0.030246734619140625, -0.02548980712890625, -0.020732879638671875, -0.0159759521484375, -0.011219024658203125, -0.00646209716796875, -0.001705169677734375, 0.0030517578125, 0.007808685302734375, 0.01256561279296875, 0.017322540283203125, 0.0220794677734375, 0.026836395263671875, 0.03159332275390625, 0.036350250244140625, 0.041107177734375, 0.045864105224609375, 0.05062103271484375, 0.055377960205078125, 0.0601348876953125, 0.06489181518554688, 0.06964874267578125, 0.07440567016601562, 0.07916259765625, 0.08391952514648438, 0.08867645263671875, 0.09343338012695312, 0.0981903076171875, 0.10294723510742188, 0.10770416259765625, 0.11246109008789062, 0.117218017578125, 0.12197494506835938, 0.12673187255859375, 0.13148880004882812, 0.1362457275390625, 0.14100265502929688, 0.14575958251953125, 0.15051651000976562, 0.1552734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 11.0, 5.0, 7.0, 17.0, 25.0, 18.0, 25.0, 39.0, 34.0, 60.0, 60.0, 53.0, 54.0, 77.0, 65.0, 53.0, 70.0, 55.0, 53.0, 40.0, 30.0, 26.0, 20.0, 27.0, 9.0, 11.0, 7.0, 10.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.4892578125, -0.4752311706542969, -0.46120452880859375, -0.4471778869628906, -0.4331512451171875, -0.4191246032714844, -0.40509796142578125, -0.3910713195800781, -0.377044677734375, -0.3630180358886719, -0.34899139404296875, -0.3349647521972656, -0.3209381103515625, -0.3069114685058594, -0.29288482666015625, -0.2788581848144531, -0.26483154296875, -0.2508049011230469, -0.23677825927734375, -0.22275161743164062, -0.2087249755859375, -0.19469833374023438, -0.18067169189453125, -0.16664505004882812, -0.152618408203125, -0.13859176635742188, -0.12456512451171875, -0.11053848266601562, -0.0965118408203125, -0.08248519897460938, -0.06845855712890625, -0.054431915283203125, -0.0404052734375, -0.026378631591796875, -0.01235198974609375, 0.001674652099609375, 0.0157012939453125, 0.029727935791015625, 0.04375457763671875, 0.057781219482421875, 0.071807861328125, 0.08583450317382812, 0.09986114501953125, 0.11388778686523438, 0.1279144287109375, 0.14194107055664062, 0.15596771240234375, 0.16999435424804688, 0.18402099609375, 0.19804763793945312, 0.21207427978515625, 0.22610092163085938, 0.2401275634765625, 0.2541542053222656, 0.26818084716796875, 0.2822074890136719, 0.296234130859375, 0.3102607727050781, 0.32428741455078125, 0.3383140563964844, 0.3523406982421875, 0.3663673400878906, 0.38039398193359375, 0.3944206237792969, 0.408447265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 2.0, 6.0, 9.0, 8.0, 13.0, 22.0, 30.0, 43.0, 58.0, 83.0, 137.0, 179.0, 318.0, 534.0, 977.0, 1973.0, 4362.0, 12194.0, 49426.0, 335475.0, 527750.0, 86253.0, 17523.0, 5794.0, 2548.0, 1209.0, 651.0, 326.0, 225.0, 125.0, 91.0, 48.0, 35.0, 28.0, 21.0, 13.0, 15.0, 13.0, 5.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11346435546875, -0.10970211029052734, -0.10593986511230469, -0.10217761993408203, -0.09841537475585938, -0.09465312957763672, -0.09089088439941406, -0.0871286392211914, -0.08336639404296875, -0.0796041488647461, -0.07584190368652344, -0.07207965850830078, -0.06831741333007812, -0.06455516815185547, -0.06079292297363281, -0.057030677795410156, -0.0532684326171875, -0.049506187438964844, -0.04574394226074219, -0.04198169708251953, -0.038219451904296875, -0.03445720672607422, -0.030694961547851562, -0.026932716369628906, -0.02317047119140625, -0.019408226013183594, -0.015645980834960938, -0.011883735656738281, -0.008121490478515625, -0.004359245300292969, -0.0005970001220703125, 0.0031652450561523438, 0.006927490234375, 0.010689735412597656, 0.014451980590820312, 0.01821422576904297, 0.021976470947265625, 0.02573871612548828, 0.029500961303710938, 0.033263206481933594, 0.03702545166015625, 0.040787696838378906, 0.04454994201660156, 0.04831218719482422, 0.052074432373046875, 0.05583667755126953, 0.05959892272949219, 0.06336116790771484, 0.0671234130859375, 0.07088565826416016, 0.07464790344238281, 0.07841014862060547, 0.08217239379882812, 0.08593463897705078, 0.08969688415527344, 0.0934591293334961, 0.09722137451171875, 0.1009836196899414, 0.10474586486816406, 0.10850811004638672, 0.11227035522460938, 0.11603260040283203, 0.11979484558105469, 0.12355709075927734, 0.1273193359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 3.0, 7.0, 5.0, 11.0, 9.0, 14.0, 20.0, 26.0, 21.0, 18.0, 34.0, 38.0, 32.0, 39.0, 54.0, 38.0, 34.0, 36.0, 63.0, 47.0, 46.0, 42.0, 50.0, 47.0, 27.0, 49.0, 32.0, 28.0, 24.0, 15.0, 15.0, 20.0, 11.0, 11.0, 8.0, 9.0, 4.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7021484375, -0.67999267578125, -0.6578369140625, -0.63568115234375, -0.613525390625, -0.59136962890625, -0.5692138671875, -0.54705810546875, -0.52490234375, -0.50274658203125, -0.4805908203125, -0.45843505859375, -0.436279296875, -0.41412353515625, -0.3919677734375, -0.36981201171875, -0.34765625, -0.32550048828125, -0.3033447265625, -0.28118896484375, -0.259033203125, -0.23687744140625, -0.2147216796875, -0.19256591796875, -0.17041015625, -0.14825439453125, -0.1260986328125, -0.10394287109375, -0.081787109375, -0.05963134765625, -0.0374755859375, -0.01531982421875, 0.0068359375, 0.02899169921875, 0.0511474609375, 0.07330322265625, 0.095458984375, 0.11761474609375, 0.1397705078125, 0.16192626953125, 0.18408203125, 0.20623779296875, 0.2283935546875, 0.25054931640625, 0.272705078125, 0.29486083984375, 0.3170166015625, 0.33917236328125, 0.361328125, 0.38348388671875, 0.4056396484375, 0.42779541015625, 0.449951171875, 0.47210693359375, 0.4942626953125, 0.51641845703125, 0.53857421875, 0.56072998046875, 0.5828857421875, 0.60504150390625, 0.627197265625, 0.64935302734375, 0.6715087890625, 0.69366455078125, 0.7158203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 8.0, 16.0, 27.0, 34.0, 61.0, 84.0, 159.0, 281.0, 487.0, 902.0, 1824.0, 4378.0, 13170.0, 68243.0, 674378.0, 244558.0, 27140.0, 7315.0, 2745.0, 1283.0, 622.0, 359.0, 180.0, 90.0, 80.0, 39.0, 22.0, 18.0, 14.0, 8.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052215576171875, -0.05026388168334961, -0.04831218719482422, -0.04636049270629883, -0.04440879821777344, -0.04245710372924805, -0.040505409240722656, -0.038553714752197266, -0.036602020263671875, -0.034650325775146484, -0.032698631286621094, -0.030746936798095703, -0.028795242309570312, -0.026843547821044922, -0.02489185333251953, -0.02294015884399414, -0.02098846435546875, -0.01903676986694336, -0.01708507537841797, -0.015133380889892578, -0.013181686401367188, -0.011229991912841797, -0.009278297424316406, -0.007326602935791016, -0.005374908447265625, -0.0034232139587402344, -0.0014715194702148438, 0.0004801750183105469, 0.0024318695068359375, 0.004383563995361328, 0.006335258483886719, 0.00828695297241211, 0.0102386474609375, 0.01219034194946289, 0.014142036437988281, 0.016093730926513672, 0.018045425415039062, 0.019997119903564453, 0.021948814392089844, 0.023900508880615234, 0.025852203369140625, 0.027803897857666016, 0.029755592346191406, 0.0317072868347168, 0.03365898132324219, 0.03561067581176758, 0.03756237030029297, 0.03951406478881836, 0.04146575927734375, 0.04341745376586914, 0.04536914825439453, 0.04732084274291992, 0.04927253723144531, 0.0512242317199707, 0.053175926208496094, 0.055127620697021484, 0.057079315185546875, 0.059031009674072266, 0.060982704162597656, 0.06293439865112305, 0.06488609313964844, 0.06683778762817383, 0.06878948211669922, 0.07074117660522461, 0.07269287109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 4.0, 8.0, 23.0, 26.0, 33.0, 67.0, 87.0, 132.0, 140.0, 143.0, 91.0, 75.0, 63.0, 32.0, 19.0, 10.0, 12.0, 8.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8908252716064453e-05, -2.793874591588974e-05, -2.6969239115715027e-05, -2.5999732315540314e-05, -2.50302255153656e-05, -2.4060718715190887e-05, -2.3091211915016174e-05, -2.212170511484146e-05, -2.1152198314666748e-05, -2.0182691514492035e-05, -1.9213184714317322e-05, -1.824367791414261e-05, -1.7274171113967896e-05, -1.6304664313793182e-05, -1.533515751361847e-05, -1.4365650713443756e-05, -1.3396143913269043e-05, -1.242663711309433e-05, -1.1457130312919617e-05, -1.0487623512744904e-05, -9.51811671257019e-06, -8.548609912395477e-06, -7.579103112220764e-06, -6.609596312046051e-06, -5.640089511871338e-06, -4.670582711696625e-06, -3.7010759115219116e-06, -2.7315691113471985e-06, -1.7620623111724854e-06, -7.925555109977722e-07, 1.7695128917694092e-07, 1.146458089351654e-06, 2.115964889526367e-06, 3.0854716897010803e-06, 4.0549784898757935e-06, 5.024485290050507e-06, 5.99399209022522e-06, 6.963498890399933e-06, 7.933005690574646e-06, 8.902512490749359e-06, 9.872019290924072e-06, 1.0841526091098785e-05, 1.1811032891273499e-05, 1.2780539691448212e-05, 1.3750046491622925e-05, 1.4719553291797638e-05, 1.568906009197235e-05, 1.6658566892147064e-05, 1.7628073692321777e-05, 1.859758049249649e-05, 1.9567087292671204e-05, 2.0536594092845917e-05, 2.150610089302063e-05, 2.2475607693195343e-05, 2.3445114493370056e-05, 2.441462129354477e-05, 2.5384128093719482e-05, 2.6353634893894196e-05, 2.732314169406891e-05, 2.8292648494243622e-05, 2.9262155294418335e-05, 3.0231662094593048e-05, 3.120116889476776e-05, 3.2170675694942474e-05, 3.314018249511719e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 4.0, 7.0, 10.0, 14.0, 17.0, 28.0, 37.0, 62.0, 108.0, 179.0, 283.0, 520.0, 883.0, 1633.0, 3183.0, 6679.0, 15945.0, 49617.0, 205785.0, 519836.0, 173309.0, 43443.0, 14443.0, 6126.0, 2796.0, 1601.0, 827.0, 442.0, 289.0, 163.0, 95.0, 61.0, 42.0, 24.0, 17.0, 11.0, 4.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.044891357421875, -0.0435490608215332, -0.042206764221191406, -0.04086446762084961, -0.03952217102050781, -0.038179874420166016, -0.03683757781982422, -0.03549528121948242, -0.034152984619140625, -0.03281068801879883, -0.03146839141845703, -0.030126094818115234, -0.028783798217773438, -0.02744150161743164, -0.026099205017089844, -0.024756908416748047, -0.02341461181640625, -0.022072315216064453, -0.020730018615722656, -0.01938772201538086, -0.018045425415039062, -0.016703128814697266, -0.015360832214355469, -0.014018535614013672, -0.012676239013671875, -0.011333942413330078, -0.009991645812988281, -0.008649349212646484, -0.0073070526123046875, -0.005964756011962891, -0.004622459411621094, -0.003280162811279297, -0.0019378662109375, -0.0005955696105957031, 0.0007467269897460938, 0.0020890235900878906, 0.0034313201904296875, 0.004773616790771484, 0.006115913391113281, 0.007458209991455078, 0.008800506591796875, 0.010142803192138672, 0.011485099792480469, 0.012827396392822266, 0.014169692993164062, 0.01551198959350586, 0.016854286193847656, 0.018196582794189453, 0.01953887939453125, 0.020881175994873047, 0.022223472595214844, 0.02356576919555664, 0.024908065795898438, 0.026250362396240234, 0.02759265899658203, 0.028934955596923828, 0.030277252197265625, 0.03161954879760742, 0.03296184539794922, 0.034304141998291016, 0.03564643859863281, 0.03698873519897461, 0.038331031799316406, 0.0396733283996582, 0.041015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 10.0, 16.0, 13.0, 16.0, 39.0, 34.0, 75.0, 81.0, 103.0, 110.0, 124.0, 91.0, 84.0, 46.0, 41.0, 32.0, 22.0, 12.0, 15.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.01465606689453125, -0.014222502708435059, -0.013788938522338867, -0.013355374336242676, -0.012921810150146484, -0.012488245964050293, -0.012054681777954102, -0.01162111759185791, -0.011187553405761719, -0.010753989219665527, -0.010320425033569336, -0.009886860847473145, -0.009453296661376953, -0.009019732475280762, -0.00858616828918457, -0.008152604103088379, -0.0077190399169921875, -0.007285475730895996, -0.006851911544799805, -0.006418347358703613, -0.005984783172607422, -0.0055512189865112305, -0.005117654800415039, -0.004684090614318848, -0.004250526428222656, -0.003816962242126465, -0.0033833980560302734, -0.002949833869934082, -0.0025162696838378906, -0.0020827054977416992, -0.0016491413116455078, -0.0012155771255493164, -0.000782012939453125, -0.0003484487533569336, 8.511543273925781e-05, 0.0005186796188354492, 0.0009522438049316406, 0.001385807991027832, 0.0018193721771240234, 0.002252936363220215, 0.0026865005493164062, 0.0031200647354125977, 0.003553628921508789, 0.0039871931076049805, 0.004420757293701172, 0.004854321479797363, 0.005287885665893555, 0.005721449851989746, 0.0061550140380859375, 0.006588578224182129, 0.00702214241027832, 0.007455706596374512, 0.007889270782470703, 0.008322834968566895, 0.008756399154663086, 0.009189963340759277, 0.009623527526855469, 0.01005709171295166, 0.010490655899047852, 0.010924220085144043, 0.011357784271240234, 0.011791348457336426, 0.012224912643432617, 0.012658476829528809, 0.013092041015625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 5.0, 5.0, 11.0, 8.0, 17.0, 29.0, 52.0, 103.0, 116.0, 154.0, 170.0, 134.0, 68.0, 41.0, 30.0, 17.0, 8.0, 13.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8422192931175232, -0.8157488107681274, -0.7892783284187317, -0.7628079056739807, -0.736337423324585, -0.7098669409751892, -0.6833964586257935, -0.6569260358810425, -0.6304555535316467, -0.603985071182251, -0.5775145888328552, -0.5510441660881042, -0.5245736837387085, -0.49810320138931274, -0.471632719039917, -0.44516226649284363, -0.4186917841434479, -0.3922213017940521, -0.36575084924697876, -0.339280366897583, -0.31280991435050964, -0.2863394320011139, -0.2598689794540405, -0.23339849710464478, -0.20692802965641022, -0.18045756220817566, -0.1539870947599411, -0.12751662731170654, -0.10104615241289139, -0.07457567751407623, -0.048105210065841675, -0.021634742617607117, 0.004835724830627441, 0.031306192278862, 0.057776663452386856, 0.08424713462591171, 0.11071760207414627, 0.13718807697296143, 0.16365854442119598, 0.19012901186943054, 0.2165994793176651, 0.24306994676589966, 0.2695404291152954, 0.2960108816623688, 0.3224813640117645, 0.3489518165588379, 0.37542229890823364, 0.4018927812576294, 0.42836323380470276, 0.4548337161540985, 0.4813041687011719, 0.5077746510505676, 0.5342451333999634, 0.5607155561447144, 0.5871860384941101, 0.6136565208435059, 0.6401270031929016, 0.6665974855422974, 0.6930679678916931, 0.7195383906364441, 0.7460088729858398, 0.7724793553352356, 0.7989498376846313, 0.8254202604293823, 0.8518907427787781]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 8.0, 11.0, 9.0, 11.0, 25.0, 22.0, 28.0, 46.0, 51.0, 51.0, 59.0, 63.0, 69.0, 58.0, 74.0, 60.0, 57.0, 51.0, 40.0, 51.0, 32.0, 22.0, 18.0, 13.0, 9.0, 14.0, 7.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.46091294288635254, -0.4472023546695709, -0.4334917664527893, -0.4197811484336853, -0.4060705602169037, -0.39235997200012207, -0.37864935398101807, -0.36493876576423645, -0.35122817754745483, -0.3375175893306732, -0.3238070011138916, -0.3100963830947876, -0.296385794878006, -0.28267520666122437, -0.26896458864212036, -0.25525400042533875, -0.24154341220855713, -0.2278328239917755, -0.2141222208738327, -0.2004116177558899, -0.18670102953910828, -0.17299044132232666, -0.15927983820438385, -0.14556923508644104, -0.13185864686965942, -0.11814805120229721, -0.104437455534935, -0.09072685986757278, -0.07701626420021057, -0.06330566853284836, -0.049595072865486145, -0.03588447719812393, -0.02217385172843933, -0.008463256061077118, 0.005247339606285095, 0.01895793527364731, 0.03266853094100952, 0.046379126608371735, 0.06008972227573395, 0.07380031794309616, 0.08751091361045837, 0.10122150927782059, 0.1149321049451828, 0.1286427080631256, 0.14235329627990723, 0.15606388449668884, 0.16977448761463165, 0.18348509073257446, 0.19719567894935608, 0.2109062671661377, 0.2246168702840805, 0.23832747340202332, 0.25203806161880493, 0.26574864983558655, 0.27945923805236816, 0.29316985607147217, 0.3068804442882538, 0.3205910325050354, 0.3343016505241394, 0.348012238740921, 0.36172282695770264, 0.37543341517448425, 0.38914400339126587, 0.4028546214103699, 0.4165652096271515]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 14.0, 19.0, 30.0, 36.0, 49.0, 80.0, 120.0, 234.0, 370.0, 550.0, 1023.0, 2198.0, 4654.0, 11256.0, 34352.0, 182632.0, 691985.0, 83027.0, 21245.0, 7713.0, 3280.0, 1572.0, 856.0, 494.0, 286.0, 167.0, 89.0, 69.0, 44.0, 38.0, 16.0, 15.0, 8.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49169921875, -0.47599029541015625, -0.4602813720703125, -0.44457244873046875, -0.428863525390625, -0.41315460205078125, -0.3974456787109375, -0.38173675537109375, -0.36602783203125, -0.35031890869140625, -0.3346099853515625, -0.31890106201171875, -0.303192138671875, -0.28748321533203125, -0.2717742919921875, -0.25606536865234375, -0.2403564453125, -0.22464752197265625, -0.2089385986328125, -0.19322967529296875, -0.177520751953125, -0.16181182861328125, -0.1461029052734375, -0.13039398193359375, -0.11468505859375, -0.09897613525390625, -0.0832672119140625, -0.06755828857421875, -0.051849365234375, -0.03614044189453125, -0.0204315185546875, -0.00472259521484375, 0.010986328125, 0.02669525146484375, 0.0424041748046875, 0.05811309814453125, 0.073822021484375, 0.08953094482421875, 0.1052398681640625, 0.12094879150390625, 0.13665771484375, 0.15236663818359375, 0.1680755615234375, 0.18378448486328125, 0.199493408203125, 0.21520233154296875, 0.2309112548828125, 0.24662017822265625, 0.2623291015625, 0.27803802490234375, 0.2937469482421875, 0.30945587158203125, 0.325164794921875, 0.34087371826171875, 0.3565826416015625, 0.37229156494140625, 0.38800048828125, 0.40370941162109375, 0.4194183349609375, 0.43512725830078125, 0.450836181640625, 0.46654510498046875, 0.4822540283203125, 0.49796295166015625, 0.513671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 10.0, 5.0, 6.0, 8.0, 10.0, 13.0, 22.0, 33.0, 31.0, 48.0, 58.0, 67.0, 62.0, 62.0, 75.0, 72.0, 67.0, 62.0, 55.0, 44.0, 38.0, 30.0, 25.0, 26.0, 14.0, 11.0, 11.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0439453125, -1.0154342651367188, -0.9869232177734375, -0.9584121704101562, -0.929901123046875, -0.9013900756835938, -0.8728790283203125, -0.8443679809570312, -0.81585693359375, -0.7873458862304688, -0.7588348388671875, -0.7303237915039062, -0.701812744140625, -0.6733016967773438, -0.6447906494140625, -0.6162796020507812, -0.5877685546875, -0.5592575073242188, -0.5307464599609375, -0.5022354125976562, -0.473724365234375, -0.44521331787109375, -0.4167022705078125, -0.38819122314453125, -0.35968017578125, -0.33116912841796875, -0.3026580810546875, -0.27414703369140625, -0.245635986328125, -0.21712493896484375, -0.1886138916015625, -0.16010284423828125, -0.131591796875, -0.10308074951171875, -0.0745697021484375, -0.04605865478515625, -0.017547607421875, 0.01096343994140625, 0.0394744873046875, 0.06798553466796875, 0.09649658203125, 0.12500762939453125, 0.1535186767578125, 0.18202972412109375, 0.210540771484375, 0.23905181884765625, 0.2675628662109375, 0.29607391357421875, 0.3245849609375, 0.35309600830078125, 0.3816070556640625, 0.41011810302734375, 0.438629150390625, 0.46714019775390625, 0.4956512451171875, 0.5241622924804688, 0.55267333984375, 0.5811843872070312, 0.6096954345703125, 0.6382064819335938, 0.666717529296875, 0.6952285766601562, 0.7237396240234375, 0.7522506713867188, 0.78076171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 6.0, 2.0, 5.0, 4.0, 9.0, 13.0, 10.0, 7.0, 20.0, 27.0, 26.0, 47.0, 68.0, 103.0, 169.0, 297.0, 842.0, 2658.0, 12897.0, 116771.0, 855813.0, 48432.0, 7455.0, 1672.0, 528.0, 259.0, 116.0, 67.0, 59.0, 43.0, 35.0, 24.0, 16.0, 7.0, 11.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7109375, -0.6866989135742188, -0.6624603271484375, -0.6382217407226562, -0.613983154296875, -0.5897445678710938, -0.5655059814453125, -0.5412673950195312, -0.51702880859375, -0.49279022216796875, -0.4685516357421875, -0.44431304931640625, -0.420074462890625, -0.39583587646484375, -0.3715972900390625, -0.34735870361328125, -0.3231201171875, -0.29888153076171875, -0.2746429443359375, -0.25040435791015625, -0.226165771484375, -0.20192718505859375, -0.1776885986328125, -0.15345001220703125, -0.12921142578125, -0.10497283935546875, -0.0807342529296875, -0.05649566650390625, -0.032257080078125, -0.00801849365234375, 0.0162200927734375, 0.04045867919921875, 0.064697265625, 0.08893585205078125, 0.1131744384765625, 0.13741302490234375, 0.161651611328125, 0.18589019775390625, 0.2101287841796875, 0.23436737060546875, 0.25860595703125, 0.28284454345703125, 0.3070831298828125, 0.33132171630859375, 0.355560302734375, 0.37979888916015625, 0.4040374755859375, 0.42827606201171875, 0.4525146484375, 0.47675323486328125, 0.5009918212890625, 0.5252304077148438, 0.549468994140625, 0.5737075805664062, 0.5979461669921875, 0.6221847534179688, 0.64642333984375, 0.6706619262695312, 0.6949005126953125, 0.7191390991210938, 0.743377685546875, 0.7676162719726562, 0.7918548583984375, 0.8160934448242188, 0.84033203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 5.0, 10.0, 8.0, 3.0, 7.0, 13.0, 19.0, 25.0, 22.0, 26.0, 33.0, 39.0, 64.0, 57.0, 74.0, 54.0, 69.0, 53.0, 51.0, 72.0, 41.0, 42.0, 33.0, 31.0, 30.0, 24.0, 21.0, 18.0, 18.0, 14.0, 9.0, 4.0, 4.0, 6.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.9958343505859375, -0.962371826171875, -0.9289093017578125, -0.89544677734375, -0.8619842529296875, -0.828521728515625, -0.7950592041015625, -0.7615966796875, -0.7281341552734375, -0.694671630859375, -0.6612091064453125, -0.62774658203125, -0.5942840576171875, -0.560821533203125, -0.5273590087890625, -0.493896484375, -0.4604339599609375, -0.426971435546875, -0.3935089111328125, -0.36004638671875, -0.3265838623046875, -0.293121337890625, -0.2596588134765625, -0.2261962890625, -0.1927337646484375, -0.159271240234375, -0.1258087158203125, -0.09234619140625, -0.0588836669921875, -0.025421142578125, 0.0080413818359375, 0.04150390625, 0.0749664306640625, 0.108428955078125, 0.1418914794921875, 0.17535400390625, 0.2088165283203125, 0.242279052734375, 0.2757415771484375, 0.3092041015625, 0.3426666259765625, 0.376129150390625, 0.4095916748046875, 0.44305419921875, 0.4765167236328125, 0.509979248046875, 0.5434417724609375, 0.576904296875, 0.6103668212890625, 0.643829345703125, 0.6772918701171875, 0.71075439453125, 0.7442169189453125, 0.777679443359375, 0.8111419677734375, 0.8446044921875, 0.8780670166015625, 0.911529541015625, 0.9449920654296875, 0.97845458984375, 1.0119171142578125, 1.045379638671875, 1.0788421630859375, 1.1123046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 6.0, 7.0, 9.0, 12.0, 16.0, 28.0, 39.0, 89.0, 192.0, 412.0, 983.0, 3357.0, 17940.0, 244841.0, 743217.0, 30346.0, 4762.0, 1314.0, 514.0, 217.0, 119.0, 62.0, 29.0, 19.0, 7.0, 4.0, 7.0, 1.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.364990234375, -0.3561134338378906, -0.34723663330078125, -0.3383598327636719, -0.3294830322265625, -0.3206062316894531, -0.31172943115234375, -0.3028526306152344, -0.293975830078125, -0.2850990295410156, -0.27622222900390625, -0.2673454284667969, -0.2584686279296875, -0.24959182739257812, -0.24071502685546875, -0.23183822631835938, -0.22296142578125, -0.21408462524414062, -0.20520782470703125, -0.19633102416992188, -0.1874542236328125, -0.17857742309570312, -0.16970062255859375, -0.16082382202148438, -0.151947021484375, -0.14307022094726562, -0.13419342041015625, -0.12531661987304688, -0.1164398193359375, -0.10756301879882812, -0.09868621826171875, -0.08980941772460938, -0.0809326171875, -0.07205581665039062, -0.06317901611328125, -0.054302215576171875, -0.0454254150390625, -0.036548614501953125, -0.02767181396484375, -0.018795013427734375, -0.009918212890625, -0.001041412353515625, 0.00783538818359375, 0.016712188720703125, 0.0255889892578125, 0.034465789794921875, 0.04334259033203125, 0.052219390869140625, 0.06109619140625, 0.06997299194335938, 0.07884979248046875, 0.08772659301757812, 0.0966033935546875, 0.10548019409179688, 0.11435699462890625, 0.12323379516601562, 0.132110595703125, 0.14098739624023438, 0.14986419677734375, 0.15874099731445312, 0.1676177978515625, 0.17649459838867188, 0.18537139892578125, 0.19424819946289062, 0.203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 6.0, 3.0, 7.0, 5.0, 9.0, 17.0, 24.0, 24.0, 17.0, 30.0, 43.0, 71.0, 100.0, 244.0, 154.0, 69.0, 48.0, 36.0, 24.0, 17.0, 14.0, 5.0, 11.0, 6.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.205371856689453e-05, -2.1224841475486755e-05, -2.039596438407898e-05, -1.9567087292671204e-05, -1.8738210201263428e-05, -1.7909333109855652e-05, -1.7080456018447876e-05, -1.62515789270401e-05, -1.5422701835632324e-05, -1.4593824744224548e-05, -1.3764947652816772e-05, -1.2936070561408997e-05, -1.210719347000122e-05, -1.1278316378593445e-05, -1.0449439287185669e-05, -9.620562195777893e-06, -8.791685104370117e-06, -7.962808012962341e-06, -7.1339309215545654e-06, -6.3050538301467896e-06, -5.476176738739014e-06, -4.647299647331238e-06, -3.818422555923462e-06, -2.989545464515686e-06, -2.16066837310791e-06, -1.3317912817001343e-06, -5.029141902923584e-07, 3.259629011154175e-07, 1.1548399925231934e-06, 1.9837170839309692e-06, 2.812594175338745e-06, 3.641471266746521e-06, 4.470348358154297e-06, 5.299225449562073e-06, 6.128102540969849e-06, 6.9569796323776245e-06, 7.7858567237854e-06, 8.614733815193176e-06, 9.443610906600952e-06, 1.0272487998008728e-05, 1.1101365089416504e-05, 1.193024218082428e-05, 1.2759119272232056e-05, 1.3587996363639832e-05, 1.4416873455047607e-05, 1.5245750546455383e-05, 1.607462763786316e-05, 1.6903504729270935e-05, 1.773238182067871e-05, 1.8561258912086487e-05, 1.9390136003494263e-05, 2.021901309490204e-05, 2.1047890186309814e-05, 2.187676727771759e-05, 2.2705644369125366e-05, 2.3534521460533142e-05, 2.4363398551940918e-05, 2.5192275643348694e-05, 2.602115273475647e-05, 2.6850029826164246e-05, 2.767890691757202e-05, 2.8507784008979797e-05, 2.9336661100387573e-05, 3.016553819179535e-05, 3.0994415283203125e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 8.0, 8.0, 17.0, 23.0, 33.0, 31.0, 82.0, 155.0, 292.0, 843.0, 2644.0, 12747.0, 93399.0, 844149.0, 79115.0, 11246.0, 2440.0, 743.0, 276.0, 125.0, 69.0, 34.0, 24.0, 13.0, 14.0, 9.0, 3.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2293701171875, -0.2213115692138672, -0.21325302124023438, -0.20519447326660156, -0.19713592529296875, -0.18907737731933594, -0.18101882934570312, -0.1729602813720703, -0.1649017333984375, -0.1568431854248047, -0.14878463745117188, -0.14072608947753906, -0.13266754150390625, -0.12460899353027344, -0.11655044555664062, -0.10849189758300781, -0.100433349609375, -0.09237480163574219, -0.08431625366210938, -0.07625770568847656, -0.06819915771484375, -0.06014060974121094, -0.052082061767578125, -0.04402351379394531, -0.0359649658203125, -0.027906417846679688, -0.019847869873046875, -0.011789321899414062, -0.00373077392578125, 0.0043277740478515625, 0.012386322021484375, 0.020444869995117188, 0.02850341796875, 0.03656196594238281, 0.044620513916015625, 0.05267906188964844, 0.06073760986328125, 0.06879615783691406, 0.07685470581054688, 0.08491325378417969, 0.0929718017578125, 0.10103034973144531, 0.10908889770507812, 0.11714744567871094, 0.12520599365234375, 0.13326454162597656, 0.14132308959960938, 0.1493816375732422, 0.157440185546875, 0.1654987335205078, 0.17355728149414062, 0.18161582946777344, 0.18967437744140625, 0.19773292541503906, 0.20579147338867188, 0.2138500213623047, 0.2219085693359375, 0.2299671173095703, 0.23802566528320312, 0.24608421325683594, 0.25414276123046875, 0.26220130920410156, 0.2702598571777344, 0.2783184051513672, 0.286376953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 9.0, 13.0, 18.0, 38.0, 44.0, 73.0, 125.0, 310.0, 130.0, 71.0, 50.0, 25.0, 28.0, 19.0, 14.0, 5.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1536865234375, -0.15006542205810547, -0.14644432067871094, -0.1428232192993164, -0.13920211791992188, -0.13558101654052734, -0.1319599151611328, -0.12833881378173828, -0.12471771240234375, -0.12109661102294922, -0.11747550964355469, -0.11385440826416016, -0.11023330688476562, -0.1066122055053711, -0.10299110412597656, -0.09937000274658203, -0.0957489013671875, -0.09212779998779297, -0.08850669860839844, -0.0848855972290039, -0.08126449584960938, -0.07764339447021484, -0.07402229309082031, -0.07040119171142578, -0.06678009033203125, -0.06315898895263672, -0.05953788757324219, -0.055916786193847656, -0.052295684814453125, -0.048674583435058594, -0.04505348205566406, -0.04143238067626953, -0.037811279296875, -0.03419017791748047, -0.030569076538085938, -0.026947975158691406, -0.023326873779296875, -0.019705772399902344, -0.016084671020507812, -0.012463569641113281, -0.00884246826171875, -0.005221366882324219, -0.0016002655029296875, 0.0020208358764648438, 0.005641937255859375, 0.009263038635253906, 0.012884140014648438, 0.01650524139404297, 0.0201263427734375, 0.02374744415283203, 0.027368545532226562, 0.030989646911621094, 0.034610748291015625, 0.038231849670410156, 0.04185295104980469, 0.04547405242919922, 0.04909515380859375, 0.05271625518798828, 0.05633735656738281, 0.059958457946777344, 0.06357955932617188, 0.0672006607055664, 0.07082176208496094, 0.07444286346435547, 0.07806396484375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 6.0, 12.0, 41.0, 66.0, 178.0, 274.0, 231.0, 99.0, 48.0, 20.0, 11.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9080429077148438, -1.8107364177703857, -1.7134299278259277, -1.6161233186721802, -1.5188168287277222, -1.4215103387832642, -1.3242037296295166, -1.2268972396850586, -1.1295907497406006, -1.0322842597961426, -0.9349777102470398, -0.837671160697937, -0.740364670753479, -0.643058180809021, -0.5457516312599182, -0.44844508171081543, -0.3511385917663574, -0.253832072019577, -0.15652555227279663, -0.059219032526016235, 0.03808748722076416, 0.13539400696754456, 0.23270052671432495, 0.33000707626342773, 0.42731356620788574, 0.5246200561523438, 0.6219266057014465, 0.7192331552505493, 0.8165396451950073, 0.9138461351394653, 1.011152744293213, 1.108459234237671, 1.205765724182129, 1.303072214126587, 1.400378704071045, 1.4976853132247925, 1.5949918031692505, 1.6922982931137085, 1.789604902267456, 1.886911392211914, 1.984217882156372, 2.08152437210083, 2.178830862045288, 2.276137351989746, 2.373444080352783, 2.470750570297241, 2.568057060241699, 2.6653635501861572, 2.7626700401306152, 2.8599765300750732, 2.9572830200195312, 3.0545895099639893, 3.1518959999084473, 3.2492027282714844, 3.3465092182159424, 3.4438157081604004, 3.5411221981048584, 3.6384286880493164, 3.7357351779937744, 3.8330416679382324, 3.9303483963012695, 4.027654647827148, 4.1249613761901855, 4.222268104553223, 4.319574356079102]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 3.0, 11.0, 13.0, 9.0, 17.0, 24.0, 26.0, 24.0, 27.0, 26.0, 31.0, 22.0, 27.0, 46.0, 41.0, 38.0, 49.0, 42.0, 53.0, 40.0, 42.0, 38.0, 38.0, 28.0, 30.0, 31.0, 33.0, 31.0, 25.0, 23.0, 11.0, 20.0, 13.0, 10.0, 6.0, 12.0, 5.0, 5.0, 8.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.432656168937683, -1.3903820514678955, -1.3481080532073975, -1.3058339357376099, -1.2635598182678223, -1.2212857007980347, -1.1790117025375366, -1.136737585067749, -1.0944634675979614, -1.0521893501281738, -1.0099153518676758, -0.9676412343978882, -0.9253671169281006, -0.8830930590629578, -0.8408190011978149, -0.7985448837280273, -0.7562708258628845, -0.7139967679977417, -0.6717226505279541, -0.6294485926628113, -0.5871744751930237, -0.5449004173278809, -0.5026262998580933, -0.46035224199295044, -0.41807815432548523, -0.37580406665802, -0.3335299789905548, -0.2912558913230896, -0.24898181855678558, -0.20670773088932037, -0.16443365812301636, -0.12215957045555115, -0.07988548278808594, -0.037611398845911026, 0.0046626850962638855, 0.0469367653131485, 0.08921085298061371, 0.13148494064807892, 0.17375901341438293, 0.21603310108184814, 0.25830718874931335, 0.30058127641677856, 0.3428553640842438, 0.385129451751709, 0.4274035096168518, 0.4696776270866394, 0.5119516849517822, 0.5542258024215698, 0.5964998602867126, 0.6387739181518555, 0.6810480356216431, 0.7233220934867859, 0.7655962109565735, 0.8078702688217163, 0.8501443862915039, 0.8924184441566467, 0.9346925020217896, 0.9769665598869324, 1.0192406177520752, 1.0615147352218628, 1.1037888526916504, 1.146062970161438, 1.188336968421936, 1.2306110858917236, 1.2728852033615112]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 12.0, 9.0, 17.0, 16.0, 20.0, 28.0, 24.0, 39.0, 28.0, 63.0, 96.0, 148.0, 255.0, 526.0, 1259.0, 3691.0, 17035.0, 258304.0, 3776173.0, 118716.0, 12451.0, 3065.0, 1128.0, 446.0, 233.0, 128.0, 73.0, 50.0, 46.0, 28.0, 18.0, 18.0, 23.0, 16.0, 16.0, 8.0, 13.0, 7.0, 9.0, 6.0, 5.0, 8.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.1279296875, -1.0882110595703125, -1.048492431640625, -1.0087738037109375, -0.96905517578125, -0.9293365478515625, -0.889617919921875, -0.8498992919921875, -0.8101806640625, -0.7704620361328125, -0.730743408203125, -0.6910247802734375, -0.65130615234375, -0.6115875244140625, -0.571868896484375, -0.5321502685546875, -0.492431640625, -0.4527130126953125, -0.412994384765625, -0.3732757568359375, -0.33355712890625, -0.2938385009765625, -0.254119873046875, -0.2144012451171875, -0.1746826171875, -0.1349639892578125, -0.095245361328125, -0.0555267333984375, -0.01580810546875, 0.0239105224609375, 0.063629150390625, 0.1033477783203125, 0.14306640625, 0.1827850341796875, 0.222503662109375, 0.2622222900390625, 0.30194091796875, 0.3416595458984375, 0.381378173828125, 0.4210968017578125, 0.4608154296875, 0.5005340576171875, 0.540252685546875, 0.5799713134765625, 0.61968994140625, 0.6594085693359375, 0.699127197265625, 0.7388458251953125, 0.778564453125, 0.8182830810546875, 0.858001708984375, 0.8977203369140625, 0.93743896484375, 0.9771575927734375, 1.016876220703125, 1.0565948486328125, 1.0963134765625, 1.1360321044921875, 1.175750732421875, 1.2154693603515625, 1.25518798828125, 1.2949066162109375, 1.334625244140625, 1.3743438720703125, 1.4140625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 6.0, 4.0, 3.0, 4.0, 6.0, 10.0, 11.0, 22.0, 27.0, 34.0, 45.0, 71.0, 62.0, 85.0, 76.0, 79.0, 81.0, 71.0, 65.0, 67.0, 38.0, 31.0, 31.0, 20.0, 17.0, 12.0, 4.0, 8.0, 5.0, 0.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65771484375, -0.6391677856445312, -0.6206207275390625, -0.6020736694335938, -0.583526611328125, -0.5649795532226562, -0.5464324951171875, -0.5278854370117188, -0.50933837890625, -0.49079132080078125, -0.4722442626953125, -0.45369720458984375, -0.435150146484375, -0.41660308837890625, -0.3980560302734375, -0.37950897216796875, -0.3609619140625, -0.34241485595703125, -0.3238677978515625, -0.30532073974609375, -0.286773681640625, -0.26822662353515625, -0.2496795654296875, -0.23113250732421875, -0.21258544921875, -0.19403839111328125, -0.1754913330078125, -0.15694427490234375, -0.138397216796875, -0.11985015869140625, -0.1013031005859375, -0.08275604248046875, -0.064208984375, -0.04566192626953125, -0.0271148681640625, -0.00856781005859375, 0.009979248046875, 0.02852630615234375, 0.0470733642578125, 0.06562042236328125, 0.08416748046875, 0.10271453857421875, 0.1212615966796875, 0.13980865478515625, 0.158355712890625, 0.17690277099609375, 0.1954498291015625, 0.21399688720703125, 0.2325439453125, 0.25109100341796875, 0.2696380615234375, 0.28818511962890625, 0.306732177734375, 0.32527923583984375, 0.3438262939453125, 0.36237335205078125, 0.38092041015625, 0.39946746826171875, 0.4180145263671875, 0.43656158447265625, 0.455108642578125, 0.47365570068359375, 0.4922027587890625, 0.5107498168945312, 0.529296875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 9.0, 10.0, 6.0, 7.0, 16.0, 20.0, 33.0, 44.0, 110.0, 160.0, 358.0, 787.0, 1937.0, 6799.0, 36900.0, 800895.0, 3259619.0, 71206.0, 10588.0, 2797.0, 1047.0, 431.0, 213.0, 95.0, 66.0, 43.0, 27.0, 17.0, 5.0, 7.0, 5.0, 3.0, 4.0, 8.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.99951171875, -0.9626998901367188, -0.9258880615234375, -0.8890762329101562, -0.852264404296875, -0.8154525756835938, -0.7786407470703125, -0.7418289184570312, -0.70501708984375, -0.6682052612304688, -0.6313934326171875, -0.5945816040039062, -0.557769775390625, -0.5209579467773438, -0.4841461181640625, -0.44733428955078125, -0.4105224609375, -0.37371063232421875, -0.3368988037109375, -0.30008697509765625, -0.263275146484375, -0.22646331787109375, -0.1896514892578125, -0.15283966064453125, -0.11602783203125, -0.07921600341796875, -0.0424041748046875, -0.00559234619140625, 0.031219482421875, 0.06803131103515625, 0.1048431396484375, 0.14165496826171875, 0.178466796875, 0.21527862548828125, 0.2520904541015625, 0.28890228271484375, 0.325714111328125, 0.36252593994140625, 0.3993377685546875, 0.43614959716796875, 0.47296142578125, 0.5097732543945312, 0.5465850830078125, 0.5833969116210938, 0.620208740234375, 0.6570205688476562, 0.6938323974609375, 0.7306442260742188, 0.7674560546875, 0.8042678833007812, 0.8410797119140625, 0.8778915405273438, 0.914703369140625, 0.9515151977539062, 0.9883270263671875, 1.0251388549804688, 1.06195068359375, 1.0987625122070312, 1.1355743408203125, 1.1723861694335938, 1.209197998046875, 1.2460098266601562, 1.2828216552734375, 1.3196334838867188, 1.3564453125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 15.0, 17.0, 26.0, 22.0, 41.0, 63.0, 82.0, 138.0, 219.0, 430.0, 681.0, 915.0, 541.0, 318.0, 192.0, 99.0, 68.0, 49.0, 27.0, 33.0, 26.0, 12.0, 9.0, 7.0, 4.0, 6.0, 4.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.260498046875, -0.25310516357421875, -0.2457122802734375, -0.23831939697265625, -0.230926513671875, -0.22353363037109375, -0.2161407470703125, -0.20874786376953125, -0.20135498046875, -0.19396209716796875, -0.1865692138671875, -0.17917633056640625, -0.171783447265625, -0.16439056396484375, -0.1569976806640625, -0.14960479736328125, -0.1422119140625, -0.13481903076171875, -0.1274261474609375, -0.12003326416015625, -0.112640380859375, -0.10524749755859375, -0.0978546142578125, -0.09046173095703125, -0.08306884765625, -0.07567596435546875, -0.0682830810546875, -0.06089019775390625, -0.053497314453125, -0.04610443115234375, -0.0387115478515625, -0.03131866455078125, -0.02392578125, -0.01653289794921875, -0.0091400146484375, -0.00174713134765625, 0.005645751953125, 0.01303863525390625, 0.0204315185546875, 0.02782440185546875, 0.03521728515625, 0.04261016845703125, 0.0500030517578125, 0.05739593505859375, 0.064788818359375, 0.07218170166015625, 0.0795745849609375, 0.08696746826171875, 0.0943603515625, 0.10175323486328125, 0.1091461181640625, 0.11653900146484375, 0.123931884765625, 0.13132476806640625, 0.1387176513671875, 0.14611053466796875, 0.15350341796875, 0.16089630126953125, 0.1682891845703125, 0.17568206787109375, 0.183074951171875, 0.19046783447265625, 0.1978607177734375, 0.20525360107421875, 0.212646484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 9.0, 12.0, 18.0, 44.0, 59.0, 84.0, 115.0, 133.0, 130.0, 147.0, 86.0, 58.0, 38.0, 23.0, 14.0, 11.0, 5.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3423888683319092, -1.3028398752212524, -1.2632908821105957, -1.223741888999939, -1.1841928958892822, -1.144644021987915, -1.1050950288772583, -1.0655460357666016, -1.0259970426559448, -0.9864480495452881, -0.9468990564346313, -0.9073501229286194, -0.8678011298179626, -0.8282521367073059, -0.788703203201294, -0.7491542100906372, -0.7096052169799805, -0.6700562238693237, -0.630507230758667, -0.590958297252655, -0.5514093041419983, -0.5118603110313416, -0.4723113477230072, -0.43276238441467285, -0.3932133913040161, -0.3536643981933594, -0.314115434885025, -0.2745664715766907, -0.23501747846603394, -0.1954685002565384, -0.15591952204704285, -0.1163705587387085, -0.07682168483734131, -0.037272706627845764, 0.0022762715816497803, 0.041825249791145325, 0.08137422800064087, 0.12092320621013641, 0.16047218441963196, 0.2000211477279663, 0.23957014083862305, 0.2791191339492798, 0.31866809725761414, 0.3582170605659485, 0.3977660536766052, 0.43731504678726196, 0.4768640100955963, 0.5164129734039307, 0.5559619665145874, 0.5955109596252441, 0.6350599527359009, 0.6746088862419128, 0.7141578793525696, 0.7537068724632263, 0.7932558059692383, 0.832804799079895, 0.8723537921905518, 0.9119027853012085, 0.9514517784118652, 0.9910007119178772, 1.0305497646331787, 1.070098638534546, 1.1096476316452026, 1.1491966247558594, 1.1887456178665161]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 9.0, 9.0, 17.0, 15.0, 19.0, 23.0, 25.0, 29.0, 39.0, 47.0, 53.0, 44.0, 48.0, 50.0, 55.0, 49.0, 59.0, 52.0, 49.0, 42.0, 41.0, 35.0, 29.0, 36.0, 30.0, 20.0, 8.0, 17.0, 6.0, 5.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0], "bins": [-0.699561357498169, -0.6815537810325623, -0.6635462045669556, -0.6455386281013489, -0.6275310516357422, -0.6095234751701355, -0.5915158987045288, -0.5735083222389221, -0.5555007457733154, -0.5374931693077087, -0.519485592842102, -0.5014780163764954, -0.48347043991088867, -0.465462863445282, -0.4474552869796753, -0.4294477105140686, -0.4114401340484619, -0.3934325575828552, -0.37542498111724854, -0.35741740465164185, -0.33940982818603516, -0.32140225172042847, -0.3033946752548218, -0.2853870987892151, -0.2673795223236084, -0.2493719458580017, -0.23136436939239502, -0.21335679292678833, -0.19534921646118164, -0.17734163999557495, -0.15933406352996826, -0.14132648706436157, -0.12331891059875488, -0.1053113341331482, -0.0873037576675415, -0.06929618120193481, -0.051288604736328125, -0.033281028270721436, -0.015273451805114746, 0.0027341246604919434, 0.020741701126098633, 0.03874927759170532, 0.05675685405731201, 0.0747644305229187, 0.09277200698852539, 0.11077958345413208, 0.12878715991973877, 0.14679473638534546, 0.16480231285095215, 0.18280988931655884, 0.20081746578216553, 0.21882504224777222, 0.2368326187133789, 0.2548401951789856, 0.2728477716445923, 0.290855348110199, 0.30886292457580566, 0.32687050104141235, 0.34487807750701904, 0.36288565397262573, 0.3808932304382324, 0.3989008069038391, 0.4169083833694458, 0.4349159598350525, 0.4529235363006592]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 10.0, 3.0, 13.0, 30.0, 33.0, 56.0, 91.0, 138.0, 285.0, 539.0, 1072.0, 2534.0, 6547.0, 21749.0, 145047.0, 731776.0, 109819.0, 18615.0, 5676.0, 2320.0, 1028.0, 541.0, 277.0, 151.0, 74.0, 50.0, 29.0, 19.0, 16.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324462890625, -0.31555938720703125, -0.3066558837890625, -0.29775238037109375, -0.288848876953125, -0.27994537353515625, -0.2710418701171875, -0.26213836669921875, -0.25323486328125, -0.24433135986328125, -0.2354278564453125, -0.22652435302734375, -0.217620849609375, -0.20871734619140625, -0.1998138427734375, -0.19091033935546875, -0.1820068359375, -0.17310333251953125, -0.1641998291015625, -0.15529632568359375, -0.146392822265625, -0.13748931884765625, -0.1285858154296875, -0.11968231201171875, -0.11077880859375, -0.10187530517578125, -0.0929718017578125, -0.08406829833984375, -0.075164794921875, -0.06626129150390625, -0.0573577880859375, -0.04845428466796875, -0.03955078125, -0.03064727783203125, -0.0217437744140625, -0.01284027099609375, -0.003936767578125, 0.00496673583984375, 0.0138702392578125, 0.02277374267578125, 0.03167724609375, 0.04058074951171875, 0.0494842529296875, 0.05838775634765625, 0.067291259765625, 0.07619476318359375, 0.0850982666015625, 0.09400177001953125, 0.1029052734375, 0.11180877685546875, 0.1207122802734375, 0.12961578369140625, 0.138519287109375, 0.14742279052734375, 0.1563262939453125, 0.16522979736328125, 0.17413330078125, 0.18303680419921875, 0.1919403076171875, 0.20084381103515625, 0.209747314453125, 0.21865081787109375, 0.2275543212890625, 0.23645782470703125, 0.245361328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 6.0, 8.0, 13.0, 14.0, 23.0, 19.0, 25.0, 40.0, 65.0, 65.0, 85.0, 85.0, 87.0, 96.0, 80.0, 64.0, 63.0, 55.0, 31.0, 26.0, 15.0, 12.0, 8.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5655593872070312, -0.5442047119140625, -0.5228500366210938, -0.501495361328125, -0.48014068603515625, -0.4587860107421875, -0.43743133544921875, -0.41607666015625, -0.39472198486328125, -0.3733673095703125, -0.35201263427734375, -0.330657958984375, -0.30930328369140625, -0.2879486083984375, -0.26659393310546875, -0.2452392578125, -0.22388458251953125, -0.2025299072265625, -0.18117523193359375, -0.159820556640625, -0.13846588134765625, -0.1171112060546875, -0.09575653076171875, -0.07440185546875, -0.05304718017578125, -0.0316925048828125, -0.01033782958984375, 0.011016845703125, 0.03237152099609375, 0.0537261962890625, 0.07508087158203125, 0.096435546875, 0.11779022216796875, 0.1391448974609375, 0.16049957275390625, 0.181854248046875, 0.20320892333984375, 0.2245635986328125, 0.24591827392578125, 0.26727294921875, 0.28862762451171875, 0.3099822998046875, 0.33133697509765625, 0.352691650390625, 0.37404632568359375, 0.3954010009765625, 0.41675567626953125, 0.4381103515625, 0.45946502685546875, 0.4808197021484375, 0.5021743774414062, 0.523529052734375, 0.5448837280273438, 0.5662384033203125, 0.5875930786132812, 0.60894775390625, 0.6303024291992188, 0.6516571044921875, 0.6730117797851562, 0.694366455078125, 0.7157211303710938, 0.7370758056640625, 0.7584304809570312, 0.77978515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 11.0, 10.0, 11.0, 10.0, 23.0, 30.0, 41.0, 54.0, 75.0, 124.0, 217.0, 363.0, 699.0, 1319.0, 2925.0, 7724.0, 27698.0, 183299.0, 674710.0, 117790.0, 20165.0, 6220.0, 2493.0, 1092.0, 563.0, 312.0, 204.0, 123.0, 74.0, 51.0, 33.0, 19.0, 10.0, 15.0, 16.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.20166015625, -0.1957988739013672, -0.18993759155273438, -0.18407630920410156, -0.17821502685546875, -0.17235374450683594, -0.16649246215820312, -0.1606311798095703, -0.1547698974609375, -0.1489086151123047, -0.14304733276367188, -0.13718605041503906, -0.13132476806640625, -0.12546348571777344, -0.11960220336914062, -0.11374092102050781, -0.107879638671875, -0.10201835632324219, -0.09615707397460938, -0.09029579162597656, -0.08443450927734375, -0.07857322692871094, -0.07271194458007812, -0.06685066223144531, -0.0609893798828125, -0.05512809753417969, -0.049266815185546875, -0.04340553283691406, -0.03754425048828125, -0.03168296813964844, -0.025821685791015625, -0.019960403442382812, -0.01409912109375, -0.008237838745117188, -0.002376556396484375, 0.0034847259521484375, 0.00934600830078125, 0.015207290649414062, 0.021068572998046875, 0.026929855346679688, 0.0327911376953125, 0.03865242004394531, 0.044513702392578125, 0.05037498474121094, 0.05623626708984375, 0.06209754943847656, 0.06795883178710938, 0.07382011413574219, 0.079681396484375, 0.08554267883300781, 0.09140396118164062, 0.09726524353027344, 0.10312652587890625, 0.10898780822753906, 0.11484909057617188, 0.12071037292480469, 0.1265716552734375, 0.1324329376220703, 0.13829421997070312, 0.14415550231933594, 0.15001678466796875, 0.15587806701660156, 0.16173934936523438, 0.1676006317138672, 0.1734619140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 7.0, 10.0, 5.0, 6.0, 18.0, 6.0, 16.0, 23.0, 22.0, 32.0, 37.0, 38.0, 38.0, 37.0, 38.0, 35.0, 37.0, 39.0, 58.0, 42.0, 54.0, 38.0, 46.0, 38.0, 37.0, 28.0, 21.0, 24.0, 22.0, 19.0, 19.0, 24.0, 12.0, 13.0, 11.0, 9.0, 11.0, 8.0, 4.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0], "bins": [-0.8173828125, -0.7937469482421875, -0.770111083984375, -0.7464752197265625, -0.72283935546875, -0.6992034912109375, -0.675567626953125, -0.6519317626953125, -0.6282958984375, -0.6046600341796875, -0.581024169921875, -0.5573883056640625, -0.53375244140625, -0.5101165771484375, -0.486480712890625, -0.4628448486328125, -0.439208984375, -0.4155731201171875, -0.391937255859375, -0.3683013916015625, -0.34466552734375, -0.3210296630859375, -0.297393798828125, -0.2737579345703125, -0.2501220703125, -0.2264862060546875, -0.202850341796875, -0.1792144775390625, -0.15557861328125, -0.1319427490234375, -0.108306884765625, -0.0846710205078125, -0.06103515625, -0.0373992919921875, -0.013763427734375, 0.0098724365234375, 0.03350830078125, 0.0571441650390625, 0.080780029296875, 0.1044158935546875, 0.1280517578125, 0.1516876220703125, 0.175323486328125, 0.1989593505859375, 0.22259521484375, 0.2462310791015625, 0.269866943359375, 0.2935028076171875, 0.317138671875, 0.3407745361328125, 0.364410400390625, 0.3880462646484375, 0.41168212890625, 0.4353179931640625, 0.458953857421875, 0.4825897216796875, 0.5062255859375, 0.5298614501953125, 0.553497314453125, 0.5771331787109375, 0.60076904296875, 0.6244049072265625, 0.648040771484375, 0.6716766357421875, 0.6953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 6.0, 4.0, 1.0, 7.0, 10.0, 12.0, 16.0, 30.0, 51.0, 71.0, 137.0, 207.0, 314.0, 605.0, 1021.0, 2104.0, 4828.0, 13218.0, 52068.0, 452573.0, 447059.0, 51740.0, 13221.0, 4611.0, 2141.0, 1044.0, 604.0, 318.0, 191.0, 125.0, 58.0, 46.0, 23.0, 29.0, 18.0, 12.0, 11.0, 5.0, 3.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.09124755859375, -0.08884620666503906, -0.08644485473632812, -0.08404350280761719, -0.08164215087890625, -0.07924079895019531, -0.07683944702148438, -0.07443809509277344, -0.0720367431640625, -0.06963539123535156, -0.06723403930664062, -0.06483268737792969, -0.06243133544921875, -0.06002998352050781, -0.057628631591796875, -0.05522727966308594, -0.052825927734375, -0.05042457580566406, -0.048023223876953125, -0.04562187194824219, -0.04322052001953125, -0.04081916809082031, -0.038417816162109375, -0.03601646423339844, -0.0336151123046875, -0.031213760375976562, -0.028812408447265625, -0.026411056518554688, -0.02400970458984375, -0.021608352661132812, -0.019207000732421875, -0.016805648803710938, -0.014404296875, -0.012002944946289062, -0.009601593017578125, -0.0072002410888671875, -0.00479888916015625, -0.0023975372314453125, 3.814697265625e-06, 0.0024051666259765625, 0.0048065185546875, 0.0072078704833984375, 0.009609222412109375, 0.012010574340820312, 0.01441192626953125, 0.016813278198242188, 0.019214630126953125, 0.021615982055664062, 0.024017333984375, 0.026418685913085938, 0.028820037841796875, 0.031221389770507812, 0.03362274169921875, 0.03602409362792969, 0.038425445556640625, 0.04082679748535156, 0.0432281494140625, 0.04562950134277344, 0.048030853271484375, 0.05043220520019531, 0.05283355712890625, 0.05523490905761719, 0.057636260986328125, 0.06003761291503906, 0.06243896484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 12.0, 6.0, 6.0, 10.0, 26.0, 25.0, 33.0, 56.0, 73.0, 87.0, 120.0, 118.0, 111.0, 76.0, 57.0, 43.0, 28.0, 19.0, 19.0, 6.0, 14.0, 10.0, 6.0, 5.0, 9.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.0219554901123047e-05, -2.925284206867218e-05, -2.8286129236221313e-05, -2.7319416403770447e-05, -2.635270357131958e-05, -2.5385990738868713e-05, -2.4419277906417847e-05, -2.345256507396698e-05, -2.2485852241516113e-05, -2.1519139409065247e-05, -2.055242657661438e-05, -1.9585713744163513e-05, -1.8619000911712646e-05, -1.765228807926178e-05, -1.6685575246810913e-05, -1.5718862414360046e-05, -1.475214958190918e-05, -1.3785436749458313e-05, -1.2818723917007446e-05, -1.185201108455658e-05, -1.0885298252105713e-05, -9.918585419654846e-06, -8.95187258720398e-06, -7.985159754753113e-06, -7.018446922302246e-06, -6.051734089851379e-06, -5.085021257400513e-06, -4.118308424949646e-06, -3.1515955924987793e-06, -2.1848827600479126e-06, -1.218169927597046e-06, -2.514570951461792e-07, 7.152557373046875e-07, 1.6819685697555542e-06, 2.648681402206421e-06, 3.6153942346572876e-06, 4.582107067108154e-06, 5.548819899559021e-06, 6.515532732009888e-06, 7.482245564460754e-06, 8.448958396911621e-06, 9.415671229362488e-06, 1.0382384061813354e-05, 1.1349096894264221e-05, 1.2315809726715088e-05, 1.3282522559165955e-05, 1.4249235391616821e-05, 1.5215948224067688e-05, 1.6182661056518555e-05, 1.714937388896942e-05, 1.8116086721420288e-05, 1.9082799553871155e-05, 2.004951238632202e-05, 2.1016225218772888e-05, 2.1982938051223755e-05, 2.294965088367462e-05, 2.3916363716125488e-05, 2.4883076548576355e-05, 2.584978938102722e-05, 2.681650221347809e-05, 2.7783215045928955e-05, 2.8749927878379822e-05, 2.971664071083069e-05, 3.0683353543281555e-05, 3.165006637573242e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 12.0, 17.0, 22.0, 45.0, 67.0, 114.0, 188.0, 355.0, 620.0, 1326.0, 2692.0, 6732.0, 20408.0, 84564.0, 552210.0, 304032.0, 51647.0, 14273.0, 4979.0, 2048.0, 971.0, 513.0, 250.0, 174.0, 96.0, 71.0, 32.0, 25.0, 14.0, 11.0, 12.0, 10.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0802001953125, -0.0776815414428711, -0.07516288757324219, -0.07264423370361328, -0.07012557983398438, -0.06760692596435547, -0.06508827209472656, -0.06256961822509766, -0.06005096435546875, -0.057532310485839844, -0.05501365661621094, -0.05249500274658203, -0.049976348876953125, -0.04745769500732422, -0.04493904113769531, -0.042420387268066406, -0.0399017333984375, -0.037383079528808594, -0.03486442565917969, -0.03234577178955078, -0.029827117919921875, -0.02730846405029297, -0.024789810180664062, -0.022271156311035156, -0.01975250244140625, -0.017233848571777344, -0.014715194702148438, -0.012196540832519531, -0.009677886962890625, -0.007159233093261719, -0.0046405792236328125, -0.0021219253540039062, 0.000396728515625, 0.0029153823852539062, 0.0054340362548828125, 0.007952690124511719, 0.010471343994140625, 0.012989997863769531, 0.015508651733398438, 0.018027305603027344, 0.02054595947265625, 0.023064613342285156, 0.025583267211914062, 0.02810192108154297, 0.030620574951171875, 0.03313922882080078, 0.03565788269042969, 0.038176536560058594, 0.0406951904296875, 0.043213844299316406, 0.04573249816894531, 0.04825115203857422, 0.050769805908203125, 0.05328845977783203, 0.05580711364746094, 0.058325767517089844, 0.06084442138671875, 0.06336307525634766, 0.06588172912597656, 0.06840038299560547, 0.07091903686523438, 0.07343769073486328, 0.07595634460449219, 0.0784749984741211, 0.08099365234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 10.0, 10.0, 8.0, 10.0, 13.0, 15.0, 20.0, 25.0, 29.0, 44.0, 57.0, 77.0, 107.0, 184.0, 113.0, 69.0, 38.0, 40.0, 30.0, 27.0, 19.0, 15.0, 12.0, 8.0, 5.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021881103515625, -0.021160125732421875, -0.02043914794921875, -0.019718170166015625, -0.0189971923828125, -0.018276214599609375, -0.01755523681640625, -0.016834259033203125, -0.01611328125, -0.015392303466796875, -0.01467132568359375, -0.013950347900390625, -0.0132293701171875, -0.012508392333984375, -0.01178741455078125, -0.011066436767578125, -0.010345458984375, -0.009624481201171875, -0.00890350341796875, -0.008182525634765625, -0.0074615478515625, -0.006740570068359375, -0.00601959228515625, -0.005298614501953125, -0.00457763671875, -0.003856658935546875, -0.00313568115234375, -0.002414703369140625, -0.0016937255859375, -0.000972747802734375, -0.00025177001953125, 0.000469207763671875, 0.001190185546875, 0.001911163330078125, 0.00263214111328125, 0.003353118896484375, 0.0040740966796875, 0.004795074462890625, 0.00551605224609375, 0.006237030029296875, 0.0069580078125, 0.007678985595703125, 0.00839996337890625, 0.009120941162109375, 0.0098419189453125, 0.010562896728515625, 0.01128387451171875, 0.012004852294921875, 0.012725830078125, 0.013446807861328125, 0.01416778564453125, 0.014888763427734375, 0.0156097412109375, 0.016330718994140625, 0.01705169677734375, 0.017772674560546875, 0.01849365234375, 0.019214630126953125, 0.01993560791015625, 0.020656585693359375, 0.0213775634765625, 0.022098541259765625, 0.02281951904296875, 0.023540496826171875, 0.024261474609375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 11.0, 43.0, 80.0, 132.0, 198.0, 225.0, 137.0, 85.0, 41.0, 19.0, 12.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5845848321914673, -1.5428975820541382, -1.5012104511260986, -1.4595232009887695, -1.4178359508514404, -1.3761487007141113, -1.3344614505767822, -1.2927743196487427, -1.2510870695114136, -1.2093998193740845, -1.167712688446045, -1.1260254383087158, -1.0843381881713867, -1.0426509380340576, -1.0009636878967285, -0.959276556968689, -0.9175893068313599, -0.8759020566940308, -0.8342148661613464, -0.7925276756286621, -0.750840425491333, -0.7091531753540039, -0.6674659848213196, -0.6257787942886353, -0.5840915441513062, -0.542404294013977, -0.5007171034812927, -0.459029883146286, -0.4173426628112793, -0.3756554424762726, -0.33396822214126587, -0.29228100180625916, -0.2505936622619629, -0.20890644192695618, -0.16721922159194946, -0.12553200125694275, -0.08384478092193604, -0.04215756058692932, -0.0004703402519226074, 0.041216880083084106, 0.08290410041809082, 0.12459132075309753, 0.16627854108810425, 0.20796576142311096, 0.24965298175811768, 0.2913402020931244, 0.3330274224281311, 0.3747146427631378, 0.41640186309814453, 0.45808908343315125, 0.49977630376815796, 0.5414634943008423, 0.5831507444381714, 0.6248379945755005, 0.6665251851081848, 0.7082123756408691, 0.7498996257781982, 0.7915868759155273, 0.8332740664482117, 0.874961256980896, 0.9166485071182251, 0.9583357572555542, 1.0000228881835938, 1.0417101383209229, 1.083397388458252]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 6.0, 10.0, 14.0, 31.0, 22.0, 36.0, 48.0, 75.0, 85.0, 85.0, 68.0, 89.0, 86.0, 80.0, 59.0, 53.0, 51.0, 35.0, 21.0, 15.0, 6.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48361650109291077, -0.46334394812583923, -0.4430713951587677, -0.42279884219169617, -0.40252628922462463, -0.3822537362575531, -0.36198121309280396, -0.3417086601257324, -0.3214361071586609, -0.30116355419158936, -0.2808910012245178, -0.2606184482574463, -0.24034589529037476, -0.22007334232330322, -0.19980080425739288, -0.17952825129032135, -0.15925568342208862, -0.1389831304550171, -0.11871057748794556, -0.09843803197145462, -0.07816547900438309, -0.057892926037311554, -0.03762038052082062, -0.017347827553749084, 0.0029247254133224487, 0.023197276517748833, 0.04346982762217522, 0.06374237686395645, 0.08401492983102798, 0.10428748279809952, 0.12456002831459045, 0.144832581281662, 0.16510510444641113, 0.18537765741348267, 0.2056502103805542, 0.22592276334762573, 0.24619531631469727, 0.2664678692817688, 0.28674042224884033, 0.30701297521591187, 0.3272855281829834, 0.34755808115005493, 0.36783063411712646, 0.388103187084198, 0.40837574005126953, 0.42864829301834106, 0.4489208459854126, 0.46919339895248413, 0.4894659221172333, 0.5097384452819824, 0.530010998249054, 0.5502835512161255, 0.570556104183197, 0.5908286571502686, 0.6111012101173401, 0.6313737630844116, 0.6516463160514832, 0.6719188690185547, 0.6921914219856262, 0.7124639749526978, 0.7327365279197693, 0.7530090808868408, 0.7732816338539124, 0.7935541868209839, 0.8138267397880554]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 13.0, 13.0, 26.0, 35.0, 48.0, 113.0, 157.0, 203.0, 374.0, 678.0, 1351.0, 2752.0, 6377.0, 16769.0, 59002.0, 308447.0, 519136.0, 93464.0, 23871.0, 8508.0, 3586.0, 1652.0, 846.0, 429.0, 244.0, 172.0, 99.0, 47.0, 49.0, 33.0, 13.0, 11.0, 10.0, 5.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.417724609375, -0.4043159484863281, -0.39090728759765625, -0.3774986267089844, -0.3640899658203125, -0.3506813049316406, -0.33727264404296875, -0.3238639831542969, -0.310455322265625, -0.2970466613769531, -0.28363800048828125, -0.2702293395996094, -0.2568206787109375, -0.24341201782226562, -0.23000335693359375, -0.21659469604492188, -0.20318603515625, -0.18977737426757812, -0.17636871337890625, -0.16296005249023438, -0.1495513916015625, -0.13614273071289062, -0.12273406982421875, -0.10932540893554688, -0.095916748046875, -0.08250808715820312, -0.06909942626953125, -0.055690765380859375, -0.0422821044921875, -0.028873443603515625, -0.01546478271484375, -0.002056121826171875, 0.0113525390625, 0.024761199951171875, 0.03816986083984375, 0.051578521728515625, 0.0649871826171875, 0.07839584350585938, 0.09180450439453125, 0.10521316528320312, 0.118621826171875, 0.13203048706054688, 0.14543914794921875, 0.15884780883789062, 0.1722564697265625, 0.18566513061523438, 0.19907379150390625, 0.21248245239257812, 0.22589111328125, 0.23929977416992188, 0.25270843505859375, 0.2661170959472656, 0.2795257568359375, 0.2929344177246094, 0.30634307861328125, 0.3197517395019531, 0.333160400390625, 0.3465690612792969, 0.35997772216796875, 0.3733863830566406, 0.3867950439453125, 0.4002037048339844, 0.41361236572265625, 0.4270210266113281, 0.4404296875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 6.0, 10.0, 9.0, 14.0, 16.0, 28.0, 30.0, 33.0, 51.0, 71.0, 62.0, 65.0, 72.0, 72.0, 75.0, 75.0, 62.0, 51.0, 39.0, 36.0, 34.0, 29.0, 18.0, 15.0, 7.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9755859375, -0.94219970703125, -0.9088134765625, -0.87542724609375, -0.842041015625, -0.80865478515625, -0.7752685546875, -0.74188232421875, -0.70849609375, -0.67510986328125, -0.6417236328125, -0.60833740234375, -0.574951171875, -0.54156494140625, -0.5081787109375, -0.47479248046875, -0.44140625, -0.40802001953125, -0.3746337890625, -0.34124755859375, -0.307861328125, -0.27447509765625, -0.2410888671875, -0.20770263671875, -0.17431640625, -0.14093017578125, -0.1075439453125, -0.07415771484375, -0.040771484375, -0.00738525390625, 0.0260009765625, 0.05938720703125, 0.0927734375, 0.12615966796875, 0.1595458984375, 0.19293212890625, 0.226318359375, 0.25970458984375, 0.2930908203125, 0.32647705078125, 0.35986328125, 0.39324951171875, 0.4266357421875, 0.46002197265625, 0.493408203125, 0.52679443359375, 0.5601806640625, 0.59356689453125, 0.626953125, 0.66033935546875, 0.6937255859375, 0.72711181640625, 0.760498046875, 0.79388427734375, 0.8272705078125, 0.86065673828125, 0.89404296875, 0.92742919921875, 0.9608154296875, 0.99420166015625, 1.027587890625, 1.06097412109375, 1.0943603515625, 1.12774658203125, 1.1611328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 6.0, 6.0, 7.0, 9.0, 18.0, 17.0, 14.0, 31.0, 35.0, 49.0, 51.0, 86.0, 132.0, 211.0, 668.0, 4867.0, 443277.0, 592278.0, 5349.0, 713.0, 241.0, 151.0, 90.0, 58.0, 35.0, 29.0, 27.0, 18.0, 19.0, 14.0, 15.0, 9.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.958984375, -1.90606689453125, -1.8531494140625, -1.80023193359375, -1.747314453125, -1.69439697265625, -1.6414794921875, -1.58856201171875, -1.53564453125, -1.48272705078125, -1.4298095703125, -1.37689208984375, -1.323974609375, -1.27105712890625, -1.2181396484375, -1.16522216796875, -1.1123046875, -1.05938720703125, -1.0064697265625, -0.95355224609375, -0.900634765625, -0.84771728515625, -0.7947998046875, -0.74188232421875, -0.68896484375, -0.63604736328125, -0.5831298828125, -0.53021240234375, -0.477294921875, -0.42437744140625, -0.3714599609375, -0.31854248046875, -0.265625, -0.21270751953125, -0.1597900390625, -0.10687255859375, -0.053955078125, -0.00103759765625, 0.0518798828125, 0.10479736328125, 0.15771484375, 0.21063232421875, 0.2635498046875, 0.31646728515625, 0.369384765625, 0.42230224609375, 0.4752197265625, 0.52813720703125, 0.5810546875, 0.63397216796875, 0.6868896484375, 0.73980712890625, 0.792724609375, 0.84564208984375, 0.8985595703125, 0.95147705078125, 1.00439453125, 1.05731201171875, 1.1102294921875, 1.16314697265625, 1.216064453125, 1.26898193359375, 1.3218994140625, 1.37481689453125, 1.427734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 5.0, 9.0, 12.0, 15.0, 11.0, 15.0, 21.0, 18.0, 33.0, 36.0, 37.0, 43.0, 57.0, 45.0, 55.0, 46.0, 68.0, 41.0, 56.0, 54.0, 50.0, 39.0, 39.0, 20.0, 37.0, 26.0, 17.0, 15.0, 19.0, 12.0, 12.0, 10.0, 5.0, 6.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0234375, -0.9918289184570312, -0.9602203369140625, -0.9286117553710938, -0.897003173828125, -0.8653945922851562, -0.8337860107421875, -0.8021774291992188, -0.77056884765625, -0.7389602661132812, -0.7073516845703125, -0.6757431030273438, -0.644134521484375, -0.6125259399414062, -0.5809173583984375, -0.5493087768554688, -0.5177001953125, -0.48609161376953125, -0.4544830322265625, -0.42287445068359375, -0.391265869140625, -0.35965728759765625, -0.3280487060546875, -0.29644012451171875, -0.26483154296875, -0.23322296142578125, -0.2016143798828125, -0.17000579833984375, -0.138397216796875, -0.10678863525390625, -0.0751800537109375, -0.04357147216796875, -0.011962890625, 0.01964569091796875, 0.0512542724609375, 0.08286285400390625, 0.114471435546875, 0.14608001708984375, 0.1776885986328125, 0.20929718017578125, 0.24090576171875, 0.27251434326171875, 0.3041229248046875, 0.33573150634765625, 0.367340087890625, 0.39894866943359375, 0.4305572509765625, 0.46216583251953125, 0.4937744140625, 0.5253829956054688, 0.5569915771484375, 0.5886001586914062, 0.620208740234375, 0.6518173217773438, 0.6834259033203125, 0.7150344848632812, 0.74664306640625, 0.7782516479492188, 0.8098602294921875, 0.8414688110351562, 0.873077392578125, 0.9046859741210938, 0.9362945556640625, 0.9679031372070312, 0.99951171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 14.0, 24.0, 42.0, 68.0, 153.0, 392.0, 1190.0, 10626.0, 667221.0, 359542.0, 7528.0, 1068.0, 371.0, 136.0, 71.0, 34.0, 19.0, 13.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.34539794921875, -0.3338623046875, -0.32232666015625, -0.310791015625, -0.29925537109375, -0.2877197265625, -0.27618408203125, -0.2646484375, -0.25311279296875, -0.2415771484375, -0.23004150390625, -0.218505859375, -0.20697021484375, -0.1954345703125, -0.18389892578125, -0.17236328125, -0.16082763671875, -0.1492919921875, -0.13775634765625, -0.126220703125, -0.11468505859375, -0.1031494140625, -0.09161376953125, -0.080078125, -0.06854248046875, -0.0570068359375, -0.04547119140625, -0.033935546875, -0.02239990234375, -0.0108642578125, 0.00067138671875, 0.01220703125, 0.02374267578125, 0.0352783203125, 0.04681396484375, 0.058349609375, 0.06988525390625, 0.0814208984375, 0.09295654296875, 0.1044921875, 0.11602783203125, 0.1275634765625, 0.13909912109375, 0.150634765625, 0.16217041015625, 0.1737060546875, 0.18524169921875, 0.19677734375, 0.20831298828125, 0.2198486328125, 0.23138427734375, 0.242919921875, 0.25445556640625, 0.2659912109375, 0.27752685546875, 0.2890625, 0.30059814453125, 0.3121337890625, 0.32366943359375, 0.335205078125, 0.34674072265625, 0.3582763671875, 0.36981201171875, 0.38134765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 4.0, 7.0, 11.0, 14.0, 14.0, 28.0, 34.0, 48.0, 78.0, 133.0, 178.0, 131.0, 80.0, 79.0, 48.0, 29.0, 21.0, 11.0, 15.0, 8.0, 9.0, 5.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5212764739990234e-05, -2.436712384223938e-05, -2.3521482944488525e-05, -2.267584204673767e-05, -2.1830201148986816e-05, -2.0984560251235962e-05, -2.0138919353485107e-05, -1.9293278455734253e-05, -1.84476375579834e-05, -1.7601996660232544e-05, -1.675635576248169e-05, -1.5910714864730835e-05, -1.506507396697998e-05, -1.4219433069229126e-05, -1.3373792171478271e-05, -1.2528151273727417e-05, -1.1682510375976562e-05, -1.0836869478225708e-05, -9.991228580474854e-06, -9.145587682723999e-06, -8.299946784973145e-06, -7.45430588722229e-06, -6.6086649894714355e-06, -5.763024091720581e-06, -4.9173831939697266e-06, -4.071742296218872e-06, -3.2261013984680176e-06, -2.380460500717163e-06, -1.5348196029663086e-06, -6.891787052154541e-07, 1.564621925354004e-07, 1.0021030902862549e-06, 1.8477439880371094e-06, 2.693384885787964e-06, 3.5390257835388184e-06, 4.384666681289673e-06, 5.230307579040527e-06, 6.075948476791382e-06, 6.921589374542236e-06, 7.76723027229309e-06, 8.612871170043945e-06, 9.4585120677948e-06, 1.0304152965545654e-05, 1.1149793863296509e-05, 1.1995434761047363e-05, 1.2841075658798218e-05, 1.3686716556549072e-05, 1.4532357454299927e-05, 1.537799835205078e-05, 1.6223639249801636e-05, 1.706928014755249e-05, 1.7914921045303345e-05, 1.87605619430542e-05, 1.9606202840805054e-05, 2.0451843738555908e-05, 2.1297484636306763e-05, 2.2143125534057617e-05, 2.298876643180847e-05, 2.3834407329559326e-05, 2.468004822731018e-05, 2.5525689125061035e-05, 2.637133002281189e-05, 2.7216970920562744e-05, 2.80626118183136e-05, 2.8908252716064453e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 13.0, 12.0, 12.0, 22.0, 32.0, 63.0, 135.0, 269.0, 705.0, 2527.0, 14421.0, 193059.0, 781517.0, 47716.0, 5790.0, 1325.0, 505.0, 223.0, 81.0, 46.0, 21.0, 21.0, 11.0, 8.0, 1.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.32080078125, -0.31241607666015625, -0.3040313720703125, -0.29564666748046875, -0.287261962890625, -0.27887725830078125, -0.2704925537109375, -0.26210784912109375, -0.25372314453125, -0.24533843994140625, -0.2369537353515625, -0.22856903076171875, -0.220184326171875, -0.21179962158203125, -0.2034149169921875, -0.19503021240234375, -0.1866455078125, -0.17826080322265625, -0.1698760986328125, -0.16149139404296875, -0.153106689453125, -0.14472198486328125, -0.1363372802734375, -0.12795257568359375, -0.11956787109375, -0.11118316650390625, -0.1027984619140625, -0.09441375732421875, -0.086029052734375, -0.07764434814453125, -0.0692596435546875, -0.06087493896484375, -0.052490234375, -0.04410552978515625, -0.0357208251953125, -0.02733612060546875, -0.018951416015625, -0.01056671142578125, -0.0021820068359375, 0.00620269775390625, 0.01458740234375, 0.02297210693359375, 0.0313568115234375, 0.03974151611328125, 0.048126220703125, 0.05651092529296875, 0.0648956298828125, 0.07328033447265625, 0.0816650390625, 0.09004974365234375, 0.0984344482421875, 0.10681915283203125, 0.115203857421875, 0.12358856201171875, 0.1319732666015625, 0.14035797119140625, 0.14874267578125, 0.15712738037109375, 0.1655120849609375, 0.17389678955078125, 0.182281494140625, 0.19066619873046875, 0.1990509033203125, 0.20743560791015625, 0.2158203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 2.0, 13.0, 15.0, 7.0, 18.0, 23.0, 19.0, 32.0, 33.0, 66.0, 91.0, 168.0, 162.0, 95.0, 74.0, 47.0, 28.0, 21.0, 22.0, 11.0, 13.0, 6.0, 5.0, 7.0, 3.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06744384765625, -0.06474494934082031, -0.062046051025390625, -0.05934715270996094, -0.05664825439453125, -0.05394935607910156, -0.051250457763671875, -0.04855155944824219, -0.0458526611328125, -0.04315376281738281, -0.040454864501953125, -0.03775596618652344, -0.03505706787109375, -0.03235816955566406, -0.029659271240234375, -0.026960372924804688, -0.024261474609375, -0.021562576293945312, -0.018863677978515625, -0.016164779663085938, -0.01346588134765625, -0.010766983032226562, -0.008068084716796875, -0.0053691864013671875, -0.0026702880859375, 2.86102294921875e-05, 0.002727508544921875, 0.0054264068603515625, 0.00812530517578125, 0.010824203491210938, 0.013523101806640625, 0.016222000122070312, 0.0189208984375, 0.021619796752929688, 0.024318695068359375, 0.027017593383789062, 0.02971649169921875, 0.03241539001464844, 0.035114288330078125, 0.03781318664550781, 0.0405120849609375, 0.04321098327636719, 0.045909881591796875, 0.04860877990722656, 0.05130767822265625, 0.05400657653808594, 0.056705474853515625, 0.05940437316894531, 0.062103271484375, 0.06480216979980469, 0.06750106811523438, 0.07019996643066406, 0.07289886474609375, 0.07559776306152344, 0.07829666137695312, 0.08099555969238281, 0.0836944580078125, 0.08639335632324219, 0.08909225463867188, 0.09179115295410156, 0.09449005126953125, 0.09718894958496094, 0.09988784790039062, 0.10258674621582031, 0.10528564453125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 14.0, 16.0, 20.0, 32.0, 39.0, 64.0, 84.0, 109.0, 116.0, 121.0, 101.0, 83.0, 64.0, 46.0, 24.0, 19.0, 13.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1650704145431519, -1.1197429895401, -1.074415683746338, -1.0290882587432861, -0.9837608337402344, -0.9384334087371826, -0.8931060433387756, -0.8477786779403687, -0.8024512529373169, -0.7571238279342651, -0.7117964625358582, -0.6664690971374512, -0.6211416721343994, -0.5758142471313477, -0.5304868817329407, -0.4851594865322113, -0.43983209133148193, -0.39450469613075256, -0.3491773009300232, -0.3038499057292938, -0.25852251052856445, -0.21319511532783508, -0.1678677201271057, -0.12254032492637634, -0.07721292972564697, -0.0318855345249176, 0.013441860675811768, 0.05876925587654114, 0.10409665107727051, 0.14942404627799988, 0.19475144147872925, 0.24007883667945862, 0.28540611267089844, 0.3307335078716278, 0.3760609030723572, 0.42138829827308655, 0.4667156934738159, 0.5120431184768677, 0.5573704838752747, 0.6026978492736816, 0.6480252742767334, 0.6933526992797852, 0.7386800646781921, 0.7840074300765991, 0.8293348550796509, 0.8746622800827026, 0.9199896454811096, 0.9653170108795166, 1.0106444358825684, 1.0559718608856201, 1.1012992858886719, 1.146626591682434, 1.1919540166854858, 1.2372814416885376, 1.2826087474822998, 1.3279361724853516, 1.3732635974884033, 1.418591022491455, 1.4639184474945068, 1.509245753288269, 1.5545731782913208, 1.5999006032943726, 1.6452279090881348, 1.6905553340911865, 1.7358827590942383]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 4.0, 2.0, 7.0, 9.0, 4.0, 14.0, 11.0, 24.0, 17.0, 14.0, 16.0, 27.0, 31.0, 27.0, 25.0, 36.0, 32.0, 28.0, 29.0, 32.0, 47.0, 34.0, 37.0, 36.0, 38.0, 36.0, 47.0, 44.0, 35.0, 38.0, 32.0, 28.0, 30.0, 27.0, 14.0, 14.0, 9.0, 10.0, 11.0, 10.0, 5.0, 9.0, 5.0, 3.0, 8.0, 3.0, 3.0, 1.0, 0.0, 4.0], "bins": [-1.4448002576828003, -1.4044328927993774, -1.3640656471252441, -1.3236982822418213, -1.2833309173583984, -1.2429635524749756, -1.2025963068008423, -1.1622289419174194, -1.1218616962432861, -1.0814943313598633, -1.04112708568573, -1.0007597208023071, -0.9603923559188843, -0.9200250506401062, -0.8796577453613281, -0.8392903804779053, -0.7989230155944824, -0.7585557103157043, -0.7181883454322815, -0.6778210401535034, -0.6374536752700806, -0.5970863699913025, -0.5567190647125244, -0.5163516998291016, -0.4759843945503235, -0.435617059469223, -0.39524972438812256, -0.3548824191093445, -0.314515084028244, -0.27414774894714355, -0.23378042876720428, -0.19341310858726501, -0.153045654296875, -0.11267832666635513, -0.07231099903583527, -0.0319436714053154, 0.008423656225204468, 0.04879099130630493, 0.0891583114862442, 0.12952563166618347, 0.16989296674728394, 0.2102603018283844, 0.25062763690948486, 0.29099494218826294, 0.3313622772693634, 0.37172961235046387, 0.41209691762924194, 0.4524642527103424, 0.49283158779144287, 0.533198893070221, 0.5735662579536438, 0.6139335632324219, 0.6543009281158447, 0.6946682333946228, 0.7350355386734009, 0.7754029035568237, 0.8157702088356018, 0.8561375141143799, 0.8965048789978027, 0.9368721842765808, 0.9772394895553589, 1.0176068544387817, 1.0579742193222046, 1.098341464996338, 1.1387088298797607]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 6.0, 9.0, 20.0, 17.0, 19.0, 41.0, 44.0, 76.0, 106.0, 169.0, 294.0, 486.0, 826.0, 1932.0, 4404.0, 14529.0, 81399.0, 1892925.0, 2082649.0, 89530.0, 15801.0, 4804.0, 1937.0, 937.0, 492.0, 285.0, 182.0, 107.0, 77.0, 48.0, 41.0, 26.0, 21.0, 4.0, 8.0, 10.0, 7.0, 4.0, 2.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.810546875, -0.7816162109375, -0.752685546875, -0.7237548828125, -0.69482421875, -0.6658935546875, -0.636962890625, -0.6080322265625, -0.5791015625, -0.5501708984375, -0.521240234375, -0.4923095703125, -0.46337890625, -0.4344482421875, -0.405517578125, -0.3765869140625, -0.34765625, -0.3187255859375, -0.289794921875, -0.2608642578125, -0.23193359375, -0.2030029296875, -0.174072265625, -0.1451416015625, -0.1162109375, -0.0872802734375, -0.058349609375, -0.0294189453125, -0.00048828125, 0.0284423828125, 0.057373046875, 0.0863037109375, 0.115234375, 0.1441650390625, 0.173095703125, 0.2020263671875, 0.23095703125, 0.2598876953125, 0.288818359375, 0.3177490234375, 0.3466796875, 0.3756103515625, 0.404541015625, 0.4334716796875, 0.46240234375, 0.4913330078125, 0.520263671875, 0.5491943359375, 0.578125, 0.6070556640625, 0.635986328125, 0.6649169921875, 0.69384765625, 0.7227783203125, 0.751708984375, 0.7806396484375, 0.8095703125, 0.8385009765625, 0.867431640625, 0.8963623046875, 0.92529296875, 0.9542236328125, 0.983154296875, 1.0120849609375, 1.041015625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 5.0, 7.0, 3.0, 8.0, 9.0, 13.0, 16.0, 22.0, 29.0, 25.0, 37.0, 29.0, 50.0, 51.0, 67.0, 52.0, 57.0, 55.0, 50.0, 49.0, 58.0, 53.0, 55.0, 39.0, 38.0, 32.0, 16.0, 22.0, 13.0, 9.0, 7.0, 9.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.458251953125, -0.44446563720703125, -0.4306793212890625, -0.41689300537109375, -0.403106689453125, -0.38932037353515625, -0.3755340576171875, -0.36174774169921875, -0.34796142578125, -0.33417510986328125, -0.3203887939453125, -0.30660247802734375, -0.292816162109375, -0.27902984619140625, -0.2652435302734375, -0.25145721435546875, -0.2376708984375, -0.22388458251953125, -0.2100982666015625, -0.19631195068359375, -0.182525634765625, -0.16873931884765625, -0.1549530029296875, -0.14116668701171875, -0.12738037109375, -0.11359405517578125, -0.0998077392578125, -0.08602142333984375, -0.072235107421875, -0.05844879150390625, -0.0446624755859375, -0.03087615966796875, -0.01708984375, -0.00330352783203125, 0.0104827880859375, 0.02426910400390625, 0.038055419921875, 0.05184173583984375, 0.0656280517578125, 0.07941436767578125, 0.09320068359375, 0.10698699951171875, 0.1207733154296875, 0.13455963134765625, 0.148345947265625, 0.16213226318359375, 0.1759185791015625, 0.18970489501953125, 0.2034912109375, 0.21727752685546875, 0.2310638427734375, 0.24485015869140625, 0.258636474609375, 0.27242279052734375, 0.2862091064453125, 0.29999542236328125, 0.31378173828125, 0.32756805419921875, 0.3413543701171875, 0.35514068603515625, 0.368927001953125, 0.38271331787109375, 0.3964996337890625, 0.41028594970703125, 0.424072265625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 9.0, 5.0, 10.0, 10.0, 16.0, 21.0, 36.0, 51.0, 69.0, 100.0, 153.0, 266.0, 483.0, 1048.0, 2923.0, 12783.0, 104028.0, 3553192.0, 481523.0, 29024.0, 5370.0, 1577.0, 693.0, 321.0, 202.0, 111.0, 73.0, 49.0, 47.0, 23.0, 20.0, 11.0, 4.0, 7.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.4074859619140625, -1.365753173828125, -1.3240203857421875, -1.28228759765625, -1.2405548095703125, -1.198822021484375, -1.1570892333984375, -1.1153564453125, -1.0736236572265625, -1.031890869140625, -0.9901580810546875, -0.94842529296875, -0.9066925048828125, -0.864959716796875, -0.8232269287109375, -0.781494140625, -0.7397613525390625, -0.698028564453125, -0.6562957763671875, -0.61456298828125, -0.5728302001953125, -0.531097412109375, -0.4893646240234375, -0.4476318359375, -0.4058990478515625, -0.364166259765625, -0.3224334716796875, -0.28070068359375, -0.2389678955078125, -0.197235107421875, -0.1555023193359375, -0.11376953125, -0.0720367431640625, -0.030303955078125, 0.0114288330078125, 0.05316162109375, 0.0948944091796875, 0.136627197265625, 0.1783599853515625, 0.2200927734375, 0.2618255615234375, 0.303558349609375, 0.3452911376953125, 0.38702392578125, 0.4287567138671875, 0.470489501953125, 0.5122222900390625, 0.553955078125, 0.5956878662109375, 0.637420654296875, 0.6791534423828125, 0.72088623046875, 0.7626190185546875, 0.804351806640625, 0.8460845947265625, 0.8878173828125, 0.9295501708984375, 0.971282958984375, 1.0130157470703125, 1.05474853515625, 1.0964813232421875, 1.138214111328125, 1.1799468994140625, 1.2216796875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 7.0, 15.0, 17.0, 38.0, 43.0, 70.0, 116.0, 197.0, 363.0, 583.0, 893.0, 721.0, 404.0, 207.0, 133.0, 85.0, 39.0, 35.0, 24.0, 16.0, 16.0, 8.0, 6.0, 5.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.297119140625, -0.2874183654785156, -0.27771759033203125, -0.2680168151855469, -0.2583160400390625, -0.24861526489257812, -0.23891448974609375, -0.22921371459960938, -0.219512939453125, -0.20981216430664062, -0.20011138916015625, -0.19041061401367188, -0.1807098388671875, -0.17100906372070312, -0.16130828857421875, -0.15160751342773438, -0.14190673828125, -0.13220596313476562, -0.12250518798828125, -0.11280441284179688, -0.1031036376953125, -0.09340286254882812, -0.08370208740234375, -0.07400131225585938, -0.064300537109375, -0.054599761962890625, -0.04489898681640625, -0.035198211669921875, -0.0254974365234375, -0.015796661376953125, -0.00609588623046875, 0.003604888916015625, 0.0133056640625, 0.023006439208984375, 0.03270721435546875, 0.042407989501953125, 0.0521087646484375, 0.061809539794921875, 0.07151031494140625, 0.08121109008789062, 0.090911865234375, 0.10061264038085938, 0.11031341552734375, 0.12001419067382812, 0.1297149658203125, 0.13941574096679688, 0.14911651611328125, 0.15881729125976562, 0.16851806640625, 0.17821884155273438, 0.18791961669921875, 0.19762039184570312, 0.2073211669921875, 0.21702194213867188, 0.22672271728515625, 0.23642349243164062, 0.246124267578125, 0.2558250427246094, 0.26552581787109375, 0.2752265930175781, 0.2849273681640625, 0.2946281433105469, 0.30432891845703125, 0.3140296936035156, 0.32373046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 0.0, 2.0, 5.0, 4.0, 8.0, 14.0, 15.0, 14.0, 32.0, 32.0, 30.0, 47.0, 65.0, 67.0, 89.0, 84.0, 89.0, 88.0, 67.0, 63.0, 48.0, 31.0, 29.0, 23.0, 14.0, 11.0, 9.0, 9.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8688849210739136, -0.8431196808815002, -0.8173544406890869, -0.7915891408920288, -0.7658239006996155, -0.7400586605072021, -0.7142934203147888, -0.6885281801223755, -0.6627628803253174, -0.636997640132904, -0.6112323999404907, -0.5854671001434326, -0.5597018599510193, -0.533936619758606, -0.5081713795661926, -0.4824061393737793, -0.45664089918136597, -0.43087565898895264, -0.4051103889942169, -0.3793451488018036, -0.35357987880706787, -0.32781463861465454, -0.3020493984222412, -0.2762841582298279, -0.25051888823509216, -0.22475363314151764, -0.19898837804794312, -0.17322313785552979, -0.14745788276195526, -0.12169262766838074, -0.09592738747596741, -0.07016213238239288, -0.044396936893463135, -0.01863168552517891, 0.007133565843105316, 0.03289881348609924, 0.05866406857967377, 0.08442932367324829, 0.11019456386566162, 0.13595981895923615, 0.16172507405281067, 0.1874903291463852, 0.21325558423995972, 0.23902082443237305, 0.2647860646247864, 0.2905513346195221, 0.3163165748119354, 0.34208184480667114, 0.3678470849990845, 0.3936123251914978, 0.4193775951862335, 0.44514283537864685, 0.47090810537338257, 0.4966733455657959, 0.5224385857582092, 0.5482038259506226, 0.5739691257476807, 0.599734365940094, 0.6254996061325073, 0.6512649059295654, 0.6770301461219788, 0.7027953863143921, 0.7285606265068054, 0.7543258666992188, 0.7800911068916321]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 6.0, 14.0, 9.0, 19.0, 7.0, 24.0, 24.0, 32.0, 30.0, 28.0, 38.0, 29.0, 36.0, 46.0, 49.0, 51.0, 56.0, 50.0, 42.0, 46.0, 40.0, 46.0, 35.0, 41.0, 32.0, 31.0, 21.0, 22.0, 21.0, 14.0, 13.0, 8.0, 11.0, 6.0, 5.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.5837039947509766, -0.5664398670196533, -0.5491757988929749, -0.5319116711616516, -0.5146476030349731, -0.4973834753036499, -0.48011937737464905, -0.4628552794456482, -0.44559118151664734, -0.4283270835876465, -0.41106298565864563, -0.3937988877296448, -0.37653475999832153, -0.35927069187164307, -0.3420065641403198, -0.32474246621131897, -0.3074783682823181, -0.29021427035331726, -0.2729501724243164, -0.25568607449531555, -0.2384219616651535, -0.22115786373615265, -0.2038937509059906, -0.18662965297698975, -0.1693655550479889, -0.15210145711898804, -0.13483735918998718, -0.11757324635982513, -0.10030914843082428, -0.08304505050182343, -0.06578094512224197, -0.04851683974266052, -0.03125268220901489, -0.01398858055472374, 0.0032755210995674133, 0.020539622753858566, 0.03780372440814972, 0.055067822337150574, 0.07233192771673203, 0.08959603309631348, 0.10686013102531433, 0.12412422895431519, 0.14138832688331604, 0.1586524397134781, 0.17591653764247894, 0.1931806355714798, 0.21044474840164185, 0.2277088463306427, 0.24497294425964355, 0.2622370421886444, 0.27950114011764526, 0.2967652380466461, 0.314029335975647, 0.3312934637069702, 0.34855756163597107, 0.3658216595649719, 0.3830857574939728, 0.40034985542297363, 0.4176139533519745, 0.43487805128097534, 0.4521421790122986, 0.46940624713897705, 0.4866703748703003, 0.5039345026016235, 0.521198570728302]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 10.0, 6.0, 9.0, 27.0, 29.0, 53.0, 66.0, 90.0, 131.0, 224.0, 359.0, 596.0, 1114.0, 2087.0, 4040.0, 8338.0, 19034.0, 46272.0, 128440.0, 348262.0, 308992.0, 108431.0, 39847.0, 16684.0, 7384.0, 3657.0, 1816.0, 1027.0, 566.0, 340.0, 195.0, 130.0, 87.0, 66.0, 45.0, 27.0, 17.0, 17.0, 8.0, 8.0, 3.0, 1.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.1319580078125, -0.12828445434570312, -0.12461090087890625, -0.12093734741210938, -0.1172637939453125, -0.11359024047851562, -0.10991668701171875, -0.10624313354492188, -0.102569580078125, -0.09889602661132812, -0.09522247314453125, -0.09154891967773438, -0.0878753662109375, -0.08420181274414062, -0.08052825927734375, -0.07685470581054688, -0.07318115234375, -0.06950759887695312, -0.06583404541015625, -0.062160491943359375, -0.0584869384765625, -0.054813385009765625, -0.05113983154296875, -0.047466278076171875, -0.043792724609375, -0.040119171142578125, -0.03644561767578125, -0.032772064208984375, -0.0290985107421875, -0.025424957275390625, -0.02175140380859375, -0.018077850341796875, -0.014404296875, -0.010730743408203125, -0.00705718994140625, -0.003383636474609375, 0.0002899169921875, 0.003963470458984375, 0.00763702392578125, 0.011310577392578125, 0.014984130859375, 0.018657684326171875, 0.02233123779296875, 0.026004791259765625, 0.0296783447265625, 0.033351898193359375, 0.03702545166015625, 0.040699005126953125, 0.04437255859375, 0.048046112060546875, 0.05171966552734375, 0.055393218994140625, 0.0590667724609375, 0.06274032592773438, 0.06641387939453125, 0.07008743286132812, 0.073760986328125, 0.07743453979492188, 0.08110809326171875, 0.08478164672851562, 0.0884552001953125, 0.09212875366210938, 0.09580230712890625, 0.09947586059570312, 0.1031494140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 6.0, 7.0, 7.0, 12.0, 17.0, 18.0, 22.0, 26.0, 33.0, 35.0, 34.0, 43.0, 38.0, 59.0, 54.0, 66.0, 46.0, 69.0, 50.0, 44.0, 48.0, 40.0, 39.0, 35.0, 25.0, 26.0, 26.0, 10.0, 14.0, 12.0, 9.0, 9.0, 7.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.3874168395996094, -0.37541961669921875, -0.3634223937988281, -0.3514251708984375, -0.3394279479980469, -0.32743072509765625, -0.3154335021972656, -0.303436279296875, -0.2914390563964844, -0.27944183349609375, -0.2674446105957031, -0.2554473876953125, -0.24345016479492188, -0.23145294189453125, -0.21945571899414062, -0.20745849609375, -0.19546127319335938, -0.18346405029296875, -0.17146682739257812, -0.1594696044921875, -0.14747238159179688, -0.13547515869140625, -0.12347793579101562, -0.111480712890625, -0.09948348999023438, -0.08748626708984375, -0.07548904418945312, -0.0634918212890625, -0.051494598388671875, -0.03949737548828125, -0.027500152587890625, -0.0155029296875, -0.003505706787109375, 0.00849151611328125, 0.020488739013671875, 0.0324859619140625, 0.044483184814453125, 0.05648040771484375, 0.06847763061523438, 0.080474853515625, 0.09247207641601562, 0.10446929931640625, 0.11646652221679688, 0.1284637451171875, 0.14046096801757812, 0.15245819091796875, 0.16445541381835938, 0.17645263671875, 0.18844985961914062, 0.20044708251953125, 0.21244430541992188, 0.2244415283203125, 0.23643875122070312, 0.24843597412109375, 0.2604331970214844, 0.272430419921875, 0.2844276428222656, 0.29642486572265625, 0.3084220886230469, 0.3204193115234375, 0.3324165344238281, 0.34441375732421875, 0.3564109802246094, 0.368408203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 5.0, 17.0, 19.0, 27.0, 42.0, 68.0, 97.0, 171.0, 305.0, 593.0, 1266.0, 3054.0, 10104.0, 44758.0, 290606.0, 567130.0, 102774.0, 18826.0, 5147.0, 1803.0, 808.0, 387.0, 221.0, 126.0, 63.0, 38.0, 29.0, 22.0, 13.0, 7.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1614990234375, -0.15663909912109375, -0.1517791748046875, -0.14691925048828125, -0.142059326171875, -0.13719940185546875, -0.1323394775390625, -0.12747955322265625, -0.12261962890625, -0.11775970458984375, -0.1128997802734375, -0.10803985595703125, -0.103179931640625, -0.09832000732421875, -0.0934600830078125, -0.08860015869140625, -0.083740234375, -0.07888031005859375, -0.0740203857421875, -0.06916046142578125, -0.064300537109375, -0.05944061279296875, -0.0545806884765625, -0.04972076416015625, -0.04486083984375, -0.04000091552734375, -0.0351409912109375, -0.03028106689453125, -0.025421142578125, -0.02056121826171875, -0.0157012939453125, -0.01084136962890625, -0.0059814453125, -0.00112152099609375, 0.0037384033203125, 0.00859832763671875, 0.013458251953125, 0.01831817626953125, 0.0231781005859375, 0.02803802490234375, 0.03289794921875, 0.03775787353515625, 0.0426177978515625, 0.04747772216796875, 0.052337646484375, 0.05719757080078125, 0.0620574951171875, 0.06691741943359375, 0.07177734375, 0.07663726806640625, 0.0814971923828125, 0.08635711669921875, 0.091217041015625, 0.09607696533203125, 0.1009368896484375, 0.10579681396484375, 0.11065673828125, 0.11551666259765625, 0.1203765869140625, 0.12523651123046875, 0.130096435546875, 0.13495635986328125, 0.1398162841796875, 0.14467620849609375, 0.1495361328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 9.0, 4.0, 6.0, 7.0, 9.0, 11.0, 12.0, 17.0, 14.0, 15.0, 26.0, 42.0, 25.0, 22.0, 38.0, 30.0, 40.0, 42.0, 49.0, 61.0, 47.0, 45.0, 65.0, 30.0, 55.0, 39.0, 41.0, 34.0, 24.0, 24.0, 21.0, 16.0, 14.0, 19.0, 7.0, 5.0, 9.0, 5.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.67236328125, -0.650604248046875, -0.62884521484375, -0.607086181640625, -0.5853271484375, -0.563568115234375, -0.54180908203125, -0.520050048828125, -0.498291015625, -0.476531982421875, -0.45477294921875, -0.433013916015625, -0.4112548828125, -0.389495849609375, -0.36773681640625, -0.345977783203125, -0.32421875, -0.302459716796875, -0.28070068359375, -0.258941650390625, -0.2371826171875, -0.215423583984375, -0.19366455078125, -0.171905517578125, -0.150146484375, -0.128387451171875, -0.10662841796875, -0.084869384765625, -0.0631103515625, -0.041351318359375, -0.01959228515625, 0.002166748046875, 0.02392578125, 0.045684814453125, 0.06744384765625, 0.089202880859375, 0.1109619140625, 0.132720947265625, 0.15447998046875, 0.176239013671875, 0.197998046875, 0.219757080078125, 0.24151611328125, 0.263275146484375, 0.2850341796875, 0.306793212890625, 0.32855224609375, 0.350311279296875, 0.3720703125, 0.393829345703125, 0.41558837890625, 0.437347412109375, 0.4591064453125, 0.480865478515625, 0.50262451171875, 0.524383544921875, 0.546142578125, 0.567901611328125, 0.58966064453125, 0.611419677734375, 0.6331787109375, 0.654937744140625, 0.67669677734375, 0.698455810546875, 0.72021484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 8.0, 9.0, 13.0, 29.0, 33.0, 43.0, 90.0, 152.0, 278.0, 600.0, 1112.0, 2431.0, 6358.0, 20085.0, 93995.0, 632245.0, 235594.0, 38019.0, 10455.0, 3688.0, 1508.0, 800.0, 396.0, 216.0, 135.0, 86.0, 52.0, 30.0, 21.0, 20.0, 11.0, 15.0, 6.0, 1.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0], "bins": [-0.1046142578125, -0.1019124984741211, -0.09921073913574219, -0.09650897979736328, -0.09380722045898438, -0.09110546112060547, -0.08840370178222656, -0.08570194244384766, -0.08300018310546875, -0.08029842376708984, -0.07759666442871094, -0.07489490509033203, -0.07219314575195312, -0.06949138641357422, -0.06678962707519531, -0.0640878677368164, -0.0613861083984375, -0.058684349060058594, -0.05598258972167969, -0.05328083038330078, -0.050579071044921875, -0.04787731170654297, -0.04517555236816406, -0.042473793029785156, -0.03977203369140625, -0.037070274353027344, -0.03436851501464844, -0.03166675567626953, -0.028964996337890625, -0.02626323699951172, -0.023561477661132812, -0.020859718322753906, -0.018157958984375, -0.015456199645996094, -0.012754440307617188, -0.010052680969238281, -0.007350921630859375, -0.004649162292480469, -0.0019474029541015625, 0.0007543563842773438, 0.00345611572265625, 0.006157875061035156, 0.008859634399414062, 0.011561393737792969, 0.014263153076171875, 0.01696491241455078, 0.019666671752929688, 0.022368431091308594, 0.0250701904296875, 0.027771949768066406, 0.030473709106445312, 0.03317546844482422, 0.035877227783203125, 0.03857898712158203, 0.04128074645996094, 0.043982505798339844, 0.04668426513671875, 0.049386024475097656, 0.05208778381347656, 0.05478954315185547, 0.057491302490234375, 0.06019306182861328, 0.06289482116699219, 0.0655965805053711, 0.06829833984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 7.0, 14.0, 13.0, 17.0, 25.0, 30.0, 54.0, 68.0, 85.0, 117.0, 145.0, 101.0, 72.0, 76.0, 46.0, 46.0, 18.0, 10.0, 12.0, 15.0, 7.0, 7.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.947185516357422e-05, -4.8177316784858704e-05, -4.688277840614319e-05, -4.558824002742767e-05, -4.429370164871216e-05, -4.299916326999664e-05, -4.170462489128113e-05, -4.041008651256561e-05, -3.91155481338501e-05, -3.782100975513458e-05, -3.652647137641907e-05, -3.523193299770355e-05, -3.393739461898804e-05, -3.264285624027252e-05, -3.134831786155701e-05, -3.0053779482841492e-05, -2.8759241104125977e-05, -2.746470272541046e-05, -2.6170164346694946e-05, -2.487562596797943e-05, -2.3581087589263916e-05, -2.22865492105484e-05, -2.0992010831832886e-05, -1.969747245311737e-05, -1.8402934074401855e-05, -1.710839569568634e-05, -1.5813857316970825e-05, -1.451931893825531e-05, -1.3224780559539795e-05, -1.193024218082428e-05, -1.0635703802108765e-05, -9.34116542339325e-06, -8.046627044677734e-06, -6.752088665962219e-06, -5.457550287246704e-06, -4.163011908531189e-06, -2.868473529815674e-06, -1.5739351511001587e-06, -2.7939677238464355e-07, 1.0151416063308716e-06, 2.3096799850463867e-06, 3.604218363761902e-06, 4.898756742477417e-06, 6.193295121192932e-06, 7.487833499908447e-06, 8.782371878623962e-06, 1.0076910257339478e-05, 1.1371448636054993e-05, 1.2665987014770508e-05, 1.3960525393486023e-05, 1.5255063772201538e-05, 1.6549602150917053e-05, 1.784414052963257e-05, 1.9138678908348083e-05, 2.04332172870636e-05, 2.1727755665779114e-05, 2.302229404449463e-05, 2.4316832423210144e-05, 2.561137080192566e-05, 2.6905909180641174e-05, 2.820044755935669e-05, 2.9494985938072205e-05, 3.078952431678772e-05, 3.2084062695503235e-05, 3.337860107421875e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 21.0, 34.0, 32.0, 75.0, 120.0, 199.0, 309.0, 590.0, 1081.0, 2015.0, 3961.0, 8769.0, 21196.0, 56299.0, 186724.0, 492887.0, 181585.0, 54909.0, 20626.0, 8714.0, 3950.0, 2007.0, 1046.0, 564.0, 333.0, 207.0, 101.0, 59.0, 54.0, 29.0, 16.0, 12.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0689697265625, -0.06670761108398438, -0.06444549560546875, -0.062183380126953125, -0.0599212646484375, -0.057659149169921875, -0.05539703369140625, -0.053134918212890625, -0.050872802734375, -0.048610687255859375, -0.04634857177734375, -0.044086456298828125, -0.0418243408203125, -0.039562225341796875, -0.03730010986328125, -0.035037994384765625, -0.03277587890625, -0.030513763427734375, -0.02825164794921875, -0.025989532470703125, -0.0237274169921875, -0.021465301513671875, -0.01920318603515625, -0.016941070556640625, -0.014678955078125, -0.012416839599609375, -0.01015472412109375, -0.007892608642578125, -0.0056304931640625, -0.003368377685546875, -0.00110626220703125, 0.001155853271484375, 0.00341796875, 0.005680084228515625, 0.00794219970703125, 0.010204315185546875, 0.0124664306640625, 0.014728546142578125, 0.01699066162109375, 0.019252777099609375, 0.021514892578125, 0.023777008056640625, 0.02603912353515625, 0.028301239013671875, 0.0305633544921875, 0.032825469970703125, 0.03508758544921875, 0.037349700927734375, 0.03961181640625, 0.041873931884765625, 0.04413604736328125, 0.046398162841796875, 0.0486602783203125, 0.050922393798828125, 0.05318450927734375, 0.055446624755859375, 0.057708740234375, 0.059970855712890625, 0.06223297119140625, 0.06449508666992188, 0.0667572021484375, 0.06901931762695312, 0.07128143310546875, 0.07354354858398438, 0.0758056640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 5.0, 6.0, 9.0, 9.0, 7.0, 8.0, 13.0, 19.0, 16.0, 43.0, 50.0, 61.0, 68.0, 70.0, 109.0, 94.0, 89.0, 61.0, 51.0, 43.0, 34.0, 21.0, 23.0, 19.0, 7.0, 10.0, 7.0, 11.0, 8.0, 2.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015533447265625, -0.014957189559936523, -0.014380931854248047, -0.01380467414855957, -0.013228416442871094, -0.012652158737182617, -0.01207590103149414, -0.011499643325805664, -0.010923385620117188, -0.010347127914428711, -0.009770870208740234, -0.009194612503051758, -0.008618354797363281, -0.008042097091674805, -0.007465839385986328, -0.0068895816802978516, -0.006313323974609375, -0.0057370662689208984, -0.005160808563232422, -0.004584550857543945, -0.004008293151855469, -0.003432035446166992, -0.0028557777404785156, -0.002279520034790039, -0.0017032623291015625, -0.001127004623413086, -0.0005507469177246094, 2.5510787963867188e-05, 0.0006017684936523438, 0.0011780261993408203, 0.0017542839050292969, 0.0023305416107177734, 0.00290679931640625, 0.0034830570220947266, 0.004059314727783203, 0.00463557243347168, 0.005211830139160156, 0.005788087844848633, 0.006364345550537109, 0.006940603256225586, 0.0075168609619140625, 0.008093118667602539, 0.008669376373291016, 0.009245634078979492, 0.009821891784667969, 0.010398149490356445, 0.010974407196044922, 0.011550664901733398, 0.012126922607421875, 0.012703180313110352, 0.013279438018798828, 0.013855695724487305, 0.014431953430175781, 0.015008211135864258, 0.015584468841552734, 0.01616072654724121, 0.016736984252929688, 0.017313241958618164, 0.01788949966430664, 0.018465757369995117, 0.019042015075683594, 0.01961827278137207, 0.020194530487060547, 0.020770788192749023, 0.0213470458984375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 18.0, 9.0, 13.0, 21.0, 22.0, 44.0, 42.0, 57.0, 71.0, 77.0, 74.0, 99.0, 86.0, 86.0, 76.0, 50.0, 36.0, 26.0, 29.0, 11.0, 11.0, 10.0, 6.0, 4.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43381404876708984, -0.4177893102169037, -0.4017646014690399, -0.38573986291885376, -0.36971515417099, -0.35369041562080383, -0.3376656770706177, -0.3216409683227539, -0.30561622977256775, -0.2895914912223816, -0.2735667824745178, -0.25754204392433167, -0.2415173202753067, -0.22549259662628174, -0.20946785807609558, -0.19344313442707062, -0.17741841077804565, -0.1613936871290207, -0.14536896347999573, -0.12934422492980957, -0.1133195012807846, -0.09729477763175964, -0.08127004653215408, -0.06524531543254852, -0.04922059178352356, -0.0331958644092083, -0.017171137034893036, -0.001146409660577774, 0.014878317713737488, 0.03090304136276245, 0.04692777246236801, 0.06295250356197357, 0.07897722721099854, 0.0950019508600235, 0.11102668195962906, 0.12705141305923462, 0.14307613670825958, 0.15910086035728455, 0.1751255989074707, 0.19115032255649567, 0.20717504620552063, 0.2231997698545456, 0.23922449350357056, 0.2552492320537567, 0.27127397060394287, 0.28729867935180664, 0.3033234179019928, 0.31934815645217896, 0.3353728652000427, 0.3513976037502289, 0.36742231249809265, 0.3834470510482788, 0.3994717597961426, 0.41549649834632874, 0.4315212368965149, 0.44754594564437866, 0.4635706841945648, 0.479595422744751, 0.49562013149261475, 0.5116448402404785, 0.5276696085929871, 0.5436943173408508, 0.5597190260887146, 0.5757437944412231, 0.5917685031890869]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 12.0, 12.0, 13.0, 12.0, 19.0, 32.0, 21.0, 37.0, 43.0, 42.0, 38.0, 42.0, 59.0, 58.0, 61.0, 59.0, 49.0, 51.0, 57.0, 34.0, 55.0, 34.0, 27.0, 26.0, 20.0, 20.0, 17.0, 6.0, 6.0, 8.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.43590986728668213, -0.424064040184021, -0.41221821308135986, -0.40037235617637634, -0.3885265290737152, -0.3766807019710541, -0.36483484506607056, -0.3529890179634094, -0.3411431908607483, -0.32929736375808716, -0.317451536655426, -0.3056056797504425, -0.29375985264778137, -0.28191402554512024, -0.2700681686401367, -0.2582223415374756, -0.24637651443481445, -0.23453068733215332, -0.222684845328331, -0.21083900332450867, -0.19899317622184753, -0.1871473491191864, -0.17530150711536407, -0.16345566511154175, -0.15160983800888062, -0.13976401090621948, -0.12791816890239716, -0.11607233434915543, -0.1042264997959137, -0.09238066524267197, -0.08053483068943024, -0.06868899613618851, -0.05684316158294678, -0.04499732702970505, -0.03315149247646332, -0.021305657923221588, -0.009459823369979858, 0.0023860111832618713, 0.014231845736503601, 0.02607768028974533, 0.03792351484298706, 0.04976934939622879, 0.06161518394947052, 0.07346101850271225, 0.08530685305595398, 0.09715268760919571, 0.10899852216243744, 0.12084435671567917, 0.1326901912689209, 0.14453601837158203, 0.15638186037540436, 0.16822770237922668, 0.18007352948188782, 0.19191935658454895, 0.20376519858837128, 0.2156110405921936, 0.22745686769485474, 0.23930269479751587, 0.251148521900177, 0.2629943788051605, 0.27484020590782166, 0.2866860330104828, 0.2985318899154663, 0.31037771701812744, 0.3222235441207886]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 11.0, 18.0, 32.0, 33.0, 55.0, 80.0, 129.0, 227.0, 405.0, 607.0, 1140.0, 1904.0, 3254.0, 5989.0, 11417.0, 23175.0, 59920.0, 230472.0, 492540.0, 136710.0, 42130.0, 18057.0, 9020.0, 4791.0, 2663.0, 1447.0, 923.0, 521.0, 335.0, 204.0, 123.0, 73.0, 50.0, 36.0, 21.0, 16.0, 8.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4716796875, -0.45793914794921875, -0.4441986083984375, -0.43045806884765625, -0.416717529296875, -0.40297698974609375, -0.3892364501953125, -0.37549591064453125, -0.36175537109375, -0.34801483154296875, -0.3342742919921875, -0.32053375244140625, -0.306793212890625, -0.29305267333984375, -0.2793121337890625, -0.26557159423828125, -0.2518310546875, -0.23809051513671875, -0.2243499755859375, -0.21060943603515625, -0.196868896484375, -0.18312835693359375, -0.1693878173828125, -0.15564727783203125, -0.14190673828125, -0.12816619873046875, -0.1144256591796875, -0.10068511962890625, -0.086944580078125, -0.07320404052734375, -0.0594635009765625, -0.04572296142578125, -0.031982421875, -0.01824188232421875, -0.0045013427734375, 0.00923919677734375, 0.022979736328125, 0.03672027587890625, 0.0504608154296875, 0.06420135498046875, 0.07794189453125, 0.09168243408203125, 0.1054229736328125, 0.11916351318359375, 0.132904052734375, 0.14664459228515625, 0.1603851318359375, 0.17412567138671875, 0.1878662109375, 0.20160675048828125, 0.2153472900390625, 0.22908782958984375, 0.242828369140625, 0.25656890869140625, 0.2703094482421875, 0.28404998779296875, 0.29779052734375, 0.31153106689453125, 0.3252716064453125, 0.33901214599609375, 0.352752685546875, 0.36649322509765625, 0.3802337646484375, 0.39397430419921875, 0.40771484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 7.0, 6.0, 13.0, 15.0, 14.0, 21.0, 26.0, 25.0, 43.0, 33.0, 45.0, 37.0, 53.0, 47.0, 50.0, 54.0, 65.0, 58.0, 54.0, 49.0, 39.0, 42.0, 32.0, 40.0, 22.0, 26.0, 18.0, 15.0, 9.0, 9.0, 5.0, 7.0, 6.0, 1.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84814453125, -0.8230438232421875, -0.797943115234375, -0.7728424072265625, -0.74774169921875, -0.7226409912109375, -0.697540283203125, -0.6724395751953125, -0.6473388671875, -0.6222381591796875, -0.597137451171875, -0.5720367431640625, -0.54693603515625, -0.5218353271484375, -0.496734619140625, -0.4716339111328125, -0.446533203125, -0.4214324951171875, -0.396331787109375, -0.3712310791015625, -0.34613037109375, -0.3210296630859375, -0.295928955078125, -0.2708282470703125, -0.2457275390625, -0.2206268310546875, -0.195526123046875, -0.1704254150390625, -0.14532470703125, -0.1202239990234375, -0.095123291015625, -0.0700225830078125, -0.044921875, -0.0198211669921875, 0.005279541015625, 0.0303802490234375, 0.05548095703125, 0.0805816650390625, 0.105682373046875, 0.1307830810546875, 0.1558837890625, 0.1809844970703125, 0.206085205078125, 0.2311859130859375, 0.25628662109375, 0.2813873291015625, 0.306488037109375, 0.3315887451171875, 0.356689453125, 0.3817901611328125, 0.406890869140625, 0.4319915771484375, 0.45709228515625, 0.4821929931640625, 0.507293701171875, 0.5323944091796875, 0.5574951171875, 0.5825958251953125, 0.607696533203125, 0.6327972412109375, 0.65789794921875, 0.6829986572265625, 0.708099365234375, 0.7332000732421875, 0.75830078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 14.0, 27.0, 49.0, 116.0, 250.0, 685.0, 2401.0, 12026.0, 122324.0, 854959.0, 46493.0, 6846.0, 1534.0, 463.0, 152.0, 101.0, 44.0, 22.0, 13.0, 10.0, 7.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2041015625, -1.163055419921875, -1.12200927734375, -1.080963134765625, -1.0399169921875, -0.998870849609375, -0.95782470703125, -0.916778564453125, -0.875732421875, -0.834686279296875, -0.79364013671875, -0.752593994140625, -0.7115478515625, -0.670501708984375, -0.62945556640625, -0.588409423828125, -0.54736328125, -0.506317138671875, -0.46527099609375, -0.424224853515625, -0.3831787109375, -0.342132568359375, -0.30108642578125, -0.260040283203125, -0.218994140625, -0.177947998046875, -0.13690185546875, -0.095855712890625, -0.0548095703125, -0.013763427734375, 0.02728271484375, 0.068328857421875, 0.109375, 0.150421142578125, 0.19146728515625, 0.232513427734375, 0.2735595703125, 0.314605712890625, 0.35565185546875, 0.396697998046875, 0.437744140625, 0.478790283203125, 0.51983642578125, 0.560882568359375, 0.6019287109375, 0.642974853515625, 0.68402099609375, 0.725067138671875, 0.76611328125, 0.807159423828125, 0.84820556640625, 0.889251708984375, 0.9302978515625, 0.971343994140625, 1.01239013671875, 1.053436279296875, 1.094482421875, 1.135528564453125, 1.17657470703125, 1.217620849609375, 1.2586669921875, 1.299713134765625, 1.34075927734375, 1.381805419921875, 1.4228515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 9.0, 8.0, 11.0, 18.0, 13.0, 16.0, 20.0, 19.0, 36.0, 37.0, 31.0, 45.0, 40.0, 47.0, 50.0, 45.0, 57.0, 56.0, 58.0, 43.0, 36.0, 44.0, 34.0, 32.0, 28.0, 32.0, 27.0, 25.0, 19.0, 8.0, 5.0, 7.0, 7.0, 2.0, 8.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0], "bins": [-0.94384765625, -0.9179840087890625, -0.892120361328125, -0.8662567138671875, -0.84039306640625, -0.8145294189453125, -0.788665771484375, -0.7628021240234375, -0.7369384765625, -0.7110748291015625, -0.685211181640625, -0.6593475341796875, -0.63348388671875, -0.6076202392578125, -0.581756591796875, -0.5558929443359375, -0.530029296875, -0.5041656494140625, -0.478302001953125, -0.4524383544921875, -0.42657470703125, -0.4007110595703125, -0.374847412109375, -0.3489837646484375, -0.3231201171875, -0.2972564697265625, -0.271392822265625, -0.2455291748046875, -0.21966552734375, -0.1938018798828125, -0.167938232421875, -0.1420745849609375, -0.1162109375, -0.0903472900390625, -0.064483642578125, -0.0386199951171875, -0.01275634765625, 0.0131072998046875, 0.038970947265625, 0.0648345947265625, 0.0906982421875, 0.1165618896484375, 0.142425537109375, 0.1682891845703125, 0.19415283203125, 0.2200164794921875, 0.245880126953125, 0.2717437744140625, 0.297607421875, 0.3234710693359375, 0.349334716796875, 0.3751983642578125, 0.40106201171875, 0.4269256591796875, 0.452789306640625, 0.4786529541015625, 0.5045166015625, 0.5303802490234375, 0.556243896484375, 0.5821075439453125, 0.60797119140625, 0.6338348388671875, 0.659698486328125, 0.6855621337890625, 0.71142578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 7.0, 4.0, 10.0, 15.0, 17.0, 31.0, 73.0, 137.0, 303.0, 883.0, 2912.0, 14954.0, 115646.0, 699699.0, 185336.0, 22748.0, 4027.0, 1049.0, 380.0, 136.0, 80.0, 35.0, 22.0, 16.0, 13.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1737060546875, -0.16664695739746094, -0.15958786010742188, -0.1525287628173828, -0.14546966552734375, -0.1384105682373047, -0.13135147094726562, -0.12429237365722656, -0.1172332763671875, -0.11017417907714844, -0.10311508178710938, -0.09605598449707031, -0.08899688720703125, -0.08193778991699219, -0.07487869262695312, -0.06781959533691406, -0.060760498046875, -0.05370140075683594, -0.046642303466796875, -0.03958320617675781, -0.03252410888671875, -0.025465011596679688, -0.018405914306640625, -0.011346817016601562, -0.0042877197265625, 0.0027713775634765625, 0.009830474853515625, 0.016889572143554688, 0.02394866943359375, 0.031007766723632812, 0.038066864013671875, 0.04512596130371094, 0.05218505859375, 0.05924415588378906, 0.06630325317382812, 0.07336235046386719, 0.08042144775390625, 0.08748054504394531, 0.09453964233398438, 0.10159873962402344, 0.1086578369140625, 0.11571693420410156, 0.12277603149414062, 0.1298351287841797, 0.13689422607421875, 0.1439533233642578, 0.15101242065429688, 0.15807151794433594, 0.165130615234375, 0.17218971252441406, 0.17924880981445312, 0.1863079071044922, 0.19336700439453125, 0.2004261016845703, 0.20748519897460938, 0.21454429626464844, 0.2216033935546875, 0.22866249084472656, 0.23572158813476562, 0.2427806854248047, 0.24983978271484375, 0.2568988800048828, 0.2639579772949219, 0.27101707458496094, 0.278076171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 11.0, 4.0, 6.0, 13.0, 7.0, 9.0, 22.0, 30.0, 27.0, 41.0, 59.0, 63.0, 91.0, 123.0, 107.0, 92.0, 74.0, 59.0, 46.0, 20.0, 22.0, 25.0, 12.0, 18.0, 14.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.11732292175293e-05, -3.033410757780075e-05, -2.9494985938072205e-05, -2.865586429834366e-05, -2.7816742658615112e-05, -2.6977621018886566e-05, -2.613849937915802e-05, -2.5299377739429474e-05, -2.4460256099700928e-05, -2.362113445997238e-05, -2.2782012820243835e-05, -2.194289118051529e-05, -2.1103769540786743e-05, -2.0264647901058197e-05, -1.942552626132965e-05, -1.8586404621601105e-05, -1.774728298187256e-05, -1.6908161342144012e-05, -1.6069039702415466e-05, -1.522991806268692e-05, -1.4390796422958374e-05, -1.3551674783229828e-05, -1.2712553143501282e-05, -1.1873431503772736e-05, -1.103430986404419e-05, -1.0195188224315643e-05, -9.356066584587097e-06, -8.516944944858551e-06, -7.677823305130005e-06, -6.838701665401459e-06, -5.999580025672913e-06, -5.1604583859443665e-06, -4.32133674621582e-06, -3.482215106487274e-06, -2.643093466758728e-06, -1.8039718270301819e-06, -9.648501873016357e-07, -1.257285475730896e-07, 7.133930921554565e-07, 1.5525147318840027e-06, 2.391636371612549e-06, 3.230758011341095e-06, 4.069879651069641e-06, 4.909001290798187e-06, 5.748122930526733e-06, 6.5872445702552795e-06, 7.426366209983826e-06, 8.265487849712372e-06, 9.104609489440918e-06, 9.943731129169464e-06, 1.078285276889801e-05, 1.1621974408626556e-05, 1.2461096048355103e-05, 1.3300217688083649e-05, 1.4139339327812195e-05, 1.4978460967540741e-05, 1.5817582607269287e-05, 1.6656704246997833e-05, 1.749582588672638e-05, 1.8334947526454926e-05, 1.917406916618347e-05, 2.0013190805912018e-05, 2.0852312445640564e-05, 2.169143408536911e-05, 2.2530555725097656e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 11.0, 8.0, 13.0, 22.0, 20.0, 30.0, 64.0, 103.0, 255.0, 701.0, 2130.0, 9160.0, 55004.0, 437698.0, 471320.0, 58753.0, 9764.0, 2300.0, 628.0, 255.0, 106.0, 74.0, 43.0, 20.0, 16.0, 15.0, 7.0, 12.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.208984375, -0.2017822265625, -0.194580078125, -0.1873779296875, -0.18017578125, -0.1729736328125, -0.165771484375, -0.1585693359375, -0.1513671875, -0.1441650390625, -0.136962890625, -0.1297607421875, -0.12255859375, -0.1153564453125, -0.108154296875, -0.1009521484375, -0.09375, -0.0865478515625, -0.079345703125, -0.0721435546875, -0.06494140625, -0.0577392578125, -0.050537109375, -0.0433349609375, -0.0361328125, -0.0289306640625, -0.021728515625, -0.0145263671875, -0.00732421875, -0.0001220703125, 0.007080078125, 0.0142822265625, 0.021484375, 0.0286865234375, 0.035888671875, 0.0430908203125, 0.05029296875, 0.0574951171875, 0.064697265625, 0.0718994140625, 0.0791015625, 0.0863037109375, 0.093505859375, 0.1007080078125, 0.10791015625, 0.1151123046875, 0.122314453125, 0.1295166015625, 0.13671875, 0.1439208984375, 0.151123046875, 0.1583251953125, 0.16552734375, 0.1727294921875, 0.179931640625, 0.1871337890625, 0.1943359375, 0.2015380859375, 0.208740234375, 0.2159423828125, 0.22314453125, 0.2303466796875, 0.237548828125, 0.2447509765625, 0.251953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 16.0, 13.0, 22.0, 18.0, 32.0, 28.0, 37.0, 42.0, 48.0, 71.0, 74.0, 118.0, 87.0, 66.0, 46.0, 54.0, 41.0, 45.0, 35.0, 24.0, 14.0, 20.0, 13.0, 7.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06256103515625, -0.059897422790527344, -0.05723381042480469, -0.05457019805908203, -0.051906585693359375, -0.04924297332763672, -0.04657936096191406, -0.043915748596191406, -0.04125213623046875, -0.038588523864746094, -0.03592491149902344, -0.03326129913330078, -0.030597686767578125, -0.02793407440185547, -0.025270462036132812, -0.022606849670410156, -0.0199432373046875, -0.017279624938964844, -0.014616012573242188, -0.011952400207519531, -0.009288787841796875, -0.006625175476074219, -0.0039615631103515625, -0.0012979507446289062, 0.00136566162109375, 0.004029273986816406, 0.0066928863525390625, 0.009356498718261719, 0.012020111083984375, 0.014683723449707031, 0.017347335815429688, 0.020010948181152344, 0.022674560546875, 0.025338172912597656, 0.028001785278320312, 0.03066539764404297, 0.033329010009765625, 0.03599262237548828, 0.03865623474121094, 0.041319847106933594, 0.04398345947265625, 0.046647071838378906, 0.04931068420410156, 0.05197429656982422, 0.054637908935546875, 0.05730152130126953, 0.05996513366699219, 0.06262874603271484, 0.0652923583984375, 0.06795597076416016, 0.07061958312988281, 0.07328319549560547, 0.07594680786132812, 0.07861042022705078, 0.08127403259277344, 0.0839376449584961, 0.08660125732421875, 0.0892648696899414, 0.09192848205566406, 0.09459209442138672, 0.09725570678710938, 0.09991931915283203, 0.10258293151855469, 0.10524654388427734, 0.10791015625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 3.0, 18.0, 30.0, 53.0, 95.0, 139.0, 191.0, 174.0, 129.0, 84.0, 44.0, 27.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4290276765823364, -1.353173851966858, -1.2773200273513794, -1.2014660835266113, -1.1256122589111328, -1.0497584342956543, -0.9739046096801758, -0.8980507254600525, -0.822196900844574, -0.7463430762290955, -0.6704891920089722, -0.5946353673934937, -0.5187815427780151, -0.44292765855789185, -0.36707383394241333, -0.29121994972229004, -0.21536612510681152, -0.13951227068901062, -0.06365843117237091, 0.012195408344268799, 0.0880492627620697, 0.1639031171798706, 0.23975694179534912, 0.3156108260154724, 0.3914646506309509, 0.46731850504875183, 0.5431723594665527, 0.6190261840820312, 0.6948800086975098, 0.7707338929176331, 0.8465877175331116, 0.9224416017532349, 0.9982953071594238, 1.0741491317749023, 1.1500029563903809, 1.2258567810058594, 1.3017107248306274, 1.377564549446106, 1.4534183740615845, 1.5292723178863525, 1.605126142501831, 1.6809799671173096, 1.756833791732788, 1.8326876163482666, 1.9085415601730347, 1.9843953847885132, 2.0602493286132812, 2.1361031532287598, 2.2119569778442383, 2.287810802459717, 2.3636646270751953, 2.439518451690674, 2.5153722763061523, 2.591226100921631, 2.6670799255371094, 2.742933988571167, 2.8187875747680664, 2.894641399383545, 2.9704952239990234, 3.046349048614502, 3.1222028732299805, 3.198056697845459, 3.2739105224609375, 3.349764585494995, 3.4256184101104736]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 6.0, 4.0, 5.0, 7.0, 13.0, 7.0, 10.0, 18.0, 19.0, 18.0, 24.0, 34.0, 22.0, 30.0, 35.0, 44.0, 55.0, 40.0, 35.0, 41.0, 40.0, 53.0, 34.0, 41.0, 37.0, 41.0, 44.0, 38.0, 40.0, 22.0, 22.0, 21.0, 16.0, 16.0, 10.0, 11.0, 9.0, 10.0, 5.0, 4.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2290598154067993, -1.1891682147979736, -1.149276614189148, -1.1093850135803223, -1.0694934129714966, -1.029601812362671, -0.9897102117538452, -0.9498186111450195, -0.9099270105361938, -0.8700354099273682, -0.8301438093185425, -0.7902522087097168, -0.7503606081008911, -0.7104690074920654, -0.6705774068832397, -0.6306858062744141, -0.5907941460609436, -0.5509025454521179, -0.5110109448432922, -0.47111934423446655, -0.43122774362564087, -0.3913361430168152, -0.3514445126056671, -0.31155291199684143, -0.27166131138801575, -0.23176971077919006, -0.19187811017036438, -0.1519864946603775, -0.11209489405155182, -0.07220329344272614, -0.03231167793273926, 0.007579922676086426, 0.04747152328491211, 0.08736312389373779, 0.12725472450256348, 0.16714634001255035, 0.20703794062137604, 0.24692954123020172, 0.2868211567401886, 0.3267127573490143, 0.36660435795783997, 0.40649595856666565, 0.44638755917549133, 0.4862791895866394, 0.5261707901954651, 0.5660623908042908, 0.6059539914131165, 0.6458455920219421, 0.6857371926307678, 0.7256287932395935, 0.7655203938484192, 0.8054119944572449, 0.8453035950660706, 0.8851951956748962, 0.9250868558883667, 0.9649784564971924, 1.004870057106018, 1.0447616577148438, 1.0846532583236694, 1.1245448589324951, 1.1644364595413208, 1.2043280601501465, 1.2442196607589722, 1.2841112613677979, 1.3240028619766235]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 10.0, 6.0, 15.0, 15.0, 22.0, 26.0, 44.0, 57.0, 73.0, 109.0, 144.0, 183.0, 282.0, 473.0, 710.0, 1193.0, 2124.0, 4104.0, 8482.0, 21958.0, 80337.0, 723258.0, 2847475.0, 411283.0, 57942.0, 18156.0, 7265.0, 3614.0, 1916.0, 1040.0, 625.0, 422.0, 272.0, 185.0, 132.0, 81.0, 61.0, 44.0, 35.0, 22.0, 24.0, 23.0, 9.0, 10.0, 3.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-0.6552734375, -0.6343994140625, -0.613525390625, -0.5926513671875, -0.57177734375, -0.5509033203125, -0.530029296875, -0.5091552734375, -0.48828125, -0.4674072265625, -0.446533203125, -0.4256591796875, -0.40478515625, -0.3839111328125, -0.363037109375, -0.3421630859375, -0.3212890625, -0.3004150390625, -0.279541015625, -0.2586669921875, -0.23779296875, -0.2169189453125, -0.196044921875, -0.1751708984375, -0.154296875, -0.1334228515625, -0.112548828125, -0.0916748046875, -0.07080078125, -0.0499267578125, -0.029052734375, -0.0081787109375, 0.0126953125, 0.0335693359375, 0.054443359375, 0.0753173828125, 0.09619140625, 0.1170654296875, 0.137939453125, 0.1588134765625, 0.1796875, 0.2005615234375, 0.221435546875, 0.2423095703125, 0.26318359375, 0.2840576171875, 0.304931640625, 0.3258056640625, 0.3466796875, 0.3675537109375, 0.388427734375, 0.4093017578125, 0.43017578125, 0.4510498046875, 0.471923828125, 0.4927978515625, 0.513671875, 0.5345458984375, 0.555419921875, 0.5762939453125, 0.59716796875, 0.6180419921875, 0.638916015625, 0.6597900390625, 0.6806640625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 15.0, 18.0, 9.0, 15.0, 24.0, 33.0, 24.0, 35.0, 46.0, 38.0, 74.0, 46.0, 54.0, 61.0, 60.0, 41.0, 57.0, 56.0, 46.0, 45.0, 37.0, 35.0, 24.0, 18.0, 16.0, 12.0, 9.0, 11.0, 3.0, 4.0, 3.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0], "bins": [-0.431640625, -0.4202384948730469, -0.40883636474609375, -0.3974342346191406, -0.3860321044921875, -0.3746299743652344, -0.36322784423828125, -0.3518257141113281, -0.340423583984375, -0.3290214538574219, -0.31761932373046875, -0.3062171936035156, -0.2948150634765625, -0.2834129333496094, -0.27201080322265625, -0.2606086730957031, -0.24920654296875, -0.23780441284179688, -0.22640228271484375, -0.21500015258789062, -0.2035980224609375, -0.19219589233398438, -0.18079376220703125, -0.16939163208007812, -0.157989501953125, -0.14658737182617188, -0.13518524169921875, -0.12378311157226562, -0.1123809814453125, -0.10097885131835938, -0.08957672119140625, -0.07817459106445312, -0.0667724609375, -0.055370330810546875, -0.04396820068359375, -0.032566070556640625, -0.0211639404296875, -0.009761810302734375, 0.00164031982421875, 0.013042449951171875, 0.024444580078125, 0.035846710205078125, 0.04724884033203125, 0.058650970458984375, 0.0700531005859375, 0.08145523071289062, 0.09285736083984375, 0.10425949096679688, 0.11566162109375, 0.12706375122070312, 0.13846588134765625, 0.14986801147460938, 0.1612701416015625, 0.17267227172851562, 0.18407440185546875, 0.19547653198242188, 0.206878662109375, 0.21828079223632812, 0.22968292236328125, 0.24108505249023438, 0.2524871826171875, 0.2638893127441406, 0.27529144287109375, 0.2866935729980469, 0.298095703125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 4.0, 4.0, 8.0, 9.0, 13.0, 15.0, 23.0, 49.0, 66.0, 118.0, 222.0, 499.0, 1420.0, 5698.0, 43627.0, 2687962.0, 1415247.0, 32294.0, 4622.0, 1316.0, 515.0, 247.0, 118.0, 73.0, 37.0, 24.0, 17.0, 5.0, 6.0, 8.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.857421875, -1.8057403564453125, -1.754058837890625, -1.7023773193359375, -1.65069580078125, -1.5990142822265625, -1.547332763671875, -1.4956512451171875, -1.4439697265625, -1.3922882080078125, -1.340606689453125, -1.2889251708984375, -1.23724365234375, -1.1855621337890625, -1.133880615234375, -1.0821990966796875, -1.030517578125, -0.9788360595703125, -0.927154541015625, -0.8754730224609375, -0.82379150390625, -0.7721099853515625, -0.720428466796875, -0.6687469482421875, -0.6170654296875, -0.5653839111328125, -0.513702392578125, -0.4620208740234375, -0.41033935546875, -0.3586578369140625, -0.306976318359375, -0.2552947998046875, -0.20361328125, -0.1519317626953125, -0.100250244140625, -0.0485687255859375, 0.00311279296875, 0.0547943115234375, 0.106475830078125, 0.1581573486328125, 0.2098388671875, 0.2615203857421875, 0.313201904296875, 0.3648834228515625, 0.41656494140625, 0.4682464599609375, 0.519927978515625, 0.5716094970703125, 0.623291015625, 0.6749725341796875, 0.726654052734375, 0.7783355712890625, 0.83001708984375, 0.8816986083984375, 0.933380126953125, 0.9850616455078125, 1.0367431640625, 1.0884246826171875, 1.140106201171875, 1.1917877197265625, 1.24346923828125, 1.2951507568359375, 1.346832275390625, 1.3985137939453125, 1.4501953125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 11.0, 7.0, 24.0, 27.0, 48.0, 63.0, 85.0, 138.0, 207.0, 376.0, 671.0, 836.0, 642.0, 395.0, 196.0, 122.0, 64.0, 45.0, 37.0, 20.0, 16.0, 9.0, 13.0, 2.0, 5.0, 5.0, 4.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29931640625, -0.2888069152832031, -0.27829742431640625, -0.2677879333496094, -0.2572784423828125, -0.24676895141601562, -0.23625946044921875, -0.22574996948242188, -0.215240478515625, -0.20473098754882812, -0.19422149658203125, -0.18371200561523438, -0.1732025146484375, -0.16269302368164062, -0.15218353271484375, -0.14167404174804688, -0.13116455078125, -0.12065505981445312, -0.11014556884765625, -0.09963607788085938, -0.0891265869140625, -0.07861709594726562, -0.06810760498046875, -0.057598114013671875, -0.047088623046875, -0.036579132080078125, -0.02606964111328125, -0.015560150146484375, -0.0050506591796875, 0.005458831787109375, 0.01596832275390625, 0.026477813720703125, 0.0369873046875, 0.047496795654296875, 0.05800628662109375, 0.06851577758789062, 0.0790252685546875, 0.08953475952148438, 0.10004425048828125, 0.11055374145507812, 0.121063232421875, 0.13157272338867188, 0.14208221435546875, 0.15259170532226562, 0.1631011962890625, 0.17361068725585938, 0.18412017822265625, 0.19462966918945312, 0.20513916015625, 0.21564865112304688, 0.22615814208984375, 0.23666763305664062, 0.2471771240234375, 0.2576866149902344, 0.26819610595703125, 0.2787055969238281, 0.289215087890625, 0.2997245788574219, 0.31023406982421875, 0.3207435607910156, 0.3312530517578125, 0.3417625427246094, 0.35227203369140625, 0.3627815246582031, 0.373291015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 2.0, 5.0, 12.0, 9.0, 22.0, 20.0, 23.0, 28.0, 46.0, 53.0, 62.0, 61.0, 56.0, 83.0, 75.0, 65.0, 64.0, 68.0, 36.0, 44.0, 27.0, 34.0, 24.0, 20.0, 19.0, 12.0, 4.0, 8.0, 7.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.793707013130188, -0.770160436630249, -0.7466138601303101, -0.7230673432350159, -0.6995207667350769, -0.6759741902351379, -0.6524276733398438, -0.6288810968399048, -0.6053345203399658, -0.5817879438400269, -0.5582413673400879, -0.5346948504447937, -0.5111482739448547, -0.48760169744491577, -0.4640551507472992, -0.4405086040496826, -0.41696202754974365, -0.3934154510498047, -0.3698689043521881, -0.34632235765457153, -0.32277578115463257, -0.2992292046546936, -0.275682657957077, -0.25213611125946045, -0.22858953475952148, -0.2050429731607437, -0.18149641156196594, -0.15794984996318817, -0.1344032883644104, -0.11085672676563263, -0.08731016516685486, -0.06376360356807709, -0.04021698236465454, -0.01667042076587677, 0.006876140832901001, 0.030422702431678772, 0.05396926403045654, 0.07751582562923431, 0.10106238722801208, 0.12460894882678986, 0.14815551042556763, 0.1717020720243454, 0.19524863362312317, 0.21879519522190094, 0.2423417568206787, 0.2658883333206177, 0.28943488001823425, 0.31298142671585083, 0.3365280032157898, 0.36007457971572876, 0.38362112641334534, 0.4071676731109619, 0.4307142496109009, 0.45426082611083984, 0.4778073728084564, 0.501353919506073, 0.524900496006012, 0.5484470725059509, 0.5719935894012451, 0.5955401659011841, 0.619086742401123, 0.642633318901062, 0.666179895401001, 0.6897264122962952, 0.7132729887962341]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 13.0, 9.0, 6.0, 14.0, 21.0, 15.0, 13.0, 32.0, 26.0, 36.0, 30.0, 42.0, 37.0, 48.0, 46.0, 34.0, 33.0, 29.0, 39.0, 45.0, 44.0, 28.0, 35.0, 44.0, 40.0, 27.0, 28.0, 27.0, 24.0, 12.0, 14.0, 18.0, 17.0, 14.0, 8.0, 10.0, 8.0, 10.0, 5.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.5025694966316223, -0.48626694083213806, -0.4699643850326538, -0.45366182923316956, -0.4373592734336853, -0.42105668783187866, -0.4047541320323944, -0.38845157623291016, -0.3721490204334259, -0.35584646463394165, -0.3395439088344574, -0.32324135303497314, -0.3069387674331665, -0.29063624143600464, -0.274333655834198, -0.25803110003471375, -0.2417285442352295, -0.22542598843574524, -0.209123432636261, -0.19282086193561554, -0.1765183061361313, -0.16021575033664703, -0.1439131796360016, -0.12761062383651733, -0.11130806803703308, -0.09500551223754883, -0.07870294898748398, -0.06240038946270943, -0.046097829937934875, -0.029795274138450623, -0.013492710888385773, 0.002809852361679077, 0.019112467765808105, 0.03541502729058266, 0.05171758681535721, 0.06802015006542206, 0.08432270586490631, 0.10062526166439056, 0.11692782491445541, 0.13323038816452026, 0.14953294396400452, 0.16583549976348877, 0.18213805556297302, 0.19844062626361847, 0.21474318206310272, 0.23104573786258698, 0.24734830856323242, 0.2636508643627167, 0.2799534201622009, 0.2962559759616852, 0.31255853176116943, 0.3288610875606537, 0.34516364336013794, 0.3614662289619446, 0.37776878476142883, 0.3940713405609131, 0.41037389636039734, 0.4266764521598816, 0.44297900795936584, 0.4592815637588501, 0.47558414936065674, 0.4918866753578186, 0.5081892609596252, 0.5244917869567871, 0.5407943725585938]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 7.0, 16.0, 9.0, 22.0, 23.0, 18.0, 29.0, 44.0, 50.0, 76.0, 78.0, 117.0, 148.0, 211.0, 340.0, 592.0, 1107.0, 2040.0, 4275.0, 9991.0, 35713.0, 271161.0, 597278.0, 94354.0, 17623.0, 6383.0, 2958.0, 1480.0, 861.0, 481.0, 310.0, 199.0, 137.0, 107.0, 82.0, 49.0, 40.0, 37.0, 30.0, 9.0, 12.0, 10.0, 9.0, 5.0, 4.0, 8.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.18017578125, -0.17422103881835938, -0.16826629638671875, -0.16231155395507812, -0.1563568115234375, -0.15040206909179688, -0.14444732666015625, -0.13849258422851562, -0.132537841796875, -0.12658309936523438, -0.12062835693359375, -0.11467361450195312, -0.1087188720703125, -0.10276412963867188, -0.09680938720703125, -0.09085464477539062, -0.08489990234375, -0.07894515991210938, -0.07299041748046875, -0.06703567504882812, -0.0610809326171875, -0.055126190185546875, -0.04917144775390625, -0.043216705322265625, -0.037261962890625, -0.031307220458984375, -0.02535247802734375, -0.019397735595703125, -0.0134429931640625, -0.007488250732421875, -0.00153350830078125, 0.004421234130859375, 0.0103759765625, 0.016330718994140625, 0.02228546142578125, 0.028240203857421875, 0.0341949462890625, 0.040149688720703125, 0.04610443115234375, 0.052059173583984375, 0.058013916015625, 0.06396865844726562, 0.06992340087890625, 0.07587814331054688, 0.0818328857421875, 0.08778762817382812, 0.09374237060546875, 0.09969711303710938, 0.10565185546875, 0.11160659790039062, 0.11756134033203125, 0.12351608276367188, 0.1294708251953125, 0.13542556762695312, 0.14138031005859375, 0.14733505249023438, 0.153289794921875, 0.15924453735351562, 0.16519927978515625, 0.17115402221679688, 0.1771087646484375, 0.18306350708007812, 0.18901824951171875, 0.19497299194335938, 0.200927734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 9.0, 4.0, 9.0, 7.0, 15.0, 12.0, 18.0, 23.0, 26.0, 24.0, 33.0, 37.0, 33.0, 46.0, 35.0, 52.0, 32.0, 27.0, 37.0, 39.0, 50.0, 50.0, 31.0, 27.0, 44.0, 32.0, 28.0, 26.0, 30.0, 16.0, 24.0, 10.0, 10.0, 16.0, 16.0, 16.0, 12.0, 8.0, 5.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.346435546875, -0.3357048034667969, -0.32497406005859375, -0.3142433166503906, -0.3035125732421875, -0.2927818298339844, -0.28205108642578125, -0.2713203430175781, -0.260589599609375, -0.24985885620117188, -0.23912811279296875, -0.22839736938476562, -0.2176666259765625, -0.20693588256835938, -0.19620513916015625, -0.18547439575195312, -0.17474365234375, -0.16401290893554688, -0.15328216552734375, -0.14255142211914062, -0.1318206787109375, -0.12108993530273438, -0.11035919189453125, -0.09962844848632812, -0.088897705078125, -0.07816696166992188, -0.06743621826171875, -0.056705474853515625, -0.0459747314453125, -0.035243988037109375, -0.02451324462890625, -0.013782501220703125, -0.0030517578125, 0.007678985595703125, 0.01840972900390625, 0.029140472412109375, 0.0398712158203125, 0.050601959228515625, 0.06133270263671875, 0.07206344604492188, 0.082794189453125, 0.09352493286132812, 0.10425567626953125, 0.11498641967773438, 0.1257171630859375, 0.13644790649414062, 0.14717864990234375, 0.15790939331054688, 0.16864013671875, 0.17937088012695312, 0.19010162353515625, 0.20083236694335938, 0.2115631103515625, 0.22229385375976562, 0.23302459716796875, 0.24375534057617188, 0.254486083984375, 0.2652168273925781, 0.27594757080078125, 0.2866783142089844, 0.2974090576171875, 0.3081398010253906, 0.31887054443359375, 0.3296012878417969, 0.34033203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 5.0, 7.0, 13.0, 12.0, 20.0, 31.0, 29.0, 72.0, 111.0, 155.0, 273.0, 526.0, 1092.0, 2538.0, 7543.0, 32860.0, 302074.0, 608400.0, 72841.0, 12823.0, 3910.0, 1589.0, 682.0, 355.0, 212.0, 112.0, 84.0, 47.0, 37.0, 21.0, 19.0, 8.0, 12.0, 11.0, 8.0, 7.0, 3.0, 6.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1973876953125, -0.19178009033203125, -0.1861724853515625, -0.18056488037109375, -0.174957275390625, -0.16934967041015625, -0.1637420654296875, -0.15813446044921875, -0.15252685546875, -0.14691925048828125, -0.1413116455078125, -0.13570404052734375, -0.130096435546875, -0.12448883056640625, -0.1188812255859375, -0.11327362060546875, -0.107666015625, -0.10205841064453125, -0.0964508056640625, -0.09084320068359375, -0.085235595703125, -0.07962799072265625, -0.0740203857421875, -0.06841278076171875, -0.06280517578125, -0.05719757080078125, -0.0515899658203125, -0.04598236083984375, -0.040374755859375, -0.03476715087890625, -0.0291595458984375, -0.02355194091796875, -0.0179443359375, -0.01233673095703125, -0.0067291259765625, -0.00112152099609375, 0.004486083984375, 0.01009368896484375, 0.0157012939453125, 0.02130889892578125, 0.02691650390625, 0.03252410888671875, 0.0381317138671875, 0.04373931884765625, 0.049346923828125, 0.05495452880859375, 0.0605621337890625, 0.06616973876953125, 0.07177734375, 0.07738494873046875, 0.0829925537109375, 0.08860015869140625, 0.094207763671875, 0.09981536865234375, 0.1054229736328125, 0.11103057861328125, 0.11663818359375, 0.12224578857421875, 0.1278533935546875, 0.13346099853515625, 0.139068603515625, 0.14467620849609375, 0.1502838134765625, 0.15589141845703125, 0.1614990234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 7.0, 8.0, 16.0, 14.0, 16.0, 25.0, 31.0, 19.0, 41.0, 37.0, 32.0, 36.0, 51.0, 41.0, 46.0, 46.0, 50.0, 37.0, 55.0, 43.0, 29.0, 42.0, 39.0, 25.0, 38.0, 28.0, 16.0, 16.0, 21.0, 19.0, 12.0, 13.0, 8.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87890625, -0.8501434326171875, -0.821380615234375, -0.7926177978515625, -0.76385498046875, -0.7350921630859375, -0.706329345703125, -0.6775665283203125, -0.6488037109375, -0.6200408935546875, -0.591278076171875, -0.5625152587890625, -0.53375244140625, -0.5049896240234375, -0.476226806640625, -0.4474639892578125, -0.418701171875, -0.3899383544921875, -0.361175537109375, -0.3324127197265625, -0.30364990234375, -0.2748870849609375, -0.246124267578125, -0.2173614501953125, -0.1885986328125, -0.1598358154296875, -0.131072998046875, -0.1023101806640625, -0.07354736328125, -0.0447845458984375, -0.016021728515625, 0.0127410888671875, 0.04150390625, 0.0702667236328125, 0.099029541015625, 0.1277923583984375, 0.15655517578125, 0.1853179931640625, 0.214080810546875, 0.2428436279296875, 0.2716064453125, 0.3003692626953125, 0.329132080078125, 0.3578948974609375, 0.38665771484375, 0.4154205322265625, 0.444183349609375, 0.4729461669921875, 0.501708984375, 0.5304718017578125, 0.559234619140625, 0.5879974365234375, 0.61676025390625, 0.6455230712890625, 0.674285888671875, 0.7030487060546875, 0.7318115234375, 0.7605743408203125, 0.789337158203125, 0.8180999755859375, 0.84686279296875, 0.8756256103515625, 0.904388427734375, 0.9331512451171875, 0.9619140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 6.0, 12.0, 17.0, 18.0, 21.0, 32.0, 48.0, 64.0, 131.0, 135.0, 231.0, 397.0, 561.0, 975.0, 1697.0, 3064.0, 6274.0, 14968.0, 55552.0, 547880.0, 352632.0, 39258.0, 12368.0, 5457.0, 2729.0, 1543.0, 894.0, 570.0, 341.0, 203.0, 136.0, 89.0, 58.0, 55.0, 32.0, 31.0, 19.0, 16.0, 6.0, 6.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08355712890625, -0.08093738555908203, -0.07831764221191406, -0.0756978988647461, -0.07307815551757812, -0.07045841217041016, -0.06783866882324219, -0.06521892547607422, -0.06259918212890625, -0.05997943878173828, -0.05735969543457031, -0.054739952087402344, -0.052120208740234375, -0.049500465393066406, -0.04688072204589844, -0.04426097869873047, -0.0416412353515625, -0.03902149200439453, -0.03640174865722656, -0.033782005310058594, -0.031162261962890625, -0.028542518615722656, -0.025922775268554688, -0.02330303192138672, -0.02068328857421875, -0.01806354522705078, -0.015443801879882812, -0.012824058532714844, -0.010204315185546875, -0.007584571838378906, -0.0049648284912109375, -0.0023450851440429688, 0.000274658203125, 0.0028944015502929688, 0.0055141448974609375, 0.008133888244628906, 0.010753631591796875, 0.013373374938964844, 0.015993118286132812, 0.01861286163330078, 0.02123260498046875, 0.02385234832763672, 0.026472091674804688, 0.029091835021972656, 0.031711578369140625, 0.034331321716308594, 0.03695106506347656, 0.03957080841064453, 0.0421905517578125, 0.04481029510498047, 0.04743003845214844, 0.050049781799316406, 0.052669525146484375, 0.055289268493652344, 0.05790901184082031, 0.06052875518798828, 0.06314849853515625, 0.06576824188232422, 0.06838798522949219, 0.07100772857666016, 0.07362747192382812, 0.0762472152709961, 0.07886695861816406, 0.08148670196533203, 0.0841064453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 6.0, 5.0, 19.0, 31.0, 57.0, 114.0, 208.0, 212.0, 155.0, 72.0, 35.0, 26.0, 5.0, 13.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.389617919921875e-05, -6.177462637424469e-05, -5.965307354927063e-05, -5.753152072429657e-05, -5.540996789932251e-05, -5.328841507434845e-05, -5.116686224937439e-05, -4.904530942440033e-05, -4.692375659942627e-05, -4.480220377445221e-05, -4.268065094947815e-05, -4.055909812450409e-05, -3.843754529953003e-05, -3.631599247455597e-05, -3.419443964958191e-05, -3.207288682460785e-05, -2.995133399963379e-05, -2.782978117465973e-05, -2.570822834968567e-05, -2.358667552471161e-05, -2.146512269973755e-05, -1.934356987476349e-05, -1.722201704978943e-05, -1.5100464224815369e-05, -1.2978911399841309e-05, -1.0857358574867249e-05, -8.735805749893188e-06, -6.614252924919128e-06, -4.492700099945068e-06, -2.3711472749710083e-06, -2.4959444999694824e-07, 1.8719583749771118e-06, 3.993511199951172e-06, 6.115064024925232e-06, 8.236616849899292e-06, 1.0358169674873352e-05, 1.2479722499847412e-05, 1.4601275324821472e-05, 1.6722828149795532e-05, 1.8844380974769592e-05, 2.0965933799743652e-05, 2.3087486624717712e-05, 2.5209039449691772e-05, 2.7330592274665833e-05, 2.9452145099639893e-05, 3.157369792461395e-05, 3.369525074958801e-05, 3.581680357456207e-05, 3.793835639953613e-05, 4.005990922451019e-05, 4.218146204948425e-05, 4.430301487445831e-05, 4.642456769943237e-05, 4.854612052440643e-05, 5.066767334938049e-05, 5.278922617435455e-05, 5.491077899932861e-05, 5.703233182430267e-05, 5.9153884649276733e-05, 6.12754374742508e-05, 6.339699029922485e-05, 6.551854312419891e-05, 6.764009594917297e-05, 6.976164877414703e-05, 7.18832015991211e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 4.0, 6.0, 14.0, 9.0, 15.0, 40.0, 50.0, 46.0, 83.0, 106.0, 171.0, 216.0, 310.0, 412.0, 616.0, 1010.0, 1577.0, 2652.0, 4974.0, 10315.0, 27673.0, 115658.0, 534895.0, 267404.0, 49230.0, 15474.0, 6627.0, 3510.0, 1867.0, 1166.0, 763.0, 526.0, 354.0, 252.0, 159.0, 119.0, 83.0, 42.0, 33.0, 25.0, 22.0, 12.0, 10.0, 8.0, 5.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07073974609375, -0.0683603286743164, -0.06598091125488281, -0.06360149383544922, -0.061222076416015625, -0.05884265899658203, -0.05646324157714844, -0.054083824157714844, -0.05170440673828125, -0.049324989318847656, -0.04694557189941406, -0.04456615447998047, -0.042186737060546875, -0.03980731964111328, -0.03742790222167969, -0.035048484802246094, -0.0326690673828125, -0.030289649963378906, -0.027910232543945312, -0.02553081512451172, -0.023151397705078125, -0.02077198028564453, -0.018392562866210938, -0.016013145446777344, -0.01363372802734375, -0.011254310607910156, -0.008874893188476562, -0.006495475769042969, -0.004116058349609375, -0.0017366409301757812, 0.0006427764892578125, 0.0030221939086914062, 0.005401611328125, 0.007781028747558594, 0.010160446166992188, 0.012539863586425781, 0.014919281005859375, 0.01729869842529297, 0.019678115844726562, 0.022057533264160156, 0.02443695068359375, 0.026816368103027344, 0.029195785522460938, 0.03157520294189453, 0.033954620361328125, 0.03633403778076172, 0.03871345520019531, 0.041092872619628906, 0.0434722900390625, 0.045851707458496094, 0.04823112487792969, 0.05061054229736328, 0.052989959716796875, 0.05536937713623047, 0.05774879455566406, 0.060128211975097656, 0.06250762939453125, 0.06488704681396484, 0.06726646423339844, 0.06964588165283203, 0.07202529907226562, 0.07440471649169922, 0.07678413391113281, 0.0791635513305664, 0.08154296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 10.0, 26.0, 33.0, 71.0, 76.0, 112.0, 176.0, 161.0, 107.0, 89.0, 52.0, 22.0, 19.0, 12.0, 3.0, 6.0, 1.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.040985107421875, -0.03990435600280762, -0.038823604583740234, -0.03774285316467285, -0.03666210174560547, -0.035581350326538086, -0.0345005989074707, -0.03341984748840332, -0.03233909606933594, -0.031258344650268555, -0.030177593231201172, -0.02909684181213379, -0.028016090393066406, -0.026935338973999023, -0.02585458755493164, -0.024773836135864258, -0.023693084716796875, -0.022612333297729492, -0.02153158187866211, -0.020450830459594727, -0.019370079040527344, -0.01828932762145996, -0.017208576202392578, -0.016127824783325195, -0.015047073364257812, -0.01396632194519043, -0.012885570526123047, -0.011804819107055664, -0.010724067687988281, -0.009643316268920898, -0.008562564849853516, -0.007481813430786133, -0.00640106201171875, -0.005320310592651367, -0.004239559173583984, -0.0031588077545166016, -0.0020780563354492188, -0.000997304916381836, 8.344650268554688e-05, 0.0011641979217529297, 0.0022449493408203125, 0.0033257007598876953, 0.004406452178955078, 0.005487203598022461, 0.006567955017089844, 0.0076487064361572266, 0.00872945785522461, 0.009810209274291992, 0.010890960693359375, 0.011971712112426758, 0.01305246353149414, 0.014133214950561523, 0.015213966369628906, 0.01629471778869629, 0.017375469207763672, 0.018456220626831055, 0.019536972045898438, 0.02061772346496582, 0.021698474884033203, 0.022779226303100586, 0.02385997772216797, 0.02494072914123535, 0.026021480560302734, 0.027102231979370117, 0.0281829833984375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 6.0, 5.0, 8.0, 6.0, 9.0, 12.0, 16.0, 18.0, 30.0, 51.0, 45.0, 42.0, 56.0, 60.0, 67.0, 69.0, 81.0, 62.0, 52.0, 49.0, 46.0, 35.0, 29.0, 29.0, 17.0, 29.0, 13.0, 12.0, 15.0, 8.0, 9.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4364004135131836, -0.4223867654800415, -0.4083731174468994, -0.3943594694137573, -0.38034582138061523, -0.36633217334747314, -0.35231852531433105, -0.33830487728118896, -0.3242912292480469, -0.3102775812149048, -0.2962639331817627, -0.2822502851486206, -0.2682366371154785, -0.2542229890823364, -0.24020932614803314, -0.22619567811489105, -0.21218201518058777, -0.19816836714744568, -0.1841547191143036, -0.1701410710811615, -0.1561274230480194, -0.14211377501487732, -0.12810011208057404, -0.11408646404743195, -0.10007281601428986, -0.08605916798114777, -0.07204551994800568, -0.05803186446428299, -0.0440182164311409, -0.03000456839799881, -0.015990912914276123, -0.001977264881134033, 0.012036412954330444, 0.026050062850117683, 0.04006371274590492, 0.05407736450433731, 0.0680910125374794, 0.08210466057062149, 0.09611831605434418, 0.11013196408748627, 0.12414561212062836, 0.13815926015377045, 0.15217290818691254, 0.16618657112121582, 0.1802002191543579, 0.1942138671875, 0.2082275152206421, 0.22224116325378418, 0.23625481128692627, 0.25026845932006836, 0.26428210735321045, 0.27829575538635254, 0.29230940341949463, 0.3063230514526367, 0.3203366994857788, 0.3343503475189209, 0.348363995552063, 0.3623776435852051, 0.37639129161834717, 0.39040493965148926, 0.40441858768463135, 0.41843223571777344, 0.4324458837509155, 0.4464595317840576, 0.4604732096195221]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 6.0, 2.0, 1.0, 3.0, 12.0, 12.0, 8.0, 10.0, 19.0, 25.0, 19.0, 25.0, 21.0, 34.0, 45.0, 31.0, 42.0, 42.0, 42.0, 42.0, 36.0, 33.0, 37.0, 42.0, 44.0, 41.0, 42.0, 34.0, 25.0, 38.0, 28.0, 28.0, 15.0, 16.0, 16.0, 17.0, 16.0, 9.0, 7.0, 13.0, 6.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3180714547634125, -0.30745241045951843, -0.2968333661556244, -0.28621432185173035, -0.2755952775478363, -0.26497626304626465, -0.2543572187423706, -0.24373817443847656, -0.23311913013458252, -0.22250008583068848, -0.21188104152679443, -0.2012619972229004, -0.19064296782016754, -0.1800239235162735, -0.16940487921237946, -0.1587858498096466, -0.14816679060459137, -0.13754774630069733, -0.12692870199680328, -0.11630966514348984, -0.10569062829017639, -0.09507158398628235, -0.0844525396823883, -0.07383350282907486, -0.06321445852518082, -0.05259541794657707, -0.04197637736797333, -0.031357333064079285, -0.02073829248547554, -0.010119251906871796, 0.0004997923970222473, 0.011118829250335693, 0.021737873554229736, 0.03235691413283348, 0.042975954711437225, 0.05359499901533127, 0.06421403586864471, 0.07483308017253876, 0.0854521244764328, 0.09607116132974625, 0.10669020563364029, 0.11730924993753433, 0.12792828679084778, 0.13854733109474182, 0.14916637539863586, 0.1597854197025299, 0.17040446400642395, 0.1810234934091568, 0.19164253771305084, 0.20226158201694489, 0.21288062632083893, 0.22349965572357178, 0.23411870002746582, 0.24473774433135986, 0.2553567886352539, 0.26597583293914795, 0.276594877243042, 0.28721392154693604, 0.2978329658508301, 0.3084520101547241, 0.31907105445861816, 0.3296900987625122, 0.34030914306640625, 0.3509281575679779, 0.36154720187187195]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 10.0, 11.0, 25.0, 20.0, 35.0, 48.0, 66.0, 109.0, 177.0, 261.0, 462.0, 744.0, 1265.0, 2453.0, 4540.0, 9227.0, 20377.0, 49400.0, 171457.0, 495105.0, 196204.0, 54076.0, 21599.0, 9909.0, 4960.0, 2508.0, 1429.0, 734.0, 505.0, 283.0, 196.0, 127.0, 69.0, 47.0, 35.0, 29.0, 17.0, 11.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62060546875, -0.6021041870117188, -0.5836029052734375, -0.5651016235351562, -0.546600341796875, -0.5280990600585938, -0.5095977783203125, -0.49109649658203125, -0.47259521484375, -0.45409393310546875, -0.4355926513671875, -0.41709136962890625, -0.398590087890625, -0.38008880615234375, -0.3615875244140625, -0.34308624267578125, -0.3245849609375, -0.30608367919921875, -0.2875823974609375, -0.26908111572265625, -0.250579833984375, -0.23207855224609375, -0.2135772705078125, -0.19507598876953125, -0.17657470703125, -0.15807342529296875, -0.1395721435546875, -0.12107086181640625, -0.102569580078125, -0.08406829833984375, -0.0655670166015625, -0.04706573486328125, -0.028564453125, -0.01006317138671875, 0.0084381103515625, 0.02693939208984375, 0.045440673828125, 0.06394195556640625, 0.0824432373046875, 0.10094451904296875, 0.11944580078125, 0.13794708251953125, 0.1564483642578125, 0.17494964599609375, 0.193450927734375, 0.21195220947265625, 0.2304534912109375, 0.24895477294921875, 0.2674560546875, 0.28595733642578125, 0.3044586181640625, 0.32295989990234375, 0.341461181640625, 0.35996246337890625, 0.3784637451171875, 0.39696502685546875, 0.41546630859375, 0.43396759033203125, 0.4524688720703125, 0.47097015380859375, 0.489471435546875, 0.5079727172851562, 0.5264739990234375, 0.5449752807617188, 0.5634765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 10.0, 14.0, 11.0, 14.0, 17.0, 17.0, 22.0, 29.0, 39.0, 28.0, 41.0, 50.0, 44.0, 54.0, 33.0, 45.0, 46.0, 53.0, 30.0, 44.0, 43.0, 38.0, 38.0, 33.0, 32.0, 25.0, 22.0, 17.0, 15.0, 20.0, 10.0, 10.0, 7.0, 6.0, 11.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.5205078125, -0.5, -0.4794921875, -0.458984375, -0.4384765625, -0.41796875, -0.3974609375, -0.376953125, -0.3564453125, -0.3359375, -0.3154296875, -0.294921875, -0.2744140625, -0.25390625, -0.2333984375, -0.212890625, -0.1923828125, -0.171875, -0.1513671875, -0.130859375, -0.1103515625, -0.08984375, -0.0693359375, -0.048828125, -0.0283203125, -0.0078125, 0.0126953125, 0.033203125, 0.0537109375, 0.07421875, 0.0947265625, 0.115234375, 0.1357421875, 0.15625, 0.1767578125, 0.197265625, 0.2177734375, 0.23828125, 0.2587890625, 0.279296875, 0.2998046875, 0.3203125, 0.3408203125, 0.361328125, 0.3818359375, 0.40234375, 0.4228515625, 0.443359375, 0.4638671875, 0.484375, 0.5048828125, 0.525390625, 0.5458984375, 0.56640625, 0.5869140625, 0.607421875, 0.6279296875, 0.6484375, 0.6689453125, 0.689453125, 0.7099609375, 0.73046875, 0.7509765625, 0.771484375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 17.0, 15.0, 25.0, 32.0, 41.0, 58.0, 78.0, 148.0, 148.0, 263.0, 390.0, 658.0, 977.0, 1738.0, 3066.0, 6078.0, 11958.0, 25494.0, 62393.0, 206549.0, 459674.0, 169134.0, 53908.0, 22518.0, 10761.0, 5313.0, 2870.0, 1574.0, 926.0, 563.0, 353.0, 256.0, 160.0, 102.0, 89.0, 61.0, 44.0, 42.0, 25.0, 18.0, 9.0, 10.0, 8.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.56494140625, -0.5498466491699219, -0.5347518920898438, -0.5196571350097656, -0.5045623779296875, -0.4894676208496094, -0.47437286376953125, -0.4592781066894531, -0.444183349609375, -0.4290885925292969, -0.41399383544921875, -0.3988990783691406, -0.3838043212890625, -0.3687095642089844, -0.35361480712890625, -0.3385200500488281, -0.32342529296875, -0.3083305358886719, -0.29323577880859375, -0.2781410217285156, -0.2630462646484375, -0.24795150756835938, -0.23285675048828125, -0.21776199340820312, -0.202667236328125, -0.18757247924804688, -0.17247772216796875, -0.15738296508789062, -0.1422882080078125, -0.12719345092773438, -0.11209869384765625, -0.09700393676757812, -0.0819091796875, -0.06681442260742188, -0.05171966552734375, -0.036624908447265625, -0.0215301513671875, -0.006435394287109375, 0.00865936279296875, 0.023754119873046875, 0.038848876953125, 0.053943634033203125, 0.06903839111328125, 0.08413314819335938, 0.0992279052734375, 0.11432266235351562, 0.12941741943359375, 0.14451217651367188, 0.15960693359375, 0.17470169067382812, 0.18979644775390625, 0.20489120483398438, 0.2199859619140625, 0.23508071899414062, 0.25017547607421875, 0.2652702331542969, 0.280364990234375, 0.2954597473144531, 0.31055450439453125, 0.3256492614746094, 0.3407440185546875, 0.3558387756347656, 0.37093353271484375, 0.3860282897949219, 0.401123046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 11.0, 9.0, 8.0, 12.0, 7.0, 16.0, 16.0, 14.0, 22.0, 20.0, 20.0, 25.0, 33.0, 36.0, 37.0, 32.0, 51.0, 49.0, 43.0, 46.0, 47.0, 40.0, 57.0, 44.0, 27.0, 32.0, 31.0, 29.0, 31.0, 23.0, 18.0, 20.0, 21.0, 14.0, 13.0, 5.0, 14.0, 1.0, 8.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7421875, -0.7194061279296875, -0.696624755859375, -0.6738433837890625, -0.65106201171875, -0.6282806396484375, -0.605499267578125, -0.5827178955078125, -0.5599365234375, -0.5371551513671875, -0.514373779296875, -0.4915924072265625, -0.46881103515625, -0.4460296630859375, -0.423248291015625, -0.4004669189453125, -0.377685546875, -0.3549041748046875, -0.332122802734375, -0.3093414306640625, -0.28656005859375, -0.2637786865234375, -0.240997314453125, -0.2182159423828125, -0.1954345703125, -0.1726531982421875, -0.149871826171875, -0.1270904541015625, -0.10430908203125, -0.0815277099609375, -0.058746337890625, -0.0359649658203125, -0.01318359375, 0.0095977783203125, 0.032379150390625, 0.0551605224609375, 0.07794189453125, 0.1007232666015625, 0.123504638671875, 0.1462860107421875, 0.1690673828125, 0.1918487548828125, 0.214630126953125, 0.2374114990234375, 0.26019287109375, 0.2829742431640625, 0.305755615234375, 0.3285369873046875, 0.351318359375, 0.3740997314453125, 0.396881103515625, 0.4196624755859375, 0.44244384765625, 0.4652252197265625, 0.488006591796875, 0.5107879638671875, 0.5335693359375, 0.5563507080078125, 0.579132080078125, 0.6019134521484375, 0.62469482421875, 0.6474761962890625, 0.670257568359375, 0.6930389404296875, 0.7158203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 6.0, 5.0, 11.0, 12.0, 13.0, 18.0, 23.0, 47.0, 50.0, 72.0, 102.0, 157.0, 239.0, 309.0, 461.0, 677.0, 949.0, 1396.0, 2064.0, 3209.0, 5104.0, 8036.0, 12909.0, 21166.0, 35881.0, 59621.0, 99236.0, 152250.0, 246128.0, 150434.0, 98114.0, 58892.0, 34750.0, 20994.0, 12792.0, 7710.0, 4933.0, 3132.0, 2198.0, 1403.0, 933.0, 651.0, 418.0, 307.0, 217.0, 154.0, 97.0, 74.0, 51.0, 57.0, 31.0, 21.0, 18.0, 9.0, 13.0, 4.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.06610107421875, -0.06406593322753906, -0.062030792236328125, -0.05999565124511719, -0.05796051025390625, -0.05592536926269531, -0.053890228271484375, -0.05185508728027344, -0.0498199462890625, -0.04778480529785156, -0.045749664306640625, -0.04371452331542969, -0.04167938232421875, -0.03964424133300781, -0.037609100341796875, -0.03557395935058594, -0.033538818359375, -0.03150367736816406, -0.029468536376953125, -0.027433395385742188, -0.02539825439453125, -0.023363113403320312, -0.021327972412109375, -0.019292831420898438, -0.0172576904296875, -0.015222549438476562, -0.013187408447265625, -0.011152267456054688, -0.00911712646484375, -0.0070819854736328125, -0.005046844482421875, -0.0030117034912109375, -0.0009765625, 0.0010585784912109375, 0.003093719482421875, 0.0051288604736328125, 0.00716400146484375, 0.009199142456054688, 0.011234283447265625, 0.013269424438476562, 0.0153045654296875, 0.017339706420898438, 0.019374847412109375, 0.021409988403320312, 0.02344512939453125, 0.025480270385742188, 0.027515411376953125, 0.029550552368164062, 0.031585693359375, 0.03362083435058594, 0.035655975341796875, 0.03769111633300781, 0.03972625732421875, 0.04176139831542969, 0.043796539306640625, 0.04583168029785156, 0.0478668212890625, 0.04990196228027344, 0.051937103271484375, 0.05397224426269531, 0.05600738525390625, 0.05804252624511719, 0.060077667236328125, 0.06211280822753906, 0.06414794921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 14.0, 9.0, 20.0, 18.0, 31.0, 20.0, 36.0, 40.0, 43.0, 55.0, 43.0, 53.0, 90.0, 88.0, 66.0, 57.0, 49.0, 35.0, 36.0, 32.0, 33.0, 28.0, 18.0, 14.0, 15.0, 8.0, 9.0, 9.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0], "bins": [-3.2007694244384766e-05, -3.1186267733573914e-05, -3.036484122276306e-05, -2.954341471195221e-05, -2.8721988201141357e-05, -2.7900561690330505e-05, -2.7079135179519653e-05, -2.62577086687088e-05, -2.543628215789795e-05, -2.4614855647087097e-05, -2.3793429136276245e-05, -2.2972002625465393e-05, -2.215057611465454e-05, -2.132914960384369e-05, -2.0507723093032837e-05, -1.9686296582221985e-05, -1.8864870071411133e-05, -1.804344356060028e-05, -1.722201704978943e-05, -1.6400590538978577e-05, -1.5579164028167725e-05, -1.4757737517356873e-05, -1.393631100654602e-05, -1.3114884495735168e-05, -1.2293457984924316e-05, -1.1472031474113464e-05, -1.0650604963302612e-05, -9.82917845249176e-06, -9.007751941680908e-06, -8.186325430870056e-06, -7.364898920059204e-06, -6.543472409248352e-06, -5.7220458984375e-06, -4.900619387626648e-06, -4.079192876815796e-06, -3.257766366004944e-06, -2.436339855194092e-06, -1.6149133443832397e-06, -7.934868335723877e-07, 2.7939677238464355e-08, 8.493661880493164e-07, 1.6707926988601685e-06, 2.4922192096710205e-06, 3.3136457204818726e-06, 4.135072231292725e-06, 4.956498742103577e-06, 5.777925252914429e-06, 6.599351763725281e-06, 7.420778274536133e-06, 8.242204785346985e-06, 9.063631296157837e-06, 9.885057806968689e-06, 1.0706484317779541e-05, 1.1527910828590393e-05, 1.2349337339401245e-05, 1.3170763850212097e-05, 1.399219036102295e-05, 1.4813616871833801e-05, 1.5635043382644653e-05, 1.6456469893455505e-05, 1.7277896404266357e-05, 1.809932291507721e-05, 1.892074942588806e-05, 1.9742175936698914e-05, 2.0563602447509766e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 9.0, 6.0, 18.0, 13.0, 30.0, 32.0, 40.0, 57.0, 71.0, 126.0, 204.0, 365.0, 564.0, 1035.0, 1839.0, 3378.0, 6553.0, 13733.0, 31298.0, 78085.0, 205525.0, 402071.0, 181324.0, 69078.0, 27565.0, 12500.0, 5970.0, 3051.0, 1681.0, 910.0, 535.0, 284.0, 191.0, 144.0, 62.0, 57.0, 40.0, 31.0, 27.0, 8.0, 4.0, 9.0, 7.0, 11.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1416015625, -0.1372356414794922, -0.13286972045898438, -0.12850379943847656, -0.12413787841796875, -0.11977195739746094, -0.11540603637695312, -0.11104011535644531, -0.1066741943359375, -0.10230827331542969, -0.09794235229492188, -0.09357643127441406, -0.08921051025390625, -0.08484458923339844, -0.08047866821289062, -0.07611274719238281, -0.071746826171875, -0.06738090515136719, -0.06301498413085938, -0.05864906311035156, -0.05428314208984375, -0.04991722106933594, -0.045551300048828125, -0.04118537902832031, -0.0368194580078125, -0.03245353698730469, -0.028087615966796875, -0.023721694946289062, -0.01935577392578125, -0.014989852905273438, -0.010623931884765625, -0.0062580108642578125, -0.00189208984375, 0.0024738311767578125, 0.006839752197265625, 0.011205673217773438, 0.01557159423828125, 0.019937515258789062, 0.024303436279296875, 0.028669357299804688, 0.0330352783203125, 0.03740119934082031, 0.041767120361328125, 0.04613304138183594, 0.05049896240234375, 0.05486488342285156, 0.059230804443359375, 0.06359672546386719, 0.067962646484375, 0.07232856750488281, 0.07669448852539062, 0.08106040954589844, 0.08542633056640625, 0.08979225158691406, 0.09415817260742188, 0.09852409362792969, 0.1028900146484375, 0.10725593566894531, 0.11162185668945312, 0.11598777770996094, 0.12035369873046875, 0.12471961975097656, 0.12908554077148438, 0.1334514617919922, 0.1378173828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 4.0, 14.0, 14.0, 12.0, 14.0, 21.0, 38.0, 31.0, 53.0, 40.0, 67.0, 74.0, 90.0, 132.0, 71.0, 72.0, 48.0, 37.0, 45.0, 23.0, 18.0, 24.0, 19.0, 5.0, 6.0, 5.0, 2.0, 6.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.111572265625, -0.10848617553710938, -0.10540008544921875, -0.10231399536132812, -0.0992279052734375, -0.09614181518554688, -0.09305572509765625, -0.08996963500976562, -0.086883544921875, -0.08379745483398438, -0.08071136474609375, -0.07762527465820312, -0.0745391845703125, -0.07145309448242188, -0.06836700439453125, -0.06528091430664062, -0.06219482421875, -0.059108734130859375, -0.05602264404296875, -0.052936553955078125, -0.0498504638671875, -0.046764373779296875, -0.04367828369140625, -0.040592193603515625, -0.037506103515625, -0.034420013427734375, -0.03133392333984375, -0.028247833251953125, -0.0251617431640625, -0.022075653076171875, -0.01898956298828125, -0.015903472900390625, -0.0128173828125, -0.009731292724609375, -0.00664520263671875, -0.003559112548828125, -0.0004730224609375, 0.002613067626953125, 0.00569915771484375, 0.008785247802734375, 0.011871337890625, 0.014957427978515625, 0.01804351806640625, 0.021129608154296875, 0.0242156982421875, 0.027301788330078125, 0.03038787841796875, 0.033473968505859375, 0.03656005859375, 0.039646148681640625, 0.04273223876953125, 0.045818328857421875, 0.0489044189453125, 0.051990509033203125, 0.05507659912109375, 0.058162689208984375, 0.061248779296875, 0.06433486938476562, 0.06742095947265625, 0.07050704956054688, 0.0735931396484375, 0.07667922973632812, 0.07976531982421875, 0.08285140991210938, 0.0859375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 11.0, 18.0, 30.0, 39.0, 47.0, 88.0, 112.0, 129.0, 138.0, 132.0, 85.0, 58.0, 40.0, 25.0, 18.0, 6.0, 4.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7422631978988647, -1.6838864088058472, -1.6255096197128296, -1.567132830619812, -1.5087560415267944, -1.4503792524337769, -1.3920024633407593, -1.3336256742477417, -1.2752488851547241, -1.2168720960617065, -1.158495306968689, -1.1001185178756714, -1.0417417287826538, -0.9833649396896362, -0.9249881505966187, -0.8666113615036011, -0.8082345128059387, -0.7498577237129211, -0.6914809346199036, -0.633104145526886, -0.5747273564338684, -0.516350507736206, -0.45797374844551086, -0.3995969593524933, -0.3412201702594757, -0.28284338116645813, -0.22446659207344055, -0.16608978807926178, -0.1077129989862442, -0.04933619499206543, 0.009040594100952148, 0.06741738319396973, 0.1257941722869873, 0.18417096138000488, 0.24254775047302246, 0.30092453956604004, 0.3593013286590576, 0.4176781475543976, 0.47605493664741516, 0.5344316959381104, 0.5928084850311279, 0.6511852741241455, 0.7095620632171631, 0.7679388523101807, 0.8263156414031982, 0.8846924304962158, 0.9430692195892334, 1.001446008682251, 1.0598227977752686, 1.1181995868682861, 1.1765763759613037, 1.2349531650543213, 1.2933299541473389, 1.3517067432403564, 1.410083532333374, 1.4684603214263916, 1.5268372297286987, 1.5852140188217163, 1.6435908079147339, 1.7019675970077515, 1.760344386100769, 1.8187211751937866, 1.8770979642868042, 1.9354747533798218, 1.9938515424728394]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 7.0, 6.0, 4.0, 7.0, 9.0, 9.0, 12.0, 15.0, 10.0, 17.0, 23.0, 25.0, 27.0, 22.0, 34.0, 30.0, 37.0, 26.0, 47.0, 37.0, 38.0, 57.0, 37.0, 42.0, 58.0, 41.0, 48.0, 42.0, 33.0, 21.0, 23.0, 25.0, 22.0, 21.0, 17.0, 14.0, 16.0, 9.0, 7.0, 9.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0], "bins": [-1.433144211769104, -1.3912572860717773, -1.3493704795837402, -1.3074835538864136, -1.2655967473983765, -1.2237098217010498, -1.1818230152130127, -1.139936089515686, -1.098049283027649, -1.0561623573303223, -1.0142755508422852, -0.9723886847496033, -0.9305018186569214, -0.8886149525642395, -0.8467280864715576, -0.804841160774231, -0.7629542946815491, -0.7210674285888672, -0.6791805624961853, -0.6372936964035034, -0.5954068303108215, -0.5535199642181396, -0.511633038520813, -0.4697462022304535, -0.4278593361377716, -0.3859724700450897, -0.34408560395240784, -0.30219870805740356, -0.2603118419647217, -0.218424990773201, -0.1765381097793579, -0.13465124368667603, -0.09276437759399414, -0.05087750777602196, -0.008990637958049774, 0.03289623558521271, 0.07478310167789459, 0.11666996777057648, 0.15855684876441956, 0.20044371485710144, 0.24233058094978333, 0.2842174470424652, 0.3261043131351471, 0.36799120903015137, 0.40987807512283325, 0.45176494121551514, 0.493651807308197, 0.5355386734008789, 0.5774255394935608, 0.6193124055862427, 0.6611992716789246, 0.7030861377716064, 0.7449730038642883, 0.7868598699569702, 0.8287467956542969, 0.870633602142334, 0.9125205278396606, 0.9544073939323425, 0.9962942600250244, 1.038181185722351, 1.0800679922103882, 1.1219549179077148, 1.163841724395752, 1.2057286500930786, 1.2476154565811157]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 4.0, 11.0, 10.0, 6.0, 10.0, 22.0, 21.0, 32.0, 27.0, 34.0, 72.0, 80.0, 91.0, 137.0, 150.0, 212.0, 300.0, 430.0, 568.0, 956.0, 1556.0, 2443.0, 5537.0, 1030562.0, 2488.0, 1575.0, 912.0, 646.0, 448.0, 310.0, 232.0, 168.0, 130.0, 84.0, 81.0, 72.0, 24.0, 40.0, 27.0, 26.0, 15.0, 13.0, 12.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6053814888000488, -1.5552562475204468, -1.5051310062408447, -1.4550058841705322, -1.4048806428909302, -1.3547554016113281, -1.304630160331726, -1.254504919052124, -1.204379677772522, -1.15425443649292, -1.1041291952133179, -1.0540039539337158, -1.0038788318634033, -0.9537535905838013, -0.9036283493041992, -0.8535031080245972, -0.8033779263496399, -0.7532526850700378, -0.7031275033950806, -0.6530022621154785, -0.6028770208358765, -0.5527517795562744, -0.5026265978813171, -0.4525013566017151, -0.4023761451244354, -0.35225093364715576, -0.3021256923675537, -0.25200048089027405, -0.2018752545118332, -0.15175002813339233, -0.10162481665611267, -0.05149957537651062, -0.001374363899230957, 0.0487508587539196, 0.09887608140707016, 0.14900130033493042, 0.19912652671337128, 0.24925175309181213, 0.2993769645690918, 0.34950220584869385, 0.3996274173259735, 0.4497526288032532, 0.4998778700828552, 0.5500030517578125, 0.6001282930374146, 0.6502535343170166, 0.7003787755966187, 0.7505040168762207, 0.800629198551178, 0.85075443983078, 0.9008796215057373, 0.9510048627853394, 1.0011301040649414, 1.0512553453445435, 1.1013805866241455, 1.151505708694458, 1.20163094997406, 1.251756191253662, 1.3018814325332642, 1.3520066738128662, 1.4021317958831787, 1.4522570371627808, 1.5023822784423828, 1.5525075197219849, 1.602632761001587]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 11.0, 10.0, 12.0, 46.0, 89.0, 222.0, 887.0, 3409.0, 16280.0, 51430152.0, 15165.0, 3631.0, 920.0, 274.0, 113.0, 52.0, 29.0, 8.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.324853420257568, -7.037331581115723, -6.749809741973877, -6.462287902832031, -6.1747660636901855, -5.88724422454834, -5.599722862243652, -5.312200546264648, -5.024679183959961, -4.737157344818115, -4.4496355056762695, -4.162113666534424, -3.874591827392578, -3.5870699882507324, -3.299548387527466, -3.01202654838562, -2.7245044708251953, -2.4369826316833496, -2.149460792541504, -1.8619390726089478, -1.574417233467102, -1.2868953943252563, -0.9993736743927002, -0.7118518352508545, -0.4243299961090088, -0.13680818676948547, 0.15071362257003784, 0.43823540210723877, 0.7257572412490845, 1.0132790803909302, 1.3008008003234863, 1.588322639465332, 1.875844955444336, 2.1633667945861816, 2.4508886337280273, 2.738410472869873, 3.0259323120117188, 3.3134541511535645, 3.600975751876831, 3.8884975910186768, 4.176019668579102, 4.463541507720947, 4.751063346862793, 5.038585186004639, 5.326107025146484, 5.61362886428833, 5.901150703430176, 6.188672065734863, 6.476193904876709, 6.763715744018555, 7.0512375831604, 7.338759422302246, 7.626281261444092, 7.9138031005859375, 8.201324462890625, 8.488846778869629, 8.776368141174316, 9.063889503479004, 9.351411819458008, 9.638933181762695, 9.9264554977417, 10.213976860046387, 10.50149917602539, 10.789020538330078, 11.076542854309082]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 2.0, 8.0, 3.0, 11.0, 10.0, 13.0, 31.0, 29.0, 45.0, 66.0, 104.0, 118.0, 194.0, 278.0, 442.0, 674.0, 1141.0, 1876.0, 3151.0, 5407.0, 9585.0, 17501.0, 32572.0, 64593.0, 131992.0, 271405.0, 543741.0, 3049914.0, 1323754.0, 416783.0, 208115.0, 101063.0, 49569.0, 25241.0, 13484.0, 7665.0, 4306.0, 2638.0, 1489.0, 883.0, 525.0, 356.0, 236.0, 121.0, 94.0, 66.0, 34.0, 27.0, 20.0, 22.0, 13.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.470703125, -0.4559059143066406, -0.44110870361328125, -0.4263114929199219, -0.4115142822265625, -0.3967170715332031, -0.38191986083984375, -0.3671226501464844, -0.352325439453125, -0.3375282287597656, -0.32273101806640625, -0.3079338073730469, -0.2931365966796875, -0.2783393859863281, -0.26354217529296875, -0.24874496459960938, -0.23394775390625, -0.21915054321289062, -0.20435333251953125, -0.18955612182617188, -0.1747589111328125, -0.15996170043945312, -0.14516448974609375, -0.13036727905273438, -0.115570068359375, -0.10077285766601562, -0.08597564697265625, -0.07117843627929688, -0.0563812255859375, -0.041584014892578125, -0.02678680419921875, -0.011989593505859375, 0.0028076171875, 0.017604827880859375, 0.03240203857421875, 0.047199249267578125, 0.0619964599609375, 0.07679367065429688, 0.09159088134765625, 0.10638809204101562, 0.121185302734375, 0.13598251342773438, 0.15077972412109375, 0.16557693481445312, 0.1803741455078125, 0.19517135620117188, 0.20996856689453125, 0.22476577758789062, 0.23956298828125, 0.2543601989746094, 0.26915740966796875, 0.2839546203613281, 0.2987518310546875, 0.3135490417480469, 0.32834625244140625, 0.3431434631347656, 0.357940673828125, 0.3727378845214844, 0.38753509521484375, 0.4023323059082031, 0.4171295166015625, 0.4319267272949219, 0.44672393798828125, 0.4615211486816406, 0.476318359375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 12.0, 11.0, 9.0, 18.0, 26.0, 17.0, 25.0, 37.0, 23.0, 40.0, 41.0, 49.0, 50.0, 55.0, 269.0, 774.0, 118.0, 53.0, 59.0, 38.0, 41.0, 30.0, 42.0, 23.0, 25.0, 22.0, 15.0, 18.0, 18.0, 12.0, 12.0, 9.0, 3.0, 6.0, 4.0, 1.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.40234375, -4.273773193359375, -4.14520263671875, -4.016632080078125, -3.8880615234375, -3.759490966796875, -3.63092041015625, -3.502349853515625, -3.373779296875, -3.245208740234375, -3.11663818359375, -2.988067626953125, -2.8594970703125, -2.730926513671875, -2.60235595703125, -2.473785400390625, -2.34521484375, -2.216644287109375, -2.08807373046875, -1.959503173828125, -1.8309326171875, -1.702362060546875, -1.57379150390625, -1.445220947265625, -1.316650390625, -1.188079833984375, -1.05950927734375, -0.930938720703125, -0.8023681640625, -0.673797607421875, -0.54522705078125, -0.416656494140625, -0.2880859375, -0.159515380859375, -0.03094482421875, 0.097625732421875, 0.2261962890625, 0.354766845703125, 0.48333740234375, 0.611907958984375, 0.740478515625, 0.869049072265625, 0.99761962890625, 1.126190185546875, 1.2547607421875, 1.383331298828125, 1.51190185546875, 1.640472412109375, 1.76904296875, 1.897613525390625, 2.02618408203125, 2.154754638671875, 2.2833251953125, 2.411895751953125, 2.54046630859375, 2.669036865234375, 2.797607421875, 2.926177978515625, 3.05474853515625, 3.183319091796875, 3.3118896484375, 3.440460205078125, 3.56903076171875, 3.697601318359375, 3.826171875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 9.0, 15.0, 18.0, 34.0, 51.0, 75.0, 126.0, 201.0, 294.0, 532.0, 866.0, 1527.0, 2373.0, 4281.0, 7396.0, 13462.0, 23903.0, 44830.0, 81635.0, 144652.0, 240551.0, 363375.0, 760659.0, 3274336.0, 510165.0, 327723.0, 211122.0, 124675.0, 68565.0, 37387.0, 20296.0, 11235.0, 6120.0, 3581.0, 2081.0, 1226.0, 780.0, 459.0, 293.0, 180.0, 114.0, 72.0, 62.0, 39.0, 26.0, 14.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.262939453125, -0.25481414794921875, -0.2466888427734375, -0.23856353759765625, -0.230438232421875, -0.22231292724609375, -0.2141876220703125, -0.20606231689453125, -0.19793701171875, -0.18981170654296875, -0.1816864013671875, -0.17356109619140625, -0.165435791015625, -0.15731048583984375, -0.1491851806640625, -0.14105987548828125, -0.1329345703125, -0.12480926513671875, -0.1166839599609375, -0.10855865478515625, -0.100433349609375, -0.09230804443359375, -0.0841827392578125, -0.07605743408203125, -0.06793212890625, -0.05980682373046875, -0.0516815185546875, -0.04355621337890625, -0.035430908203125, -0.02730560302734375, -0.0191802978515625, -0.01105499267578125, -0.0029296875, 0.00519561767578125, 0.0133209228515625, 0.02144622802734375, 0.029571533203125, 0.03769683837890625, 0.0458221435546875, 0.05394744873046875, 0.06207275390625, 0.07019805908203125, 0.0783233642578125, 0.08644866943359375, 0.094573974609375, 0.10269927978515625, 0.1108245849609375, 0.11894989013671875, 0.1270751953125, 0.13520050048828125, 0.1433258056640625, 0.15145111083984375, 0.159576416015625, 0.16770172119140625, 0.1758270263671875, 0.18395233154296875, 0.19207763671875, 0.20020294189453125, 0.2083282470703125, 0.21645355224609375, 0.224578857421875, 0.23270416259765625, 0.2408294677734375, 0.24895477294921875, 0.257080078125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 10.0, 7.0, 6.0, 10.0, 10.0, 18.0, 17.0, 30.0, 14.0, 34.0, 34.0, 37.0, 40.0, 43.0, 42.0, 46.0, 41.0, 83.0, 890.0, 195.0, 44.0, 33.0, 31.0, 36.0, 36.0, 35.0, 36.0, 22.0, 31.0, 17.0, 19.0, 16.0, 13.0, 9.0, 10.0, 8.0, 5.0, 3.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.640625, -3.540985107421875, -3.44134521484375, -3.341705322265625, -3.2420654296875, -3.142425537109375, -3.04278564453125, -2.943145751953125, -2.843505859375, -2.743865966796875, -2.64422607421875, -2.544586181640625, -2.4449462890625, -2.345306396484375, -2.24566650390625, -2.146026611328125, -2.04638671875, -1.946746826171875, -1.84710693359375, -1.747467041015625, -1.6478271484375, -1.548187255859375, -1.44854736328125, -1.348907470703125, -1.249267578125, -1.149627685546875, -1.04998779296875, -0.950347900390625, -0.8507080078125, -0.751068115234375, -0.65142822265625, -0.551788330078125, -0.4521484375, -0.352508544921875, -0.25286865234375, -0.153228759765625, -0.0535888671875, 0.046051025390625, 0.14569091796875, 0.245330810546875, 0.344970703125, 0.444610595703125, 0.54425048828125, 0.643890380859375, 0.7435302734375, 0.843170166015625, 0.94281005859375, 1.042449951171875, 1.14208984375, 1.241729736328125, 1.34136962890625, 1.441009521484375, 1.5406494140625, 1.640289306640625, 1.73992919921875, 1.839569091796875, 1.939208984375, 2.038848876953125, 2.13848876953125, 2.238128662109375, 2.3377685546875, 2.437408447265625, 2.53704833984375, 2.636688232421875, 2.736328125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 8.0, 10.0, 10.0, 11.0, 19.0, 43.0, 34.0, 54.0, 82.0, 124.0, 162.0, 226.0, 325.0, 426.0, 663.0, 1023.0, 1681.0, 2782.0, 5326.0, 11682.0, 29766.0, 88490.0, 278136.0, 765019.0, 4161191.0, 616737.0, 214330.0, 68417.0, 24019.0, 9461.0, 4363.0, 2411.0, 1457.0, 935.0, 583.0, 414.0, 293.0, 211.0, 138.0, 89.0, 72.0, 52.0, 44.0, 27.0, 26.0, 18.0, 14.0, 9.0, 10.0, 6.0, 4.0, 4.0, 2.0, 5.0], "bins": [-0.5595703125, -0.5432968139648438, -0.5270233154296875, -0.5107498168945312, -0.494476318359375, -0.47820281982421875, -0.4619293212890625, -0.44565582275390625, -0.42938232421875, -0.41310882568359375, -0.3968353271484375, -0.38056182861328125, -0.364288330078125, -0.34801483154296875, -0.3317413330078125, -0.31546783447265625, -0.2991943359375, -0.28292083740234375, -0.2666473388671875, -0.25037384033203125, -0.234100341796875, -0.21782684326171875, -0.2015533447265625, -0.18527984619140625, -0.16900634765625, -0.15273284912109375, -0.1364593505859375, -0.12018585205078125, -0.103912353515625, -0.08763885498046875, -0.0713653564453125, -0.05509185791015625, -0.038818359375, -0.02254486083984375, -0.0062713623046875, 0.01000213623046875, 0.026275634765625, 0.04254913330078125, 0.0588226318359375, 0.07509613037109375, 0.09136962890625, 0.10764312744140625, 0.1239166259765625, 0.14019012451171875, 0.156463623046875, 0.17273712158203125, 0.1890106201171875, 0.20528411865234375, 0.2215576171875, 0.23783111572265625, 0.2541046142578125, 0.27037811279296875, 0.286651611328125, 0.30292510986328125, 0.3191986083984375, 0.33547210693359375, 0.35174560546875, 0.36801910400390625, 0.3842926025390625, 0.40056610107421875, 0.416839599609375, 0.43311309814453125, 0.4493865966796875, 0.46566009521484375, 0.48193359375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 10.0, 6.0, 4.0, 12.0, 8.0, 11.0, 19.0, 21.0, 21.0, 27.0, 25.0, 41.0, 24.0, 27.0, 45.0, 39.0, 30.0, 38.0, 40.0, 105.0, 923.0, 115.0, 49.0, 34.0, 39.0, 35.0, 24.0, 32.0, 24.0, 28.0, 25.0, 21.0, 21.0, 20.0, 21.0, 18.0, 9.0, 7.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.197265625, -3.095672607421875, -2.99407958984375, -2.892486572265625, -2.7908935546875, -2.689300537109375, -2.58770751953125, -2.486114501953125, -2.384521484375, -2.282928466796875, -2.18133544921875, -2.079742431640625, -1.9781494140625, -1.876556396484375, -1.77496337890625, -1.673370361328125, -1.57177734375, -1.470184326171875, -1.36859130859375, -1.266998291015625, -1.1654052734375, -1.063812255859375, -0.96221923828125, -0.860626220703125, -0.759033203125, -0.657440185546875, -0.55584716796875, -0.454254150390625, -0.3526611328125, -0.251068115234375, -0.14947509765625, -0.047882080078125, 0.0537109375, 0.155303955078125, 0.25689697265625, 0.358489990234375, 0.4600830078125, 0.561676025390625, 0.66326904296875, 0.764862060546875, 0.866455078125, 0.968048095703125, 1.06964111328125, 1.171234130859375, 1.2728271484375, 1.374420166015625, 1.47601318359375, 1.577606201171875, 1.67919921875, 1.780792236328125, 1.88238525390625, 1.983978271484375, 2.0855712890625, 2.187164306640625, 2.28875732421875, 2.390350341796875, 2.491943359375, 2.593536376953125, 2.69512939453125, 2.796722412109375, 2.8983154296875, 2.999908447265625, 3.10150146484375, 3.203094482421875, 3.3046875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 10.0, 11.0, 9.0, 35.0, 89.0, 331.0, 319.0, 117.0, 53.0, 16.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.579322814941406, -19.090288162231445, -18.601253509521484, -18.112218856811523, -17.623184204101562, -17.13414764404297, -16.64511489868164, -16.156078338623047, -15.667043685913086, -15.178009033203125, -14.688974380493164, -14.199939727783203, -13.710904121398926, -13.221869468688965, -12.732834815979004, -12.243800163269043, -11.754765510559082, -11.265730857849121, -10.77669620513916, -10.287660598754883, -9.798625946044922, -9.309591293334961, -8.820556640625, -8.331521987915039, -7.84248685836792, -7.353452205657959, -6.86441707611084, -6.375382423400879, -5.886347770690918, -5.397312641143799, -4.908277988433838, -4.419242858886719, -3.9302072525024414, -3.4411723613739014, -2.9521374702453613, -2.4631028175354004, -1.9740679264068604, -1.4850330352783203, -0.9959983825683594, -0.5069634914398193, -0.017928600311279297, 0.47110623121261597, 0.9601410627365112, 1.4491758346557617, 1.9382107257843018, 2.427245616912842, 2.9162802696228027, 3.4053151607513428, 3.894350051879883, 4.383384704589844, 4.872419834136963, 5.361454486846924, 5.850489616394043, 6.339524269104004, 6.828558921813965, 7.317593574523926, 7.806628704071045, 8.295663833618164, 8.784698486328125, 9.273733139038086, 9.762767791748047, 10.251802444458008, 10.740837097167969, 11.229872703552246, 11.718907356262207]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 3.0, 4.0, 9.0, 7.0, 7.0, 13.0, 19.0, 14.0, 25.0, 25.0, 27.0, 36.0, 31.0, 32.0, 48.0, 44.0, 45.0, 42.0, 40.0, 54.0, 57.0, 35.0, 46.0, 38.0, 38.0, 38.0, 30.0, 26.0, 35.0, 27.0, 19.0, 20.0, 11.0, 11.0, 10.0, 8.0, 7.0, 6.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.10011100769043, -9.768705368041992, -9.437298774719238, -9.1058931350708, -8.774486541748047, -8.44308090209961, -8.111675262451172, -7.780269145965576, -7.4488630294799805, -7.117456912994385, -6.786050796508789, -6.454645156860352, -6.123239040374756, -5.79183292388916, -5.460427284240723, -5.129021167755127, -4.797615051269531, -4.4662089347839355, -4.13480281829834, -3.8033971786499023, -3.4719910621643066, -3.140584945678711, -2.8091790676116943, -2.4777731895446777, -2.146367073059082, -1.8149610757827759, -1.4835550785064697, -1.1521490812301636, -0.8207430839538574, -0.48933708667755127, -0.15793108940124512, 0.17347478866577148, 0.5048809051513672, 0.8362869024276733, 1.1676928997039795, 1.4990988969802856, 1.8305048942565918, 2.1619110107421875, 2.493316888809204, 2.8247227668762207, 3.1561288833618164, 3.487534999847412, 3.8189408779144287, 4.150346755981445, 4.481752872467041, 4.813158988952637, 5.144564628601074, 5.47597074508667, 5.807376861572266, 6.138782978057861, 6.470189094543457, 6.8015947341918945, 7.13300085067749, 7.464406967163086, 7.795812606811523, 8.127218246459961, 8.458624839782715, 8.790030479431152, 9.121437072753906, 9.452842712402344, 9.784248352050781, 10.115654945373535, 10.447060585021973, 10.778467178344727, 11.109872817993164]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 5.0, 4.0, 6.0, 16.0, 21.0, 24.0, 29.0, 36.0, 57.0, 94.0, 110.0, 161.0, 290.0, 556.0, 1303.0, 3872.0, 14577.0, 112770.0, 3952287.0, 88110.0, 13562.0, 3976.0, 1258.0, 509.0, 218.0, 121.0, 72.0, 54.0, 40.0, 38.0, 31.0, 23.0, 18.0, 14.0, 15.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.234130859375, -0.22752952575683594, -0.22092819213867188, -0.2143268585205078, -0.20772552490234375, -0.2011241912841797, -0.19452285766601562, -0.18792152404785156, -0.1813201904296875, -0.17471885681152344, -0.16811752319335938, -0.1615161895751953, -0.15491485595703125, -0.1483135223388672, -0.14171218872070312, -0.13511085510253906, -0.128509521484375, -0.12190818786621094, -0.11530685424804688, -0.10870552062988281, -0.10210418701171875, -0.09550285339355469, -0.08890151977539062, -0.08230018615722656, -0.0756988525390625, -0.06909751892089844, -0.062496185302734375, -0.05589485168457031, -0.04929351806640625, -0.04269218444824219, -0.036090850830078125, -0.029489517211914062, -0.02288818359375, -0.016286849975585938, -0.009685516357421875, -0.0030841827392578125, 0.00351715087890625, 0.010118484497070312, 0.016719818115234375, 0.023321151733398438, 0.0299224853515625, 0.03652381896972656, 0.043125152587890625, 0.04972648620605469, 0.05632781982421875, 0.06292915344238281, 0.06953048706054688, 0.07613182067871094, 0.082733154296875, 0.08933448791503906, 0.09593582153320312, 0.10253715515136719, 0.10913848876953125, 0.11573982238769531, 0.12234115600585938, 0.12894248962402344, 0.1355438232421875, 0.14214515686035156, 0.14874649047851562, 0.1553478240966797, 0.16194915771484375, 0.1685504913330078, 0.17515182495117188, 0.18175315856933594, 0.1883544921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 9.0, 10.0, 9.0, 7.0, 14.0, 16.0, 25.0, 22.0, 19.0, 25.0, 33.0, 38.0, 46.0, 51.0, 58.0, 53.0, 61.0, 60.0, 53.0, 53.0, 50.0, 45.0, 40.0, 33.0, 22.0, 32.0, 16.0, 10.0, 16.0, 14.0, 15.0, 12.0, 10.0, 4.0, 8.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042877197265625, -0.04157590866088867, -0.040274620056152344, -0.038973331451416016, -0.03767204284667969, -0.03637075424194336, -0.03506946563720703, -0.0337681770324707, -0.032466888427734375, -0.031165599822998047, -0.02986431121826172, -0.02856302261352539, -0.027261734008789062, -0.025960445404052734, -0.024659156799316406, -0.023357868194580078, -0.02205657958984375, -0.020755290985107422, -0.019454002380371094, -0.018152713775634766, -0.016851425170898438, -0.01555013656616211, -0.014248847961425781, -0.012947559356689453, -0.011646270751953125, -0.010344982147216797, -0.009043693542480469, -0.007742404937744141, -0.0064411163330078125, -0.005139827728271484, -0.0038385391235351562, -0.002537250518798828, -0.0012359619140625, 6.532669067382812e-05, 0.0013666152954101562, 0.0026679039001464844, 0.0039691925048828125, 0.005270481109619141, 0.006571769714355469, 0.007873058319091797, 0.009174346923828125, 0.010475635528564453, 0.011776924133300781, 0.01307821273803711, 0.014379501342773438, 0.015680789947509766, 0.016982078552246094, 0.018283367156982422, 0.01958465576171875, 0.020885944366455078, 0.022187232971191406, 0.023488521575927734, 0.024789810180664062, 0.02609109878540039, 0.02739238739013672, 0.028693675994873047, 0.029994964599609375, 0.0312962532043457, 0.03259754180908203, 0.03389883041381836, 0.03520011901855469, 0.036501407623291016, 0.037802696228027344, 0.03910398483276367, 0.0404052734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 7.0, 10.0, 17.0, 13.0, 31.0, 39.0, 59.0, 91.0, 270.0, 1474.0, 59622.0, 4122011.0, 9568.0, 703.0, 127.0, 62.0, 43.0, 23.0, 15.0, 15.0, 14.0, 5.0, 7.0, 8.0, 8.0, 6.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.279052734375, -0.2709197998046875, -0.262786865234375, -0.2546539306640625, -0.24652099609375, -0.2383880615234375, -0.230255126953125, -0.2221221923828125, -0.2139892578125, -0.2058563232421875, -0.197723388671875, -0.1895904541015625, -0.18145751953125, -0.1733245849609375, -0.165191650390625, -0.1570587158203125, -0.14892578125, -0.1407928466796875, -0.132659912109375, -0.1245269775390625, -0.11639404296875, -0.1082611083984375, -0.100128173828125, -0.0919952392578125, -0.0838623046875, -0.0757293701171875, -0.067596435546875, -0.0594635009765625, -0.05133056640625, -0.0431976318359375, -0.035064697265625, -0.0269317626953125, -0.018798828125, -0.0106658935546875, -0.002532958984375, 0.0055999755859375, 0.01373291015625, 0.0218658447265625, 0.029998779296875, 0.0381317138671875, 0.0462646484375, 0.0543975830078125, 0.062530517578125, 0.0706634521484375, 0.07879638671875, 0.0869293212890625, 0.095062255859375, 0.1031951904296875, 0.111328125, 0.1194610595703125, 0.127593994140625, 0.1357269287109375, 0.14385986328125, 0.1519927978515625, 0.160125732421875, 0.1682586669921875, 0.1763916015625, 0.1845245361328125, 0.192657470703125, 0.2007904052734375, 0.20892333984375, 0.2170562744140625, 0.225189208984375, 0.2333221435546875, 0.241455078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 8.0, 4.0, 2.0, 10.0, 14.0, 13.0, 27.0, 48.0, 77.0, 182.0, 441.0, 1107.0, 1181.0, 522.0, 196.0, 92.0, 46.0, 26.0, 25.0, 16.0, 8.0, 10.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0911865234375, -0.08833789825439453, -0.08548927307128906, -0.0826406478881836, -0.07979202270507812, -0.07694339752197266, -0.07409477233886719, -0.07124614715576172, -0.06839752197265625, -0.06554889678955078, -0.06270027160644531, -0.059851646423339844, -0.057003021240234375, -0.054154396057128906, -0.05130577087402344, -0.04845714569091797, -0.0456085205078125, -0.04275989532470703, -0.03991127014160156, -0.037062644958496094, -0.034214019775390625, -0.031365394592285156, -0.028516769409179688, -0.02566814422607422, -0.02281951904296875, -0.01997089385986328, -0.017122268676757812, -0.014273643493652344, -0.011425018310546875, -0.008576393127441406, -0.0057277679443359375, -0.0028791427612304688, -3.0517578125e-05, 0.0028181076049804688, 0.0056667327880859375, 0.008515357971191406, 0.011363983154296875, 0.014212608337402344, 0.017061233520507812, 0.01990985870361328, 0.02275848388671875, 0.02560710906982422, 0.028455734252929688, 0.031304359436035156, 0.034152984619140625, 0.037001609802246094, 0.03985023498535156, 0.04269886016845703, 0.0455474853515625, 0.04839611053466797, 0.05124473571777344, 0.054093360900878906, 0.056941986083984375, 0.059790611267089844, 0.06263923645019531, 0.06548786163330078, 0.06833648681640625, 0.07118511199951172, 0.07403373718261719, 0.07688236236572266, 0.07973098754882812, 0.0825796127319336, 0.08542823791503906, 0.08827686309814453, 0.09112548828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 793.0, 199.0, 10.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1575231552124023, -1.0923783779144287, -1.027233600616455, -0.9620888233184814, -0.8969440460205078, -0.8317992687225342, -0.7666545510292053, -0.7015097737312317, -0.6363649964332581, -0.5712202191352844, -0.5060754418373108, -0.44093069434165955, -0.3757859170436859, -0.3106411397457123, -0.24549639225006104, -0.1803516149520874, -0.11520683765411377, -0.050062067806720734, 0.015082702040672302, 0.08022746443748474, 0.14537224173545837, 0.210517019033432, 0.27566176652908325, 0.3408065438270569, 0.4059513211250305, 0.47109609842300415, 0.5362408757209778, 0.6013855934143066, 0.6665303707122803, 0.7316751480102539, 0.7968199253082275, 0.8619647026062012, 0.9271094799041748, 0.9922542572021484, 1.057399034500122, 1.1225438117980957, 1.1876885890960693, 1.252833366394043, 1.3179781436920166, 1.3831229209899902, 1.4482676982879639, 1.5134124755859375, 1.5785572528839111, 1.6437020301818848, 1.7088468074798584, 1.773991584777832, 1.8391363620758057, 1.9042811393737793, 1.9694257974624634, 2.0345704555511475, 2.099715232849121, 2.1648600101470947, 2.2300047874450684, 2.295149564743042, 2.3602943420410156, 2.4254391193389893, 2.490583896636963, 2.5557286739349365, 2.62087345123291, 2.686018228530884, 2.7511630058288574, 2.816307783126831, 2.8814525604248047, 2.9465973377227783, 3.011742115020752]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 2.0, 5.0, 4.0, 2.0, 9.0, 11.0, 11.0, 13.0, 18.0, 17.0, 31.0, 23.0, 26.0, 20.0, 31.0, 39.0, 39.0, 33.0, 31.0, 30.0, 50.0, 38.0, 39.0, 36.0, 37.0, 41.0, 57.0, 34.0, 36.0, 30.0, 22.0, 26.0, 26.0, 13.0, 19.0, 22.0, 13.0, 14.0, 14.0, 10.0, 6.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.15533310174942017, -0.15025539696216583, -0.1451776921749115, -0.14009998738765717, -0.13502228260040283, -0.1299445629119873, -0.12486685812473297, -0.11978915333747864, -0.1147114485502243, -0.10963374376296997, -0.10455603897571564, -0.0994783267378807, -0.09440062195062637, -0.08932291716337204, -0.08424520492553711, -0.07916750013828278, -0.07408979535102844, -0.06901209056377411, -0.06393438577651978, -0.058856673538684845, -0.05377896875143051, -0.04870126396417618, -0.043623555451631546, -0.038545846939086914, -0.03346814215183258, -0.028390435501933098, -0.023312728852033615, -0.018235022202134132, -0.01315731555223465, -0.008079608902335167, -0.003001902252435684, 0.0020758062601089478, 0.007153511047363281, 0.012231217697262764, 0.017308924347162247, 0.02238663099706173, 0.027464337646961212, 0.032542042434215546, 0.03761975094676018, 0.04269745945930481, 0.04777516424655914, 0.05285286903381348, 0.05793057754635811, 0.06300828605890274, 0.06808599084615707, 0.07316369563341141, 0.07824140787124634, 0.08331911265850067, 0.088396817445755, 0.09347452223300934, 0.09855222702026367, 0.1036299392580986, 0.10870764404535294, 0.11378534883260727, 0.1188630610704422, 0.12394076585769653, 0.12901847064495087, 0.1340961754322052, 0.13917388021945953, 0.14425158500671387, 0.1493293046951294, 0.15440700948238373, 0.15948471426963806, 0.1645624190568924, 0.16964012384414673]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 6.0, 7.0, 18.0, 14.0, 21.0, 23.0, 33.0, 42.0, 74.0, 93.0, 129.0, 191.0, 249.0, 442.0, 648.0, 1070.0, 1952.0, 3891.0, 9424.0, 40764.0, 808077.0, 152252.0, 16883.0, 5726.0, 2678.0, 1411.0, 872.0, 518.0, 320.0, 231.0, 143.0, 106.0, 65.0, 37.0, 32.0, 30.0, 21.0, 18.0, 14.0, 8.0, 6.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.20849609375, -0.20124053955078125, -0.1939849853515625, -0.18672943115234375, -0.179473876953125, -0.17221832275390625, -0.1649627685546875, -0.15770721435546875, -0.15045166015625, -0.14319610595703125, -0.1359405517578125, -0.12868499755859375, -0.121429443359375, -0.11417388916015625, -0.1069183349609375, -0.09966278076171875, -0.0924072265625, -0.08515167236328125, -0.0778961181640625, -0.07064056396484375, -0.063385009765625, -0.05612945556640625, -0.0488739013671875, -0.04161834716796875, -0.03436279296875, -0.02710723876953125, -0.0198516845703125, -0.01259613037109375, -0.005340576171875, 0.00191497802734375, 0.0091705322265625, 0.01642608642578125, 0.023681640625, 0.03093719482421875, 0.0381927490234375, 0.04544830322265625, 0.052703857421875, 0.05995941162109375, 0.0672149658203125, 0.07447052001953125, 0.08172607421875, 0.08898162841796875, 0.0962371826171875, 0.10349273681640625, 0.110748291015625, 0.11800384521484375, 0.1252593994140625, 0.13251495361328125, 0.1397705078125, 0.14702606201171875, 0.1542816162109375, 0.16153717041015625, 0.168792724609375, 0.17604827880859375, 0.1833038330078125, 0.19055938720703125, 0.19781494140625, 0.20507049560546875, 0.2123260498046875, 0.21958160400390625, 0.226837158203125, 0.23409271240234375, 0.2413482666015625, 0.24860382080078125, 0.255859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 7.0, 12.0, 9.0, 10.0, 19.0, 18.0, 16.0, 18.0, 28.0, 25.0, 32.0, 37.0, 42.0, 53.0, 51.0, 53.0, 57.0, 58.0, 47.0, 51.0, 44.0, 41.0, 29.0, 47.0, 26.0, 30.0, 22.0, 17.0, 13.0, 19.0, 11.0, 12.0, 8.0, 8.0, 7.0, 4.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.046173095703125, -0.04496145248413086, -0.04374980926513672, -0.04253816604614258, -0.04132652282714844, -0.0401148796081543, -0.038903236389160156, -0.037691593170166016, -0.036479949951171875, -0.035268306732177734, -0.034056663513183594, -0.03284502029418945, -0.03163337707519531, -0.030421733856201172, -0.02921009063720703, -0.02799844741821289, -0.02678680419921875, -0.02557516098022461, -0.02436351776123047, -0.023151874542236328, -0.021940231323242188, -0.020728588104248047, -0.019516944885253906, -0.018305301666259766, -0.017093658447265625, -0.015882015228271484, -0.014670372009277344, -0.013458728790283203, -0.012247085571289062, -0.011035442352294922, -0.009823799133300781, -0.00861215591430664, -0.0074005126953125, -0.006188869476318359, -0.004977226257324219, -0.003765583038330078, -0.0025539398193359375, -0.0013422966003417969, -0.00013065338134765625, 0.0010809898376464844, 0.002292633056640625, 0.0035042762756347656, 0.004715919494628906, 0.005927562713623047, 0.0071392059326171875, 0.008350849151611328, 0.009562492370605469, 0.01077413558959961, 0.01198577880859375, 0.01319742202758789, 0.014409065246582031, 0.015620708465576172, 0.016832351684570312, 0.018043994903564453, 0.019255638122558594, 0.020467281341552734, 0.021678924560546875, 0.022890567779541016, 0.024102210998535156, 0.025313854217529297, 0.026525497436523438, 0.027737140655517578, 0.02894878387451172, 0.03016042709350586, 0.0313720703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 7.0, 3.0, 8.0, 5.0, 16.0, 24.0, 28.0, 40.0, 44.0, 48.0, 68.0, 86.0, 162.0, 241.0, 658.0, 2375.0, 18089.0, 401264.0, 593738.0, 26963.0, 3081.0, 750.0, 322.0, 149.0, 86.0, 80.0, 38.0, 45.0, 35.0, 21.0, 13.0, 16.0, 13.0, 6.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1156005859375, -0.11199665069580078, -0.10839271545410156, -0.10478878021240234, -0.10118484497070312, -0.0975809097290039, -0.09397697448730469, -0.09037303924560547, -0.08676910400390625, -0.08316516876220703, -0.07956123352050781, -0.0759572982788086, -0.07235336303710938, -0.06874942779541016, -0.06514549255371094, -0.06154155731201172, -0.0579376220703125, -0.05433368682861328, -0.05072975158691406, -0.047125816345214844, -0.043521881103515625, -0.039917945861816406, -0.03631401062011719, -0.03271007537841797, -0.02910614013671875, -0.02550220489501953, -0.021898269653320312, -0.018294334411621094, -0.014690399169921875, -0.011086463928222656, -0.0074825286865234375, -0.0038785934448242188, -0.000274658203125, 0.0033292770385742188, 0.0069332122802734375, 0.010537147521972656, 0.014141082763671875, 0.017745018005371094, 0.021348953247070312, 0.02495288848876953, 0.02855682373046875, 0.03216075897216797, 0.03576469421386719, 0.039368629455566406, 0.042972564697265625, 0.046576499938964844, 0.05018043518066406, 0.05378437042236328, 0.0573883056640625, 0.06099224090576172, 0.06459617614746094, 0.06820011138916016, 0.07180404663085938, 0.0754079818725586, 0.07901191711425781, 0.08261585235595703, 0.08621978759765625, 0.08982372283935547, 0.09342765808105469, 0.0970315933227539, 0.10063552856445312, 0.10423946380615234, 0.10784339904785156, 0.11144733428955078, 0.11505126953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 10.0, 7.0, 12.0, 15.0, 10.0, 18.0, 31.0, 22.0, 26.0, 25.0, 34.0, 43.0, 37.0, 43.0, 46.0, 46.0, 48.0, 51.0, 45.0, 54.0, 43.0, 33.0, 33.0, 38.0, 33.0, 36.0, 15.0, 19.0, 21.0, 21.0, 15.0, 21.0, 17.0, 3.0, 9.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.10675048828125, -0.10381507873535156, -0.10087966918945312, -0.09794425964355469, -0.09500885009765625, -0.09207344055175781, -0.08913803100585938, -0.08620262145996094, -0.0832672119140625, -0.08033180236816406, -0.07739639282226562, -0.07446098327636719, -0.07152557373046875, -0.06859016418457031, -0.06565475463867188, -0.06271934509277344, -0.059783935546875, -0.05684852600097656, -0.053913116455078125, -0.05097770690917969, -0.04804229736328125, -0.04510688781738281, -0.042171478271484375, -0.03923606872558594, -0.0363006591796875, -0.03336524963378906, -0.030429840087890625, -0.027494430541992188, -0.02455902099609375, -0.021623611450195312, -0.018688201904296875, -0.015752792358398438, -0.0128173828125, -0.009881973266601562, -0.006946563720703125, -0.0040111541748046875, -0.00107574462890625, 0.0018596649169921875, 0.004795074462890625, 0.0077304840087890625, 0.0106658935546875, 0.013601303100585938, 0.016536712646484375, 0.019472122192382812, 0.02240753173828125, 0.025342941284179688, 0.028278350830078125, 0.031213760375976562, 0.034149169921875, 0.03708457946777344, 0.040019989013671875, 0.04295539855957031, 0.04589080810546875, 0.04882621765136719, 0.051761627197265625, 0.05469703674316406, 0.0576324462890625, 0.06056785583496094, 0.06350326538085938, 0.06643867492675781, 0.06937408447265625, 0.07230949401855469, 0.07524490356445312, 0.07818031311035156, 0.08111572265625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 9.0, 10.0, 6.0, 20.0, 15.0, 29.0, 50.0, 57.0, 77.0, 118.0, 193.0, 390.0, 811.0, 1921.0, 5057.0, 22955.0, 492696.0, 492391.0, 22950.0, 5021.0, 1929.0, 823.0, 399.0, 213.0, 120.0, 76.0, 60.0, 44.0, 29.0, 21.0, 20.0, 9.0, 10.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02484130859375, -0.02403998374938965, -0.023238658905029297, -0.022437334060668945, -0.021636009216308594, -0.020834684371948242, -0.02003335952758789, -0.01923203468322754, -0.018430709838867188, -0.017629384994506836, -0.016828060150146484, -0.016026735305786133, -0.015225410461425781, -0.01442408561706543, -0.013622760772705078, -0.012821435928344727, -0.012020111083984375, -0.011218786239624023, -0.010417461395263672, -0.00961613655090332, -0.008814811706542969, -0.008013486862182617, -0.007212162017822266, -0.006410837173461914, -0.0056095123291015625, -0.004808187484741211, -0.004006862640380859, -0.003205537796020508, -0.0024042129516601562, -0.0016028881072998047, -0.0008015632629394531, -2.384185791015625e-07, 0.00080108642578125, 0.0016024112701416016, 0.002403736114501953, 0.0032050609588623047, 0.004006385803222656, 0.004807710647583008, 0.005609035491943359, 0.006410360336303711, 0.0072116851806640625, 0.008013010025024414, 0.008814334869384766, 0.009615659713745117, 0.010416984558105469, 0.01121830940246582, 0.012019634246826172, 0.012820959091186523, 0.013622283935546875, 0.014423608779907227, 0.015224933624267578, 0.01602625846862793, 0.01682758331298828, 0.017628908157348633, 0.018430233001708984, 0.019231557846069336, 0.020032882690429688, 0.02083420753479004, 0.02163553237915039, 0.022436857223510742, 0.023238182067871094, 0.024039506912231445, 0.024840831756591797, 0.02564215660095215, 0.0264434814453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 3.0, 5.0, 11.0, 16.0, 15.0, 18.0, 15.0, 30.0, 40.0, 49.0, 58.0, 54.0, 82.0, 77.0, 84.0, 68.0, 53.0, 65.0, 53.0, 35.0, 47.0, 21.0, 26.0, 15.0, 17.0, 9.0, 12.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0728836059570312e-05, -1.044292002916336e-05, -1.0157003998756409e-05, -9.871087968349457e-06, -9.585171937942505e-06, -9.299255907535553e-06, -9.013339877128601e-06, -8.72742384672165e-06, -8.441507816314697e-06, -8.155591785907745e-06, -7.869675755500793e-06, -7.5837597250938416e-06, -7.29784369468689e-06, -7.011927664279938e-06, -6.726011633872986e-06, -6.440095603466034e-06, -6.154179573059082e-06, -5.86826354265213e-06, -5.582347512245178e-06, -5.296431481838226e-06, -5.010515451431274e-06, -4.7245994210243225e-06, -4.438683390617371e-06, -4.152767360210419e-06, -3.866851329803467e-06, -3.580935299396515e-06, -3.295019268989563e-06, -3.009103238582611e-06, -2.723187208175659e-06, -2.4372711777687073e-06, -2.1513551473617554e-06, -1.8654391169548035e-06, -1.5795230865478516e-06, -1.2936070561408997e-06, -1.0076910257339478e-06, -7.217749953269958e-07, -4.3585896492004395e-07, -1.4994293451309204e-07, 1.3597309589385986e-07, 4.2188912630081177e-07, 7.078051567077637e-07, 9.937211871147156e-07, 1.2796372175216675e-06, 1.5655532479286194e-06, 1.8514692783355713e-06, 2.137385308742523e-06, 2.423301339149475e-06, 2.709217369556427e-06, 2.995133399963379e-06, 3.281049430370331e-06, 3.5669654607772827e-06, 3.852881491184235e-06, 4.1387975215911865e-06, 4.4247135519981384e-06, 4.71062958240509e-06, 4.996545612812042e-06, 5.282461643218994e-06, 5.568377673625946e-06, 5.854293704032898e-06, 6.14020973443985e-06, 6.426125764846802e-06, 6.712041795253754e-06, 6.9979578256607056e-06, 7.2838738560676575e-06, 7.569789886474609e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 11.0, 6.0, 15.0, 20.0, 40.0, 88.0, 196.0, 377.0, 739.0, 1592.0, 3579.0, 10678.0, 344021.0, 666267.0, 13428.0, 3943.0, 1773.0, 875.0, 419.0, 225.0, 101.0, 54.0, 32.0, 15.0, 11.0, 6.0, 6.0, 2.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.04595947265625, -0.04432201385498047, -0.04268455505371094, -0.041047096252441406, -0.039409637451171875, -0.037772178649902344, -0.03613471984863281, -0.03449726104736328, -0.03285980224609375, -0.03122234344482422, -0.029584884643554688, -0.027947425842285156, -0.026309967041015625, -0.024672508239746094, -0.023035049438476562, -0.02139759063720703, -0.0197601318359375, -0.01812267303466797, -0.016485214233398438, -0.014847755432128906, -0.013210296630859375, -0.011572837829589844, -0.009935379028320312, -0.008297920227050781, -0.00666046142578125, -0.005023002624511719, -0.0033855438232421875, -0.0017480850219726562, -0.000110626220703125, 0.0015268325805664062, 0.0031642913818359375, 0.004801750183105469, 0.006439208984375, 0.008076667785644531, 0.009714126586914062, 0.011351585388183594, 0.012989044189453125, 0.014626502990722656, 0.016263961791992188, 0.01790142059326172, 0.01953887939453125, 0.02117633819580078, 0.022813796997070312, 0.024451255798339844, 0.026088714599609375, 0.027726173400878906, 0.029363632202148438, 0.03100109100341797, 0.0326385498046875, 0.03427600860595703, 0.03591346740722656, 0.037550926208496094, 0.039188385009765625, 0.040825843811035156, 0.04246330261230469, 0.04410076141357422, 0.04573822021484375, 0.04737567901611328, 0.04901313781738281, 0.050650596618652344, 0.052288055419921875, 0.053925514221191406, 0.05556297302246094, 0.05720043182373047, 0.058837890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 6.0, 5.0, 9.0, 17.0, 24.0, 34.0, 52.0, 101.0, 130.0, 192.0, 147.0, 107.0, 45.0, 36.0, 24.0, 15.0, 12.0, 5.0, 7.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04559326171875, -0.04431343078613281, -0.043033599853515625, -0.04175376892089844, -0.04047393798828125, -0.03919410705566406, -0.037914276123046875, -0.03663444519042969, -0.0353546142578125, -0.03407478332519531, -0.032794952392578125, -0.03151512145996094, -0.03023529052734375, -0.028955459594726562, -0.027675628662109375, -0.026395797729492188, -0.025115966796875, -0.023836135864257812, -0.022556304931640625, -0.021276473999023438, -0.01999664306640625, -0.018716812133789062, -0.017436981201171875, -0.016157150268554688, -0.0148773193359375, -0.013597488403320312, -0.012317657470703125, -0.011037826538085938, -0.00975799560546875, -0.008478164672851562, -0.007198333740234375, -0.0059185028076171875, -0.004638671875, -0.0033588409423828125, -0.002079010009765625, -0.0007991790771484375, 0.00048065185546875, 0.0017604827880859375, 0.003040313720703125, 0.0043201446533203125, 0.0055999755859375, 0.0068798065185546875, 0.008159637451171875, 0.009439468383789062, 0.01071929931640625, 0.011999130249023438, 0.013278961181640625, 0.014558792114257812, 0.015838623046875, 0.017118453979492188, 0.018398284912109375, 0.019678115844726562, 0.02095794677734375, 0.022237777709960938, 0.023517608642578125, 0.024797439575195312, 0.0260772705078125, 0.027357101440429688, 0.028636932373046875, 0.029916763305664062, 0.03119659423828125, 0.03247642517089844, 0.033756256103515625, 0.03503608703613281, 0.03631591796875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 32.0, 240.0, 568.0, 135.0, 21.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7432074546813965, -1.6939830780029297, -1.644758701324463, -1.5955342054367065, -1.5463098287582397, -1.497085452079773, -1.4478610754013062, -1.3986365795135498, -1.349412202835083, -1.3001878261566162, -1.2509634494781494, -1.201738953590393, -1.1525145769119263, -1.1032902002334595, -1.0540658235549927, -1.0048413276672363, -0.9556170105934143, -0.9063926339149475, -0.8571681976318359, -0.8079438209533691, -0.7587193846702576, -0.7094950079917908, -0.6602705717086792, -0.6110461950302124, -0.5618218183517456, -0.5125974416732788, -0.46337300539016724, -0.41414862871170044, -0.36492419242858887, -0.31569981575012207, -0.2664754092693329, -0.2172510027885437, -0.16802656650543213, -0.11880216002464294, -0.06957776099443436, -0.02035336196422577, 0.028871044516563416, 0.0780954509973526, 0.1273198425769806, 0.17654424905776978, 0.22576865553855896, 0.27499306201934814, 0.32421746850013733, 0.3734418749809265, 0.4226662516593933, 0.4718906879425049, 0.5211150646209717, 0.5703394412994385, 0.61956387758255, 0.6687882542610168, 0.7180126905441284, 0.7672370672225952, 0.8164615035057068, 0.8656858801841736, 0.9149103164672852, 0.964134693145752, 1.0133590698242188, 1.0625834465026855, 1.1118078231811523, 1.1610323190689087, 1.2102566957473755, 1.2594810724258423, 1.308705449104309, 1.3579299449920654, 1.4071543216705322]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 4.0, 9.0, 6.0, 7.0, 7.0, 11.0, 10.0, 16.0, 16.0, 21.0, 15.0, 18.0, 26.0, 31.0, 22.0, 33.0, 35.0, 28.0, 39.0, 30.0, 38.0, 34.0, 38.0, 35.0, 35.0, 51.0, 32.0, 48.0, 34.0, 36.0, 36.0, 26.0, 25.0, 18.0, 22.0, 20.0, 16.0, 20.0, 7.0, 13.0, 10.0, 4.0, 4.0, 3.0, 4.0, 5.0, 0.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.49558281898498535, -0.4802844822406769, -0.464986115694046, -0.44968777894973755, -0.4343894124031067, -0.4190910756587982, -0.40379270911216736, -0.3884943723678589, -0.373196005821228, -0.35789766907691956, -0.3425993025302887, -0.3273009657859802, -0.31200259923934937, -0.2967042624950409, -0.28140589594841003, -0.26610755920410156, -0.2508091926574707, -0.23551084101200104, -0.22021248936653137, -0.2049141377210617, -0.18961578607559204, -0.17431744933128357, -0.1590190827846527, -0.14372074604034424, -0.12842240929603577, -0.1131240576505661, -0.09782570600509644, -0.08252735435962677, -0.0672290027141571, -0.051930658519268036, -0.03663230687379837, -0.021333955228328705, -0.006035596132278442, 0.009262754581868649, 0.02456110529601574, 0.039859455078840256, 0.05515780672430992, 0.07045615464448929, 0.08575450628995895, 0.10105285793542862, 0.11635120958089828, 0.13164955377578735, 0.14694790542125702, 0.16224625706672668, 0.17754460871219635, 0.19284296035766602, 0.20814131200313568, 0.22343966364860535, 0.238738015294075, 0.2540363669395447, 0.26933470368385315, 0.284633070230484, 0.2999314069747925, 0.31522977352142334, 0.3305281102657318, 0.34582647681236267, 0.36112481355667114, 0.3764231503009796, 0.3917215168476105, 0.40701985359191895, 0.4223182201385498, 0.4376165568828583, 0.45291492342948914, 0.4682132601737976, 0.48351162672042847]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 9.0, 10.0, 11.0, 17.0, 17.0, 9.0, 27.0, 36.0, 38.0, 48.0, 64.0, 102.0, 266.0, 1035.0, 5574.0, 4116116.0, 67274.0, 2579.0, 553.0, 156.0, 90.0, 45.0, 32.0, 24.0, 33.0, 21.0, 14.0, 18.0, 11.0, 9.0, 13.0, 8.0, 7.0, 1.0, 6.0, 4.0, 3.0, 1.0], "bins": [-0.63916015625, -0.6238632202148438, -0.6085662841796875, -0.5932693481445312, -0.577972412109375, -0.5626754760742188, -0.5473785400390625, -0.5320816040039062, -0.51678466796875, -0.5014877319335938, -0.4861907958984375, -0.47089385986328125, -0.455596923828125, -0.44029998779296875, -0.4250030517578125, -0.40970611572265625, -0.3944091796875, -0.37911224365234375, -0.3638153076171875, -0.34851837158203125, -0.333221435546875, -0.31792449951171875, -0.3026275634765625, -0.28733062744140625, -0.27203369140625, -0.25673675537109375, -0.2414398193359375, -0.22614288330078125, -0.210845947265625, -0.19554901123046875, -0.1802520751953125, -0.16495513916015625, -0.149658203125, -0.13436126708984375, -0.1190643310546875, -0.10376739501953125, -0.088470458984375, -0.07317352294921875, -0.0578765869140625, -0.04257965087890625, -0.02728271484375, -0.01198577880859375, 0.0033111572265625, 0.01860809326171875, 0.033905029296875, 0.04920196533203125, 0.0644989013671875, 0.07979583740234375, 0.0950927734375, 0.11038970947265625, 0.1256866455078125, 0.14098358154296875, 0.156280517578125, 0.17157745361328125, 0.1868743896484375, 0.20217132568359375, 0.21746826171875, 0.23276519775390625, 0.2480621337890625, 0.26335906982421875, 0.278656005859375, 0.29395294189453125, 0.3092498779296875, 0.32454681396484375, 0.33984375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 10.0, 5.0, 9.0, 19.0, 13.0, 11.0, 11.0, 26.0, 22.0, 27.0, 33.0, 31.0, 46.0, 51.0, 55.0, 58.0, 64.0, 43.0, 55.0, 52.0, 50.0, 41.0, 44.0, 31.0, 22.0, 35.0, 19.0, 20.0, 19.0, 15.0, 10.0, 18.0, 7.0, 7.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.04669189453125, -0.04546976089477539, -0.04424762725830078, -0.04302549362182617, -0.04180335998535156, -0.04058122634887695, -0.039359092712402344, -0.038136959075927734, -0.036914825439453125, -0.035692691802978516, -0.034470558166503906, -0.0332484245300293, -0.03202629089355469, -0.030804157257080078, -0.02958202362060547, -0.02835988998413086, -0.02713775634765625, -0.02591562271118164, -0.02469348907470703, -0.023471355438232422, -0.022249221801757812, -0.021027088165283203, -0.019804954528808594, -0.018582820892333984, -0.017360687255859375, -0.016138553619384766, -0.014916419982910156, -0.013694286346435547, -0.012472152709960938, -0.011250019073486328, -0.010027885437011719, -0.00880575180053711, -0.0075836181640625, -0.006361484527587891, -0.005139350891113281, -0.003917217254638672, -0.0026950836181640625, -0.0014729499816894531, -0.00025081634521484375, 0.0009713172912597656, 0.002193450927734375, 0.0034155845642089844, 0.004637718200683594, 0.005859851837158203, 0.0070819854736328125, 0.008304119110107422, 0.009526252746582031, 0.01074838638305664, 0.01197052001953125, 0.01319265365600586, 0.014414787292480469, 0.015636920928955078, 0.016859054565429688, 0.018081188201904297, 0.019303321838378906, 0.020525455474853516, 0.021747589111328125, 0.022969722747802734, 0.024191856384277344, 0.025413990020751953, 0.026636123657226562, 0.027858257293701172, 0.02908039093017578, 0.03030252456665039, 0.031524658203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 7.0, 5.0, 7.0, 18.0, 12.0, 43.0, 56.0, 142.0, 366.0, 1196.0, 7016.0, 92368.0, 3170474.0, 886178.0, 31586.0, 3556.0, 732.0, 260.0, 99.0, 61.0, 37.0, 25.0, 17.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10162353515625, -0.09752750396728516, -0.09343147277832031, -0.08933544158935547, -0.08523941040039062, -0.08114337921142578, -0.07704734802246094, -0.0729513168334961, -0.06885528564453125, -0.0647592544555664, -0.06066322326660156, -0.05656719207763672, -0.052471160888671875, -0.04837512969970703, -0.04427909851074219, -0.040183067321777344, -0.0360870361328125, -0.031991004943847656, -0.027894973754882812, -0.02379894256591797, -0.019702911376953125, -0.015606880187988281, -0.011510848999023438, -0.007414817810058594, -0.00331878662109375, 0.0007772445678710938, 0.0048732757568359375, 0.008969306945800781, 0.013065338134765625, 0.01716136932373047, 0.021257400512695312, 0.025353431701660156, 0.029449462890625, 0.033545494079589844, 0.03764152526855469, 0.04173755645751953, 0.045833587646484375, 0.04992961883544922, 0.05402565002441406, 0.058121681213378906, 0.06221771240234375, 0.0663137435913086, 0.07040977478027344, 0.07450580596923828, 0.07860183715820312, 0.08269786834716797, 0.08679389953613281, 0.09088993072509766, 0.0949859619140625, 0.09908199310302734, 0.10317802429199219, 0.10727405548095703, 0.11137008666992188, 0.11546611785888672, 0.11956214904785156, 0.1236581802368164, 0.12775421142578125, 0.1318502426147461, 0.13594627380371094, 0.14004230499267578, 0.14413833618164062, 0.14823436737060547, 0.1523303985595703, 0.15642642974853516, 0.1605224609375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 8.0, 13.0, 15.0, 9.0, 22.0, 52.0, 43.0, 68.0, 108.0, 172.0, 261.0, 459.0, 821.0, 734.0, 484.0, 277.0, 201.0, 128.0, 70.0, 36.0, 27.0, 21.0, 19.0, 7.0, 5.0, 2.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03729248046875, -0.0358123779296875, -0.034332275390625, -0.0328521728515625, -0.0313720703125, -0.0298919677734375, -0.028411865234375, -0.0269317626953125, -0.02545166015625, -0.0239715576171875, -0.022491455078125, -0.0210113525390625, -0.01953125, -0.0180511474609375, -0.016571044921875, -0.0150909423828125, -0.01361083984375, -0.0121307373046875, -0.010650634765625, -0.0091705322265625, -0.0076904296875, -0.0062103271484375, -0.004730224609375, -0.0032501220703125, -0.00177001953125, -0.0002899169921875, 0.001190185546875, 0.0026702880859375, 0.004150390625, 0.0056304931640625, 0.007110595703125, 0.0085906982421875, 0.01007080078125, 0.0115509033203125, 0.013031005859375, 0.0145111083984375, 0.0159912109375, 0.0174713134765625, 0.018951416015625, 0.0204315185546875, 0.02191162109375, 0.0233917236328125, 0.024871826171875, 0.0263519287109375, 0.02783203125, 0.0293121337890625, 0.030792236328125, 0.0322723388671875, 0.03375244140625, 0.0352325439453125, 0.036712646484375, 0.0381927490234375, 0.0396728515625, 0.0411529541015625, 0.042633056640625, 0.0441131591796875, 0.04559326171875, 0.0470733642578125, 0.048553466796875, 0.0500335693359375, 0.051513671875, 0.0529937744140625, 0.054473876953125, 0.0559539794921875, 0.05743408203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 10.0, 39.0, 260.0, 492.0, 151.0, 45.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3368317484855652, -0.314841091632843, -0.29285046458244324, -0.27085983753204346, -0.2488691806793213, -0.22687853872776031, -0.20488789677619934, -0.18289725482463837, -0.1609066128730774, -0.13891597092151642, -0.11692532896995544, -0.09493468701839447, -0.0729440450668335, -0.05095340311527252, -0.028962761163711548, -0.006972119212150574, 0.0150185227394104, 0.037009164690971375, 0.05899980664253235, 0.08099044859409332, 0.1029810905456543, 0.12497173249721527, 0.14696237444877625, 0.16895301640033722, 0.1909436583518982, 0.21293430030345917, 0.23492494225502014, 0.2569155693054199, 0.2789062261581421, 0.30089688301086426, 0.32288751006126404, 0.3448781371116638, 0.36686885356903076, 0.38885951042175293, 0.4108501374721527, 0.4328407645225525, 0.45483142137527466, 0.4768220782279968, 0.4988127052783966, 0.5208033323287964, 0.5427939891815186, 0.5647846460342407, 0.5867753028869629, 0.6087659001350403, 0.6307565569877625, 0.6527472138404846, 0.674737811088562, 0.6967284679412842, 0.7187191247940063, 0.7407097816467285, 0.7627004384994507, 0.7846910357475281, 0.8066816926002502, 0.8286723494529724, 0.8506629467010498, 0.872653603553772, 0.8946442604064941, 0.9166349172592163, 0.9386255741119385, 0.9606161713600159, 0.982606828212738, 1.0045974254608154, 1.0265880823135376, 1.0485787391662598, 1.070569396018982]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 3.0, 10.0, 11.0, 17.0, 14.0, 18.0, 20.0, 27.0, 29.0, 28.0, 34.0, 41.0, 46.0, 46.0, 38.0, 40.0, 35.0, 49.0, 45.0, 55.0, 40.0, 32.0, 39.0, 32.0, 26.0, 36.0, 28.0, 21.0, 17.0, 10.0, 21.0, 17.0, 6.0, 12.0, 10.0, 4.0, 5.0, 2.0, 7.0, 2.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10927140712738037, -0.10571034252643585, -0.10214927047491074, -0.09858820587396622, -0.0950271338224411, -0.09146606922149658, -0.08790500462055206, -0.08434394001960754, -0.08078286796808243, -0.07722180336713791, -0.07366073131561279, -0.07009966671466827, -0.06653860211372375, -0.06297753006219864, -0.05941646546125412, -0.0558553971350193, -0.052294328808784485, -0.04873326048254967, -0.04517219215631485, -0.04161112755537033, -0.03805005922913551, -0.034488990902900696, -0.030927924439311028, -0.02736685797572136, -0.023805789649486542, -0.020244721323251724, -0.016683654859662056, -0.013122587464749813, -0.00956152006983757, -0.006000451743602753, -0.0024393852800130844, 0.0011216811835765839, 0.004682749509811401, 0.008243816904723644, 0.011804884299635887, 0.01536595169454813, 0.018927019089460373, 0.02248808741569519, 0.02604915387928486, 0.029610220342874527, 0.033171288669109344, 0.03673235699534416, 0.04029342532157898, 0.0438544899225235, 0.047415558248758316, 0.050976626574993134, 0.05453769117593765, 0.05809875950217247, 0.06165982782840729, 0.0652208924293518, 0.06878196448087692, 0.07234302908182144, 0.07590410113334656, 0.07946516573429108, 0.0830262303352356, 0.08658729493618011, 0.09014836698770523, 0.09370943158864975, 0.09727050364017487, 0.10083156824111938, 0.1043926328420639, 0.10795370489358902, 0.11151476949453354, 0.11507584154605865, 0.11863690614700317]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 11.0, 18.0, 12.0, 45.0, 76.0, 116.0, 195.0, 377.0, 722.0, 1807.0, 4766.0, 16212.0, 90575.0, 669365.0, 222942.0, 29224.0, 7425.0, 2499.0, 1046.0, 478.0, 256.0, 156.0, 87.0, 47.0, 42.0, 25.0, 10.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1844482421875, -0.17897415161132812, -0.17350006103515625, -0.16802597045898438, -0.1625518798828125, -0.15707778930664062, -0.15160369873046875, -0.14612960815429688, -0.140655517578125, -0.13518142700195312, -0.12970733642578125, -0.12423324584960938, -0.1187591552734375, -0.11328506469726562, -0.10781097412109375, -0.10233688354492188, -0.09686279296875, -0.09138870239257812, -0.08591461181640625, -0.08044052124023438, -0.0749664306640625, -0.06949234008789062, -0.06401824951171875, -0.058544158935546875, -0.053070068359375, -0.047595977783203125, -0.04212188720703125, -0.036647796630859375, -0.0311737060546875, -0.025699615478515625, -0.02022552490234375, -0.014751434326171875, -0.00927734375, -0.003803253173828125, 0.00167083740234375, 0.007144927978515625, 0.0126190185546875, 0.018093109130859375, 0.02356719970703125, 0.029041290283203125, 0.034515380859375, 0.039989471435546875, 0.04546356201171875, 0.050937652587890625, 0.0564117431640625, 0.061885833740234375, 0.06735992431640625, 0.07283401489257812, 0.07830810546875, 0.08378219604492188, 0.08925628662109375, 0.09473037719726562, 0.1002044677734375, 0.10567855834960938, 0.11115264892578125, 0.11662673950195312, 0.122100830078125, 0.12757492065429688, 0.13304901123046875, 0.13852310180664062, 0.1439971923828125, 0.14947128295898438, 0.15494537353515625, 0.16041946411132812, 0.1658935546875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 11.0, 9.0, 14.0, 11.0, 8.0, 14.0, 14.0, 20.0, 19.0, 28.0, 38.0, 26.0, 36.0, 46.0, 69.0, 46.0, 51.0, 50.0, 49.0, 53.0, 43.0, 43.0, 33.0, 45.0, 31.0, 24.0, 23.0, 26.0, 18.0, 19.0, 8.0, 14.0, 10.0, 7.0, 13.0, 11.0, 2.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03692626953125, -0.035797119140625, -0.03466796875, -0.033538818359375, -0.03240966796875, -0.031280517578125, -0.0301513671875, -0.029022216796875, -0.02789306640625, -0.026763916015625, -0.025634765625, -0.024505615234375, -0.02337646484375, -0.022247314453125, -0.0211181640625, -0.019989013671875, -0.01885986328125, -0.017730712890625, -0.0166015625, -0.015472412109375, -0.01434326171875, -0.013214111328125, -0.0120849609375, -0.010955810546875, -0.00982666015625, -0.008697509765625, -0.007568359375, -0.006439208984375, -0.00531005859375, -0.004180908203125, -0.0030517578125, -0.001922607421875, -0.00079345703125, 0.000335693359375, 0.00146484375, 0.002593994140625, 0.00372314453125, 0.004852294921875, 0.0059814453125, 0.007110595703125, 0.00823974609375, 0.009368896484375, 0.010498046875, 0.011627197265625, 0.01275634765625, 0.013885498046875, 0.0150146484375, 0.016143798828125, 0.01727294921875, 0.018402099609375, 0.01953125, 0.020660400390625, 0.02178955078125, 0.022918701171875, 0.0240478515625, 0.025177001953125, 0.02630615234375, 0.027435302734375, 0.028564453125, 0.029693603515625, 0.03082275390625, 0.031951904296875, 0.0330810546875, 0.034210205078125, 0.03533935546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 11.0, 8.0, 11.0, 13.0, 7.0, 16.0, 16.0, 25.0, 25.0, 23.0, 30.0, 28.0, 51.0, 62.0, 119.0, 225.0, 807.0, 5708.0, 204713.0, 806302.0, 27645.0, 1750.0, 373.0, 172.0, 97.0, 52.0, 46.0, 40.0, 33.0, 23.0, 21.0, 19.0, 11.0, 9.0, 16.0, 9.0, 11.0, 1.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.226318359375, -0.2195110321044922, -0.21270370483398438, -0.20589637756347656, -0.19908905029296875, -0.19228172302246094, -0.18547439575195312, -0.1786670684814453, -0.1718597412109375, -0.1650524139404297, -0.15824508666992188, -0.15143775939941406, -0.14463043212890625, -0.13782310485839844, -0.13101577758789062, -0.12420845031738281, -0.117401123046875, -0.11059379577636719, -0.10378646850585938, -0.09697914123535156, -0.09017181396484375, -0.08336448669433594, -0.07655715942382812, -0.06974983215332031, -0.0629425048828125, -0.05613517761230469, -0.049327850341796875, -0.04252052307128906, -0.03571319580078125, -0.028905868530273438, -0.022098541259765625, -0.015291213989257812, -0.00848388671875, -0.0016765594482421875, 0.005130767822265625, 0.011938095092773438, 0.01874542236328125, 0.025552749633789062, 0.032360076904296875, 0.03916740417480469, 0.0459747314453125, 0.05278205871582031, 0.059589385986328125, 0.06639671325683594, 0.07320404052734375, 0.08001136779785156, 0.08681869506835938, 0.09362602233886719, 0.100433349609375, 0.10724067687988281, 0.11404800415039062, 0.12085533142089844, 0.12766265869140625, 0.13446998596191406, 0.14127731323242188, 0.1480846405029297, 0.1548919677734375, 0.1616992950439453, 0.16850662231445312, 0.17531394958496094, 0.18212127685546875, 0.18892860412597656, 0.19573593139648438, 0.2025432586669922, 0.2093505859375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 6.0, 9.0, 8.0, 8.0, 30.0, 22.0, 29.0, 32.0, 36.0, 29.0, 32.0, 52.0, 46.0, 40.0, 48.0, 56.0, 51.0, 43.0, 47.0, 47.0, 46.0, 42.0, 50.0, 25.0, 33.0, 26.0, 26.0, 17.0, 17.0, 13.0, 7.0, 9.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08306884765625, -0.08063697814941406, -0.07820510864257812, -0.07577323913574219, -0.07334136962890625, -0.07090950012207031, -0.06847763061523438, -0.06604576110839844, -0.0636138916015625, -0.06118202209472656, -0.058750152587890625, -0.05631828308105469, -0.05388641357421875, -0.05145454406738281, -0.049022674560546875, -0.04659080505371094, -0.044158935546875, -0.04172706604003906, -0.039295196533203125, -0.03686332702636719, -0.03443145751953125, -0.03199958801269531, -0.029567718505859375, -0.027135848999023438, -0.0247039794921875, -0.022272109985351562, -0.019840240478515625, -0.017408370971679688, -0.01497650146484375, -0.012544631958007812, -0.010112762451171875, -0.0076808929443359375, -0.0052490234375, -0.0028171539306640625, -0.000385284423828125, 0.0020465850830078125, 0.00447845458984375, 0.0069103240966796875, 0.009342193603515625, 0.011774063110351562, 0.0142059326171875, 0.016637802124023438, 0.019069671630859375, 0.021501541137695312, 0.02393341064453125, 0.026365280151367188, 0.028797149658203125, 0.031229019165039062, 0.033660888671875, 0.03609275817871094, 0.038524627685546875, 0.04095649719238281, 0.04338836669921875, 0.04582023620605469, 0.048252105712890625, 0.05068397521972656, 0.0531158447265625, 0.05554771423339844, 0.057979583740234375, 0.06041145324707031, 0.06284332275390625, 0.06527519226074219, 0.06770706176757812, 0.07013893127441406, 0.07257080078125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 8.0, 6.0, 15.0, 26.0, 35.0, 68.0, 121.0, 216.0, 382.0, 676.0, 1332.0, 2773.0, 6607.0, 19841.0, 87252.0, 481732.0, 359943.0, 61747.0, 15584.0, 5338.0, 2380.0, 1111.0, 583.0, 328.0, 186.0, 104.0, 53.0, 39.0, 24.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030975341796875, -0.029903411865234375, -0.02883148193359375, -0.027759552001953125, -0.0266876220703125, -0.025615692138671875, -0.02454376220703125, -0.023471832275390625, -0.02239990234375, -0.021327972412109375, -0.02025604248046875, -0.019184112548828125, -0.0181121826171875, -0.017040252685546875, -0.01596832275390625, -0.014896392822265625, -0.013824462890625, -0.012752532958984375, -0.01168060302734375, -0.010608673095703125, -0.0095367431640625, -0.008464813232421875, -0.00739288330078125, -0.006320953369140625, -0.0052490234375, -0.004177093505859375, -0.00310516357421875, -0.002033233642578125, -0.0009613037109375, 0.000110626220703125, 0.00118255615234375, 0.002254486083984375, 0.003326416015625, 0.004398345947265625, 0.00547027587890625, 0.006542205810546875, 0.0076141357421875, 0.008686065673828125, 0.00975799560546875, 0.010829925537109375, 0.01190185546875, 0.012973785400390625, 0.01404571533203125, 0.015117645263671875, 0.0161895751953125, 0.017261505126953125, 0.01833343505859375, 0.019405364990234375, 0.020477294921875, 0.021549224853515625, 0.02262115478515625, 0.023693084716796875, 0.0247650146484375, 0.025836944580078125, 0.02690887451171875, 0.027980804443359375, 0.029052734375, 0.030124664306640625, 0.03119659423828125, 0.032268524169921875, 0.0333404541015625, 0.034412384033203125, 0.03548431396484375, 0.036556243896484375, 0.037628173828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 9.0, 9.0, 7.0, 10.0, 14.0, 16.0, 12.0, 14.0, 30.0, 31.0, 34.0, 57.0, 52.0, 59.0, 72.0, 70.0, 68.0, 67.0, 61.0, 59.0, 36.0, 43.0, 35.0, 25.0, 17.0, 14.0, 14.0, 13.0, 5.0, 9.0, 3.0, 8.0, 7.0, 7.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3887882232666016e-05, -1.3440847396850586e-05, -1.2993812561035156e-05, -1.2546777725219727e-05, -1.2099742889404297e-05, -1.1652708053588867e-05, -1.1205673217773438e-05, -1.0758638381958008e-05, -1.0311603546142578e-05, -9.864568710327148e-06, -9.417533874511719e-06, -8.970499038696289e-06, -8.52346420288086e-06, -8.07642936706543e-06, -7.62939453125e-06, -7.18235969543457e-06, -6.735324859619141e-06, -6.288290023803711e-06, -5.841255187988281e-06, -5.3942203521728516e-06, -4.947185516357422e-06, -4.500150680541992e-06, -4.0531158447265625e-06, -3.606081008911133e-06, -3.159046173095703e-06, -2.7120113372802734e-06, -2.2649765014648438e-06, -1.817941665649414e-06, -1.3709068298339844e-06, -9.238719940185547e-07, -4.76837158203125e-07, -2.9802322387695312e-08, 4.172325134277344e-07, 8.642673492431641e-07, 1.3113021850585938e-06, 1.7583370208740234e-06, 2.205371856689453e-06, 2.652406692504883e-06, 3.0994415283203125e-06, 3.546476364135742e-06, 3.993511199951172e-06, 4.4405460357666016e-06, 4.887580871582031e-06, 5.334615707397461e-06, 5.781650543212891e-06, 6.22868537902832e-06, 6.67572021484375e-06, 7.12275505065918e-06, 7.569789886474609e-06, 8.016824722290039e-06, 8.463859558105469e-06, 8.910894393920898e-06, 9.357929229736328e-06, 9.804964065551758e-06, 1.0251998901367188e-05, 1.0699033737182617e-05, 1.1146068572998047e-05, 1.1593103408813477e-05, 1.2040138244628906e-05, 1.2487173080444336e-05, 1.2934207916259766e-05, 1.3381242752075195e-05, 1.3828277587890625e-05, 1.4275312423706055e-05, 1.4722347259521484e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 3.0, 7.0, 16.0, 14.0, 18.0, 26.0, 39.0, 43.0, 79.0, 160.0, 488.0, 4207.0, 159915.0, 852133.0, 29446.0, 1410.0, 237.0, 107.0, 55.0, 37.0, 24.0, 24.0, 18.0, 10.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0723876953125, -0.07039308547973633, -0.06839847564697266, -0.06640386581420898, -0.06440925598144531, -0.06241464614868164, -0.06042003631591797, -0.0584254264831543, -0.056430816650390625, -0.05443620681762695, -0.05244159698486328, -0.05044698715209961, -0.04845237731933594, -0.046457767486572266, -0.044463157653808594, -0.04246854782104492, -0.04047393798828125, -0.03847932815551758, -0.036484718322753906, -0.034490108489990234, -0.03249549865722656, -0.03050088882446289, -0.02850627899169922, -0.026511669158935547, -0.024517059326171875, -0.022522449493408203, -0.02052783966064453, -0.01853322982788086, -0.016538619995117188, -0.014544010162353516, -0.012549400329589844, -0.010554790496826172, -0.0085601806640625, -0.006565570831298828, -0.004570960998535156, -0.0025763511657714844, -0.0005817413330078125, 0.0014128684997558594, 0.0034074783325195312, 0.005402088165283203, 0.007396697998046875, 0.009391307830810547, 0.011385917663574219, 0.01338052749633789, 0.015375137329101562, 0.017369747161865234, 0.019364356994628906, 0.021358966827392578, 0.02335357666015625, 0.025348186492919922, 0.027342796325683594, 0.029337406158447266, 0.03133201599121094, 0.03332662582397461, 0.03532123565673828, 0.03731584548950195, 0.039310455322265625, 0.0413050651550293, 0.04329967498779297, 0.04529428482055664, 0.04728889465332031, 0.049283504486083984, 0.051278114318847656, 0.05327272415161133, 0.055267333984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 3.0, 8.0, 17.0, 18.0, 20.0, 25.0, 31.0, 29.0, 48.0, 59.0, 47.0, 76.0, 81.0, 87.0, 67.0, 72.0, 56.0, 52.0, 52.0, 28.0, 29.0, 30.0, 17.0, 11.0, 12.0, 5.0, 6.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.017730712890625, -0.017249584197998047, -0.016768455505371094, -0.01628732681274414, -0.015806198120117188, -0.015325069427490234, -0.014843940734863281, -0.014362812042236328, -0.013881683349609375, -0.013400554656982422, -0.012919425964355469, -0.012438297271728516, -0.011957168579101562, -0.01147603988647461, -0.010994911193847656, -0.010513782501220703, -0.01003265380859375, -0.009551525115966797, -0.009070396423339844, -0.00858926773071289, -0.008108139038085938, -0.007627010345458984, -0.007145881652832031, -0.006664752960205078, -0.006183624267578125, -0.005702495574951172, -0.005221366882324219, -0.004740238189697266, -0.0042591094970703125, -0.0037779808044433594, -0.0032968521118164062, -0.002815723419189453, -0.0023345947265625, -0.0018534660339355469, -0.0013723373413085938, -0.0008912086486816406, -0.0004100799560546875, 7.104873657226562e-05, 0.0005521774291992188, 0.0010333061218261719, 0.001514434814453125, 0.001995563507080078, 0.0024766921997070312, 0.0029578208923339844, 0.0034389495849609375, 0.003920078277587891, 0.004401206970214844, 0.004882335662841797, 0.00536346435546875, 0.005844593048095703, 0.006325721740722656, 0.006806850433349609, 0.0072879791259765625, 0.007769107818603516, 0.008250236511230469, 0.008731365203857422, 0.009212493896484375, 0.009693622589111328, 0.010174751281738281, 0.010655879974365234, 0.011137008666992188, 0.01161813735961914, 0.012099266052246094, 0.012580394744873047, 0.0130615234375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 35.0, 288.0, 518.0, 142.0, 17.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0957276821136475, -1.067823052406311, -1.039918303489685, -1.0120136737823486, -0.9841089248657227, -0.9562042951583862, -0.928299605846405, -0.9003949165344238, -0.8724902272224426, -0.8445855379104614, -0.8166808485984802, -0.788776159286499, -0.7608715295791626, -0.7329667806625366, -0.7050621509552002, -0.677157461643219, -0.6492527723312378, -0.6213480830192566, -0.5934433937072754, -0.5655387043952942, -0.537634015083313, -0.5097293853759766, -0.48182469606399536, -0.45392000675201416, -0.42601531744003296, -0.39811062812805176, -0.37020593881607056, -0.34230127930641174, -0.31439658999443054, -0.28649190068244934, -0.2585872411727905, -0.23068255186080933, -0.20277786254882812, -0.17487317323684692, -0.14696849882602692, -0.11906381696462631, -0.09115913510322571, -0.0632544457912445, -0.0353497713804245, -0.007445096969604492, 0.02045959234237671, 0.04836427420377731, 0.07626895606517792, 0.10417363792657852, 0.13207831978797913, 0.15998300909996033, 0.18788768351078033, 0.21579235792160034, 0.24369704723358154, 0.27160173654556274, 0.29950642585754395, 0.32741108536720276, 0.35531577467918396, 0.38322046399116516, 0.411125123500824, 0.4390298128128052, 0.4669345021247864, 0.4948391914367676, 0.5227438807487488, 0.55064857006073, 0.5785531997680664, 0.6064579486846924, 0.6343625783920288, 0.66226726770401, 0.6901719570159912]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 9.0, 9.0, 11.0, 8.0, 14.0, 9.0, 12.0, 21.0, 16.0, 27.0, 19.0, 30.0, 25.0, 31.0, 26.0, 42.0, 51.0, 42.0, 47.0, 42.0, 36.0, 42.0, 39.0, 37.0, 41.0, 32.0, 36.0, 35.0, 27.0, 20.0, 18.0, 26.0, 15.0, 16.0, 18.0, 11.0, 17.0, 8.0, 3.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0], "bins": [-0.262748122215271, -0.2552414536476135, -0.24773478507995605, -0.24022811651229858, -0.2327214479446411, -0.22521477937698364, -0.21770811080932617, -0.2102014422416687, -0.20269477367401123, -0.19518810510635376, -0.1876814365386963, -0.18017476797103882, -0.17266809940338135, -0.16516143083572388, -0.1576547622680664, -0.15014809370040894, -0.14264141023159027, -0.1351347416639328, -0.12762807309627533, -0.12012140452861786, -0.11261473596096039, -0.10510806739330292, -0.09760139137506485, -0.09009472280740738, -0.08258805423974991, -0.07508138567209244, -0.06757471710443497, -0.0600680448114872, -0.05256137624382973, -0.045054707676172256, -0.03754803538322449, -0.030041366815567017, -0.022534698247909546, -0.0150280287489295, -0.007521359249949455, -1.4688819646835327e-05, 0.007491979748010635, 0.014998648315668106, 0.022505320608615875, 0.030011989176273346, 0.03751865774393082, 0.04502532631158829, 0.05253199487924576, 0.06003866717219353, 0.0675453394651413, 0.07505200803279877, 0.08255867660045624, 0.09006534516811371, 0.09757201373577118, 0.10507868230342865, 0.11258535087108612, 0.12009201943874359, 0.12759868800640106, 0.13510535657405853, 0.1426120400428772, 0.15011870861053467, 0.15762537717819214, 0.1651320457458496, 0.17263871431350708, 0.18014538288116455, 0.18765205144882202, 0.1951587200164795, 0.20266538858413696, 0.21017205715179443, 0.2176787257194519]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 9.0, 11.0, 17.0, 29.0, 46.0, 50.0, 68.0, 111.0, 167.0, 231.0, 351.0, 637.0, 1271.0, 3239.0, 14912.0, 434914.0, 3637741.0, 88037.0, 7914.0, 2148.0, 868.0, 516.0, 343.0, 194.0, 126.0, 98.0, 63.0, 47.0, 34.0, 23.0, 18.0, 16.0, 10.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.1851806640625, -0.18069839477539062, -0.17621612548828125, -0.17173385620117188, -0.1672515869140625, -0.16276931762695312, -0.15828704833984375, -0.15380477905273438, -0.149322509765625, -0.14484024047851562, -0.14035797119140625, -0.13587570190429688, -0.1313934326171875, -0.12691116333007812, -0.12242889404296875, -0.11794662475585938, -0.11346435546875, -0.10898208618164062, -0.10449981689453125, -0.10001754760742188, -0.0955352783203125, -0.09105300903320312, -0.08657073974609375, -0.08208847045898438, -0.077606201171875, -0.07312393188476562, -0.06864166259765625, -0.06415939331054688, -0.0596771240234375, -0.055194854736328125, -0.05071258544921875, -0.046230316162109375, -0.041748046875, -0.037265777587890625, -0.03278350830078125, -0.028301239013671875, -0.0238189697265625, -0.019336700439453125, -0.01485443115234375, -0.010372161865234375, -0.005889892578125, -0.001407623291015625, 0.00307464599609375, 0.007556915283203125, 0.0120391845703125, 0.016521453857421875, 0.02100372314453125, 0.025485992431640625, 0.02996826171875, 0.034450531005859375, 0.03893280029296875, 0.043415069580078125, 0.0478973388671875, 0.052379608154296875, 0.05686187744140625, 0.061344146728515625, 0.065826416015625, 0.07030868530273438, 0.07479095458984375, 0.07927322387695312, 0.0837554931640625, 0.08823776245117188, 0.09272003173828125, 0.09720230102539062, 0.1016845703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 9.0, 6.0, 13.0, 7.0, 17.0, 21.0, 12.0, 22.0, 23.0, 24.0, 43.0, 39.0, 36.0, 53.0, 53.0, 68.0, 61.0, 49.0, 51.0, 45.0, 33.0, 37.0, 50.0, 29.0, 32.0, 26.0, 26.0, 13.0, 20.0, 18.0, 14.0, 7.0, 8.0, 5.0, 6.0, 4.0, 7.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04052734375, -0.03939962387084961, -0.03827190399169922, -0.03714418411254883, -0.03601646423339844, -0.03488874435424805, -0.033761024475097656, -0.032633304595947266, -0.031505584716796875, -0.030377864837646484, -0.029250144958496094, -0.028122425079345703, -0.026994705200195312, -0.025866985321044922, -0.02473926544189453, -0.02361154556274414, -0.02248382568359375, -0.02135610580444336, -0.02022838592529297, -0.019100666046142578, -0.017972946166992188, -0.016845226287841797, -0.015717506408691406, -0.014589786529541016, -0.013462066650390625, -0.012334346771240234, -0.011206626892089844, -0.010078907012939453, -0.008951187133789062, -0.007823467254638672, -0.006695747375488281, -0.005568027496337891, -0.0044403076171875, -0.0033125877380371094, -0.0021848678588867188, -0.0010571479797363281, 7.05718994140625e-05, 0.0011982917785644531, 0.0023260116577148438, 0.0034537315368652344, 0.004581451416015625, 0.005709171295166016, 0.006836891174316406, 0.007964611053466797, 0.009092330932617188, 0.010220050811767578, 0.011347770690917969, 0.01247549057006836, 0.01360321044921875, 0.01473093032836914, 0.01585865020751953, 0.016986370086669922, 0.018114089965820312, 0.019241809844970703, 0.020369529724121094, 0.021497249603271484, 0.022624969482421875, 0.023752689361572266, 0.024880409240722656, 0.026008129119873047, 0.027135848999023438, 0.028263568878173828, 0.02939128875732422, 0.03051900863647461, 0.031646728515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 13.0, 11.0, 20.0, 16.0, 39.0, 41.0, 90.0, 133.0, 227.0, 371.0, 762.0, 1775.0, 6799.0, 44816.0, 526271.0, 3007260.0, 547731.0, 47142.0, 7117.0, 1978.0, 746.0, 383.0, 199.0, 145.0, 62.0, 32.0, 35.0, 15.0, 17.0, 12.0, 3.0, 5.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1004638671875, -0.09705924987792969, -0.09365463256835938, -0.09025001525878906, -0.08684539794921875, -0.08344078063964844, -0.08003616333007812, -0.07663154602050781, -0.0732269287109375, -0.06982231140136719, -0.06641769409179688, -0.06301307678222656, -0.05960845947265625, -0.05620384216308594, -0.052799224853515625, -0.04939460754394531, -0.045989990234375, -0.04258537292480469, -0.039180755615234375, -0.03577613830566406, -0.03237152099609375, -0.028966903686523438, -0.025562286376953125, -0.022157669067382812, -0.0187530517578125, -0.015348434448242188, -0.011943817138671875, -0.008539199829101562, -0.00513458251953125, -0.0017299652099609375, 0.001674652099609375, 0.0050792694091796875, 0.00848388671875, 0.011888504028320312, 0.015293121337890625, 0.018697738647460938, 0.02210235595703125, 0.025506973266601562, 0.028911590576171875, 0.03231620788574219, 0.0357208251953125, 0.03912544250488281, 0.042530059814453125, 0.04593467712402344, 0.04933929443359375, 0.05274391174316406, 0.056148529052734375, 0.05955314636230469, 0.062957763671875, 0.06636238098144531, 0.06976699829101562, 0.07317161560058594, 0.07657623291015625, 0.07998085021972656, 0.08338546752929688, 0.08679008483886719, 0.0901947021484375, 0.09359931945800781, 0.09700393676757812, 0.10040855407714844, 0.10381317138671875, 0.10721778869628906, 0.11062240600585938, 0.11402702331542969, 0.117431640625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 12.0, 13.0, 10.0, 20.0, 22.0, 49.0, 48.0, 71.0, 110.0, 155.0, 213.0, 291.0, 404.0, 557.0, 628.0, 409.0, 292.0, 230.0, 186.0, 107.0, 71.0, 52.0, 37.0, 22.0, 27.0, 11.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.057373046875, -0.05578899383544922, -0.05420494079589844, -0.052620887756347656, -0.051036834716796875, -0.049452781677246094, -0.04786872863769531, -0.04628467559814453, -0.04470062255859375, -0.04311656951904297, -0.04153251647949219, -0.039948463439941406, -0.038364410400390625, -0.036780357360839844, -0.03519630432128906, -0.03361225128173828, -0.0320281982421875, -0.03044414520263672, -0.028860092163085938, -0.027276039123535156, -0.025691986083984375, -0.024107933044433594, -0.022523880004882812, -0.02093982696533203, -0.01935577392578125, -0.01777172088623047, -0.016187667846679688, -0.014603614807128906, -0.013019561767578125, -0.011435508728027344, -0.009851455688476562, -0.008267402648925781, -0.006683349609375, -0.005099296569824219, -0.0035152435302734375, -0.0019311904907226562, -0.000347137451171875, 0.0012369155883789062, 0.0028209686279296875, 0.004405021667480469, 0.00598907470703125, 0.007573127746582031, 0.009157180786132812, 0.010741233825683594, 0.012325286865234375, 0.013909339904785156, 0.015493392944335938, 0.01707744598388672, 0.0186614990234375, 0.02024555206298828, 0.021829605102539062, 0.023413658142089844, 0.024997711181640625, 0.026581764221191406, 0.028165817260742188, 0.02974987030029297, 0.03133392333984375, 0.03291797637939453, 0.03450202941894531, 0.036086082458496094, 0.037670135498046875, 0.039254188537597656, 0.04083824157714844, 0.04242229461669922, 0.04400634765625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 7.0, 11.0, 39.0, 183.0, 420.0, 267.0, 67.0, 17.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19105690717697144, -0.16678118705749512, -0.14250548183918, -0.11822976917028427, -0.09395405650138855, -0.06967834383249283, -0.04540263116359711, -0.021126925945281982, 0.003148794174194336, 0.027424506843090057, 0.05170021951198578, 0.0759759321808815, 0.10025164484977722, 0.12452735751867294, 0.14880307018756866, 0.1730787754058838, 0.1973544955253601, 0.22163021564483643, 0.24590592086315155, 0.2701816260814667, 0.294457346200943, 0.3187330663204193, 0.34300875663757324, 0.36728447675704956, 0.3915601968765259, 0.4158359169960022, 0.4401116371154785, 0.46438732743263245, 0.48866304755210876, 0.5129387378692627, 0.537214457988739, 0.5614901781082153, 0.5857658386230469, 0.6100415587425232, 0.6343172788619995, 0.6585929989814758, 0.6828687191009521, 0.7071443796157837, 0.73142009973526, 0.7556958198547363, 0.7799715399742126, 0.804247260093689, 0.8285229802131653, 0.8527987003326416, 0.8770743608474731, 0.9013500809669495, 0.9256258010864258, 0.9499015212059021, 0.9741772413253784, 0.9984529614448547, 1.022728681564331, 1.0470043420791626, 1.0712801218032837, 1.0955557823181152, 1.1198315620422363, 1.1441072225570679, 1.1683828830718994, 1.192658543586731, 1.216934323310852, 1.2412099838256836, 1.2654857635498047, 1.2897614240646362, 1.3140372037887573, 1.3383128643035889, 1.36258864402771]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 8.0, 11.0, 11.0, 14.0, 13.0, 19.0, 20.0, 24.0, 29.0, 43.0, 41.0, 38.0, 41.0, 33.0, 50.0, 44.0, 47.0, 40.0, 44.0, 46.0, 49.0, 34.0, 39.0, 25.0, 31.0, 42.0, 30.0, 27.0, 22.0, 16.0, 16.0, 18.0, 9.0, 5.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16983050107955933, -0.16446751356124878, -0.15910452604293823, -0.15374153852462769, -0.14837855100631714, -0.1430155485868454, -0.13765256106853485, -0.1322895735502243, -0.12692658603191376, -0.12156359851360321, -0.11620061099529266, -0.11083761602640152, -0.10547462850809097, -0.10011164098978043, -0.09474864602088928, -0.08938565850257874, -0.08402267098426819, -0.07865968346595764, -0.0732966959476471, -0.06793370097875595, -0.0625707134604454, -0.05720772594213486, -0.05184473469853401, -0.046481743454933167, -0.04111875593662262, -0.03575576841831207, -0.030392777174711227, -0.02502978779375553, -0.019666798412799835, -0.014303809031844139, -0.008940819650888443, -0.0035778284072875977, 0.0017851591110229492, 0.007148148491978645, 0.012511137872934341, 0.017874127253890038, 0.023237116634845734, 0.02860010601580143, 0.033963095396757126, 0.03932608664035797, 0.04468907415866852, 0.050052061676979065, 0.05541505292057991, 0.060778044164180756, 0.0661410316824913, 0.07150401920080185, 0.076867014169693, 0.08223000168800354, 0.08759298920631409, 0.09295597672462463, 0.09831896424293518, 0.10368195921182632, 0.10904494673013687, 0.11440793424844742, 0.11977092921733856, 0.1251339167356491, 0.13049690425395966, 0.1358598917722702, 0.14122287929058075, 0.1465858668088913, 0.15194886922836304, 0.15731185674667358, 0.16267484426498413, 0.16803783178329468, 0.17340081930160522]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 3.0, 6.0, 8.0, 10.0, 5.0, 21.0, 29.0, 39.0, 67.0, 80.0, 151.0, 231.0, 463.0, 1014.0, 2028.0, 4058.0, 9154.0, 22253.0, 69781.0, 289077.0, 455123.0, 133379.0, 36622.0, 13487.0, 5848.0, 2769.0, 1314.0, 644.0, 336.0, 192.0, 117.0, 78.0, 49.0, 28.0, 24.0, 13.0, 6.0, 10.0, 8.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11053466796875, -0.10710525512695312, -0.10367584228515625, -0.10024642944335938, -0.0968170166015625, -0.09338760375976562, -0.08995819091796875, -0.08652877807617188, -0.083099365234375, -0.07966995239257812, -0.07624053955078125, -0.07281112670898438, -0.0693817138671875, -0.06595230102539062, -0.06252288818359375, -0.059093475341796875, -0.0556640625, -0.052234649658203125, -0.04880523681640625, -0.045375823974609375, -0.0419464111328125, -0.038516998291015625, -0.03508758544921875, -0.031658172607421875, -0.028228759765625, -0.024799346923828125, -0.02136993408203125, -0.017940521240234375, -0.0145111083984375, -0.011081695556640625, -0.00765228271484375, -0.004222869873046875, -0.00079345703125, 0.002635955810546875, 0.00606536865234375, 0.009494781494140625, 0.0129241943359375, 0.016353607177734375, 0.01978302001953125, 0.023212432861328125, 0.026641845703125, 0.030071258544921875, 0.03350067138671875, 0.036930084228515625, 0.0403594970703125, 0.043788909912109375, 0.04721832275390625, 0.050647735595703125, 0.0540771484375, 0.057506561279296875, 0.06093597412109375, 0.06436538696289062, 0.0677947998046875, 0.07122421264648438, 0.07465362548828125, 0.07808303833007812, 0.081512451171875, 0.08494186401367188, 0.08837127685546875, 0.09180068969726562, 0.0952301025390625, 0.09865951538085938, 0.10208892822265625, 0.10551834106445312, 0.10894775390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 9.0, 8.0, 10.0, 21.0, 26.0, 21.0, 15.0, 34.0, 29.0, 45.0, 50.0, 74.0, 63.0, 56.0, 62.0, 58.0, 52.0, 50.0, 55.0, 36.0, 34.0, 31.0, 33.0, 19.0, 22.0, 14.0, 14.0, 10.0, 8.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0419921875, -0.0407414436340332, -0.039490699768066406, -0.03823995590209961, -0.03698921203613281, -0.035738468170166016, -0.03448772430419922, -0.03323698043823242, -0.031986236572265625, -0.030735492706298828, -0.02948474884033203, -0.028234004974365234, -0.026983261108398438, -0.02573251724243164, -0.024481773376464844, -0.023231029510498047, -0.02198028564453125, -0.020729541778564453, -0.019478797912597656, -0.01822805404663086, -0.016977310180664062, -0.015726566314697266, -0.014475822448730469, -0.013225078582763672, -0.011974334716796875, -0.010723590850830078, -0.009472846984863281, -0.008222103118896484, -0.0069713592529296875, -0.005720615386962891, -0.004469871520996094, -0.003219127655029297, -0.0019683837890625, -0.0007176399230957031, 0.0005331039428710938, 0.0017838478088378906, 0.0030345916748046875, 0.004285335540771484, 0.005536079406738281, 0.006786823272705078, 0.008037567138671875, 0.009288311004638672, 0.010539054870605469, 0.011789798736572266, 0.013040542602539062, 0.01429128646850586, 0.015542030334472656, 0.016792774200439453, 0.01804351806640625, 0.019294261932373047, 0.020545005798339844, 0.02179574966430664, 0.023046493530273438, 0.024297237396240234, 0.02554798126220703, 0.026798725128173828, 0.028049468994140625, 0.029300212860107422, 0.03055095672607422, 0.031801700592041016, 0.03305244445800781, 0.03430318832397461, 0.035553932189941406, 0.0368046760559082, 0.038055419921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 8.0, 5.0, 8.0, 13.0, 16.0, 15.0, 22.0, 24.0, 33.0, 31.0, 61.0, 87.0, 159.0, 295.0, 714.0, 2356.0, 8325.0, 36680.0, 315039.0, 586801.0, 77761.0, 14192.0, 3767.0, 1132.0, 409.0, 199.0, 124.0, 75.0, 46.0, 34.0, 24.0, 19.0, 14.0, 16.0, 8.0, 8.0, 9.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15234375, -0.147125244140625, -0.14190673828125, -0.136688232421875, -0.1314697265625, -0.126251220703125, -0.12103271484375, -0.115814208984375, -0.110595703125, -0.105377197265625, -0.10015869140625, -0.094940185546875, -0.0897216796875, -0.084503173828125, -0.07928466796875, -0.074066162109375, -0.06884765625, -0.063629150390625, -0.05841064453125, -0.053192138671875, -0.0479736328125, -0.042755126953125, -0.03753662109375, -0.032318115234375, -0.027099609375, -0.021881103515625, -0.01666259765625, -0.011444091796875, -0.0062255859375, -0.001007080078125, 0.00421142578125, 0.009429931640625, 0.0146484375, 0.019866943359375, 0.02508544921875, 0.030303955078125, 0.0355224609375, 0.040740966796875, 0.04595947265625, 0.051177978515625, 0.056396484375, 0.061614990234375, 0.06683349609375, 0.072052001953125, 0.0772705078125, 0.082489013671875, 0.08770751953125, 0.092926025390625, 0.09814453125, 0.103363037109375, 0.10858154296875, 0.113800048828125, 0.1190185546875, 0.124237060546875, 0.12945556640625, 0.134674072265625, 0.139892578125, 0.145111083984375, 0.15032958984375, 0.155548095703125, 0.1607666015625, 0.165985107421875, 0.17120361328125, 0.176422119140625, 0.181640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 9.0, 9.0, 4.0, 15.0, 10.0, 11.0, 12.0, 22.0, 27.0, 11.0, 31.0, 34.0, 34.0, 44.0, 41.0, 56.0, 32.0, 29.0, 41.0, 39.0, 39.0, 43.0, 43.0, 51.0, 32.0, 30.0, 40.0, 25.0, 20.0, 22.0, 19.0, 18.0, 10.0, 16.0, 17.0, 13.0, 10.0, 7.0, 12.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.0743408203125, -0.07210731506347656, -0.06987380981445312, -0.06764030456542969, -0.06540679931640625, -0.06317329406738281, -0.060939788818359375, -0.05870628356933594, -0.0564727783203125, -0.05423927307128906, -0.052005767822265625, -0.04977226257324219, -0.04753875732421875, -0.04530525207519531, -0.043071746826171875, -0.04083824157714844, -0.038604736328125, -0.03637123107910156, -0.034137725830078125, -0.03190422058105469, -0.02967071533203125, -0.027437210083007812, -0.025203704833984375, -0.022970199584960938, -0.0207366943359375, -0.018503189086914062, -0.016269683837890625, -0.014036178588867188, -0.01180267333984375, -0.009569168090820312, -0.007335662841796875, -0.0051021575927734375, -0.00286865234375, -0.0006351470947265625, 0.001598358154296875, 0.0038318634033203125, 0.00606536865234375, 0.008298873901367188, 0.010532379150390625, 0.012765884399414062, 0.0149993896484375, 0.017232894897460938, 0.019466400146484375, 0.021699905395507812, 0.02393341064453125, 0.026166915893554688, 0.028400421142578125, 0.030633926391601562, 0.032867431640625, 0.03510093688964844, 0.037334442138671875, 0.03956794738769531, 0.04180145263671875, 0.04403495788574219, 0.046268463134765625, 0.04850196838378906, 0.0507354736328125, 0.05296897888183594, 0.055202484130859375, 0.05743598937988281, 0.05966949462890625, 0.06190299987792969, 0.06413650512695312, 0.06637001037597656, 0.068603515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 4.0, 4.0, 11.0, 9.0, 10.0, 15.0, 25.0, 45.0, 78.0, 84.0, 195.0, 338.0, 584.0, 1026.0, 2014.0, 4627.0, 11250.0, 39170.0, 296047.0, 579611.0, 82696.0, 18099.0, 6507.0, 2925.0, 1485.0, 731.0, 392.0, 222.0, 126.0, 80.0, 51.0, 31.0, 25.0, 8.0, 14.0, 2.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09588623046875, -0.09330940246582031, -0.09073257446289062, -0.08815574645996094, -0.08557891845703125, -0.08300209045410156, -0.08042526245117188, -0.07784843444824219, -0.0752716064453125, -0.07269477844238281, -0.07011795043945312, -0.06754112243652344, -0.06496429443359375, -0.06238746643066406, -0.059810638427734375, -0.05723381042480469, -0.054656982421875, -0.05208015441894531, -0.049503326416015625, -0.04692649841308594, -0.04434967041015625, -0.04177284240722656, -0.039196014404296875, -0.03661918640136719, -0.0340423583984375, -0.03146553039550781, -0.028888702392578125, -0.026311874389648438, -0.02373504638671875, -0.021158218383789062, -0.018581390380859375, -0.016004562377929688, -0.013427734375, -0.010850906372070312, -0.008274078369140625, -0.0056972503662109375, -0.00312042236328125, -0.0005435943603515625, 0.002033233642578125, 0.0046100616455078125, 0.0071868896484375, 0.009763717651367188, 0.012340545654296875, 0.014917373657226562, 0.01749420166015625, 0.020071029663085938, 0.022647857666015625, 0.025224685668945312, 0.027801513671875, 0.030378341674804688, 0.032955169677734375, 0.03553199768066406, 0.03810882568359375, 0.04068565368652344, 0.043262481689453125, 0.04583930969238281, 0.0484161376953125, 0.05099296569824219, 0.053569793701171875, 0.05614662170410156, 0.05872344970703125, 0.06130027770996094, 0.06387710571289062, 0.06645393371582031, 0.06903076171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 7.0, 9.0, 13.0, 22.0, 47.0, 71.0, 84.0, 122.0, 170.0, 133.0, 103.0, 80.0, 56.0, 28.0, 21.0, 12.0, 10.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7087669372558594e-05, -4.5933760702610016e-05, -4.477985203266144e-05, -4.362594336271286e-05, -4.247203469276428e-05, -4.1318126022815704e-05, -4.0164217352867126e-05, -3.901030868291855e-05, -3.785640001296997e-05, -3.670249134302139e-05, -3.5548582673072815e-05, -3.439467400312424e-05, -3.324076533317566e-05, -3.208685666322708e-05, -3.0932947993278503e-05, -2.9779039323329926e-05, -2.8625130653381348e-05, -2.747122198343277e-05, -2.6317313313484192e-05, -2.5163404643535614e-05, -2.4009495973587036e-05, -2.2855587303638458e-05, -2.170167863368988e-05, -2.0547769963741302e-05, -1.9393861293792725e-05, -1.8239952623844147e-05, -1.708604395389557e-05, -1.593213528394699e-05, -1.4778226613998413e-05, -1.3624317944049835e-05, -1.2470409274101257e-05, -1.131650060415268e-05, -1.0162591934204102e-05, -9.008683264255524e-06, -7.854774594306946e-06, -6.700865924358368e-06, -5.54695725440979e-06, -4.393048584461212e-06, -3.2391399145126343e-06, -2.0852312445640564e-06, -9.313225746154785e-07, 2.2258609533309937e-07, 1.3764947652816772e-06, 2.530403435230255e-06, 3.684312105178833e-06, 4.838220775127411e-06, 5.992129445075989e-06, 7.146038115024567e-06, 8.299946784973145e-06, 9.453855454921722e-06, 1.06077641248703e-05, 1.1761672794818878e-05, 1.2915581464767456e-05, 1.4069490134716034e-05, 1.5223398804664612e-05, 1.637730747461319e-05, 1.7531216144561768e-05, 1.8685124814510345e-05, 1.9839033484458923e-05, 2.09929421544075e-05, 2.214685082435608e-05, 2.3300759494304657e-05, 2.4454668164253235e-05, 2.5608576834201813e-05, 2.676248550415039e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 7.0, 8.0, 6.0, 21.0, 30.0, 66.0, 206.0, 743.0, 4271.0, 42220.0, 822281.0, 167389.0, 9401.0, 1389.0, 297.0, 104.0, 50.0, 27.0, 13.0, 5.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.126708984375, -0.122711181640625, -0.11871337890625, -0.114715576171875, -0.1107177734375, -0.106719970703125, -0.10272216796875, -0.098724365234375, -0.0947265625, -0.090728759765625, -0.08673095703125, -0.082733154296875, -0.0787353515625, -0.074737548828125, -0.07073974609375, -0.066741943359375, -0.062744140625, -0.058746337890625, -0.05474853515625, -0.050750732421875, -0.0467529296875, -0.042755126953125, -0.03875732421875, -0.034759521484375, -0.03076171875, -0.026763916015625, -0.02276611328125, -0.018768310546875, -0.0147705078125, -0.010772705078125, -0.00677490234375, -0.002777099609375, 0.001220703125, 0.005218505859375, 0.00921630859375, 0.013214111328125, 0.0172119140625, 0.021209716796875, 0.02520751953125, 0.029205322265625, 0.033203125, 0.037200927734375, 0.04119873046875, 0.045196533203125, 0.0491943359375, 0.053192138671875, 0.05718994140625, 0.061187744140625, 0.065185546875, 0.069183349609375, 0.07318115234375, 0.077178955078125, 0.0811767578125, 0.085174560546875, 0.08917236328125, 0.093170166015625, 0.09716796875, 0.101165771484375, 0.10516357421875, 0.109161376953125, 0.1131591796875, 0.117156982421875, 0.12115478515625, 0.125152587890625, 0.129150390625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 6.0, 2.0, 1.0, 4.0, 8.0, 13.0, 16.0, 34.0, 45.0, 64.0, 94.0, 121.0, 106.0, 136.0, 115.0, 84.0, 54.0, 30.0, 21.0, 17.0, 8.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0552978515625, -0.05375099182128906, -0.052204132080078125, -0.05065727233886719, -0.04911041259765625, -0.04756355285644531, -0.046016693115234375, -0.04446983337402344, -0.0429229736328125, -0.04137611389160156, -0.039829254150390625, -0.03828239440917969, -0.03673553466796875, -0.03518867492675781, -0.033641815185546875, -0.03209495544433594, -0.030548095703125, -0.029001235961914062, -0.027454376220703125, -0.025907516479492188, -0.02436065673828125, -0.022813796997070312, -0.021266937255859375, -0.019720077514648438, -0.0181732177734375, -0.016626358032226562, -0.015079498291015625, -0.013532638549804688, -0.01198577880859375, -0.010438919067382812, -0.008892059326171875, -0.0073451995849609375, -0.00579833984375, -0.0042514801025390625, -0.002704620361328125, -0.0011577606201171875, 0.00038909912109375, 0.0019359588623046875, 0.003482818603515625, 0.0050296783447265625, 0.0065765380859375, 0.008123397827148438, 0.009670257568359375, 0.011217117309570312, 0.01276397705078125, 0.014310836791992188, 0.015857696533203125, 0.017404556274414062, 0.018951416015625, 0.020498275756835938, 0.022045135498046875, 0.023591995239257812, 0.02513885498046875, 0.026685714721679688, 0.028232574462890625, 0.029779434204101562, 0.0313262939453125, 0.03287315368652344, 0.034420013427734375, 0.03596687316894531, 0.03751373291015625, 0.03906059265136719, 0.040607452392578125, 0.04215431213378906, 0.043701171875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 14.0, 20.0, 52.0, 106.0, 195.0, 228.0, 162.0, 118.0, 57.0, 20.0, 9.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21428444981575012, -0.19954802095890045, -0.18481160700321198, -0.1700751781463623, -0.15533876419067383, -0.14060233533382416, -0.1258659064769745, -0.11112948507070541, -0.09639306366443634, -0.08165664225816727, -0.0669202208518982, -0.05218379199504852, -0.03744737058877945, -0.022710949182510376, -0.007974520325660706, 0.006761901080608368, 0.02149832248687744, 0.036234743893146515, 0.05097116902470589, 0.06570759415626526, 0.08044401556253433, 0.0951804369688034, 0.10991686582565308, 0.12465328723192215, 0.13938970863819122, 0.1541261374950409, 0.16886255145072937, 0.18359898030757904, 0.1983354091644287, 0.2130718231201172, 0.22780825197696686, 0.24254468083381653, 0.2572811245918274, 0.27201753854751587, 0.28675398230552673, 0.3014903962612152, 0.3162268102169037, 0.33096325397491455, 0.345699667930603, 0.3604360818862915, 0.37517249584198, 0.38990890979766846, 0.4046453535556793, 0.4193817675113678, 0.4341181814670563, 0.44885462522506714, 0.4635910391807556, 0.4783274531364441, 0.49306389689445496, 0.5078003406524658, 0.5225367546081543, 0.5372731685638428, 0.5520095825195312, 0.5667459964752197, 0.5814824104309082, 0.5962188839912415, 0.6109552979469299, 0.6256917119026184, 0.6404281258583069, 0.6551645994186401, 0.6699010133743286, 0.6846374273300171, 0.6993738412857056, 0.714110255241394, 0.7288466691970825]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 3.0, 6.0, 12.0, 9.0, 4.0, 12.0, 17.0, 17.0, 19.0, 20.0, 22.0, 26.0, 28.0, 29.0, 25.0, 33.0, 34.0, 41.0, 38.0, 34.0, 49.0, 34.0, 34.0, 32.0, 39.0, 32.0, 37.0, 41.0, 35.0, 31.0, 28.0, 29.0, 33.0, 19.0, 15.0, 12.0, 11.0, 16.0, 9.0, 5.0, 7.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.20495587587356567, -0.19831247627735138, -0.1916690617799759, -0.1850256621837616, -0.1783822476863861, -0.17173884809017181, -0.16509544849395752, -0.15845203399658203, -0.15180861949920654, -0.14516521990299225, -0.13852180540561676, -0.13187840580940247, -0.12523499131202698, -0.11859159171581268, -0.11194818466901779, -0.1053047776222229, -0.0986613780260086, -0.09201797097921371, -0.08537456393241882, -0.07873116433620453, -0.07208774983882904, -0.06544435024261475, -0.058800943195819855, -0.05215753614902496, -0.04551412910223007, -0.03887072205543518, -0.03222731500864029, -0.025583911687135696, -0.018940504640340805, -0.012297097593545914, -0.005653694272041321, 0.0009897127747535706, 0.007633119821548462, 0.014276525937020779, 0.020919932052493095, 0.027563337236642838, 0.03420674428343773, 0.04085015133023262, 0.04749355465173721, 0.054136961698532104, 0.060780368745326996, 0.06742377579212189, 0.07406718283891678, 0.08071058988571167, 0.08735398948192596, 0.09399740397930145, 0.10064080357551575, 0.10728421062231064, 0.11392761766910553, 0.12057102471590042, 0.1272144317626953, 0.1338578313589096, 0.1405012458562851, 0.1471446454524994, 0.15378805994987488, 0.16043145954608917, 0.16707485914230347, 0.17371825873851776, 0.18036167323589325, 0.18700507283210754, 0.19364848732948303, 0.20029188692569733, 0.20693528652191162, 0.2135787010192871, 0.2202221155166626]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 4.0, 10.0, 15.0, 21.0, 29.0, 40.0, 46.0, 60.0, 73.0, 115.0, 161.0, 237.0, 377.0, 645.0, 1119.0, 2198.0, 4330.0, 10398.0, 31711.0, 158759.0, 1174488.0, 2233106.0, 471118.0, 71746.0, 19083.0, 7184.0, 3214.0, 1661.0, 872.0, 502.0, 324.0, 179.0, 142.0, 86.0, 47.0, 47.0, 36.0, 21.0, 15.0, 16.0, 8.0, 7.0, 3.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052581787109375, -0.050844669342041016, -0.04910755157470703, -0.04737043380737305, -0.04563331604003906, -0.04389619827270508, -0.042159080505371094, -0.04042196273803711, -0.038684844970703125, -0.03694772720336914, -0.035210609436035156, -0.03347349166870117, -0.03173637390136719, -0.029999256134033203, -0.02826213836669922, -0.026525020599365234, -0.02478790283203125, -0.023050785064697266, -0.02131366729736328, -0.019576549530029297, -0.017839431762695312, -0.016102313995361328, -0.014365196228027344, -0.01262807846069336, -0.010890960693359375, -0.00915384292602539, -0.007416725158691406, -0.005679607391357422, -0.0039424896240234375, -0.002205371856689453, -0.00046825408935546875, 0.0012688636779785156, 0.0030059814453125, 0.004743099212646484, 0.006480216979980469, 0.008217334747314453, 0.009954452514648438, 0.011691570281982422, 0.013428688049316406, 0.01516580581665039, 0.016902923583984375, 0.01864004135131836, 0.020377159118652344, 0.022114276885986328, 0.023851394653320312, 0.025588512420654297, 0.02732563018798828, 0.029062747955322266, 0.03079986572265625, 0.032536983489990234, 0.03427410125732422, 0.0360112190246582, 0.03774833679199219, 0.03948545455932617, 0.041222572326660156, 0.04295969009399414, 0.044696807861328125, 0.04643392562866211, 0.048171043395996094, 0.04990816116333008, 0.05164527893066406, 0.05338239669799805, 0.05511951446533203, 0.056856632232666016, 0.05859375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 3.0, 5.0, 8.0, 7.0, 14.0, 16.0, 24.0, 17.0, 19.0, 25.0, 32.0, 32.0, 44.0, 51.0, 66.0, 73.0, 59.0, 64.0, 72.0, 38.0, 53.0, 43.0, 35.0, 31.0, 41.0, 31.0, 29.0, 15.0, 12.0, 11.0, 12.0, 7.0, 5.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03973388671875, -0.03845643997192383, -0.037178993225097656, -0.035901546478271484, -0.03462409973144531, -0.03334665298461914, -0.03206920623779297, -0.030791759490966797, -0.029514312744140625, -0.028236865997314453, -0.02695941925048828, -0.02568197250366211, -0.024404525756835938, -0.023127079010009766, -0.021849632263183594, -0.020572185516357422, -0.01929473876953125, -0.018017292022705078, -0.016739845275878906, -0.015462398529052734, -0.014184951782226562, -0.01290750503540039, -0.011630058288574219, -0.010352611541748047, -0.009075164794921875, -0.007797718048095703, -0.006520271301269531, -0.005242824554443359, -0.0039653778076171875, -0.0026879310607910156, -0.0014104843139648438, -0.00013303756713867188, 0.0011444091796875, 0.002421855926513672, 0.0036993026733398438, 0.004976749420166016, 0.0062541961669921875, 0.007531642913818359, 0.008809089660644531, 0.010086536407470703, 0.011363983154296875, 0.012641429901123047, 0.013918876647949219, 0.01519632339477539, 0.016473770141601562, 0.017751216888427734, 0.019028663635253906, 0.020306110382080078, 0.02158355712890625, 0.022861003875732422, 0.024138450622558594, 0.025415897369384766, 0.026693344116210938, 0.02797079086303711, 0.02924823760986328, 0.030525684356689453, 0.031803131103515625, 0.0330805778503418, 0.03435802459716797, 0.03563547134399414, 0.03691291809082031, 0.038190364837646484, 0.039467811584472656, 0.04074525833129883, 0.042022705078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 8.0, 10.0, 23.0, 26.0, 61.0, 71.0, 124.0, 238.0, 555.0, 1871.0, 18183.0, 838869.0, 3232052.0, 95835.0, 4668.0, 931.0, 338.0, 169.0, 98.0, 50.0, 43.0, 17.0, 19.0, 7.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1566162109375, -0.15175819396972656, -0.14690017700195312, -0.1420421600341797, -0.13718414306640625, -0.1323261260986328, -0.12746810913085938, -0.12261009216308594, -0.1177520751953125, -0.11289405822753906, -0.10803604125976562, -0.10317802429199219, -0.09832000732421875, -0.09346199035644531, -0.08860397338867188, -0.08374595642089844, -0.078887939453125, -0.07402992248535156, -0.06917190551757812, -0.06431388854980469, -0.05945587158203125, -0.05459785461425781, -0.049739837646484375, -0.04488182067871094, -0.0400238037109375, -0.03516578674316406, -0.030307769775390625, -0.025449752807617188, -0.02059173583984375, -0.015733718872070312, -0.010875701904296875, -0.0060176849365234375, -0.00115966796875, 0.0036983489990234375, 0.008556365966796875, 0.013414382934570312, 0.01827239990234375, 0.023130416870117188, 0.027988433837890625, 0.03284645080566406, 0.0377044677734375, 0.04256248474121094, 0.047420501708984375, 0.05227851867675781, 0.05713653564453125, 0.06199455261230469, 0.06685256958007812, 0.07171058654785156, 0.076568603515625, 0.08142662048339844, 0.08628463745117188, 0.09114265441894531, 0.09600067138671875, 0.10085868835449219, 0.10571670532226562, 0.11057472229003906, 0.1154327392578125, 0.12029075622558594, 0.12514877319335938, 0.1300067901611328, 0.13486480712890625, 0.1397228240966797, 0.14458084106445312, 0.14943885803222656, 0.154296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 14.0, 11.0, 20.0, 24.0, 60.0, 82.0, 142.0, 228.0, 373.0, 488.0, 556.0, 623.0, 482.0, 330.0, 228.0, 154.0, 83.0, 67.0, 42.0, 28.0, 13.0, 10.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.077392578125, -0.07497119903564453, -0.07254981994628906, -0.0701284408569336, -0.06770706176757812, -0.06528568267822266, -0.06286430358886719, -0.06044292449951172, -0.05802154541015625, -0.05560016632080078, -0.05317878723144531, -0.050757408142089844, -0.048336029052734375, -0.045914649963378906, -0.04349327087402344, -0.04107189178466797, -0.0386505126953125, -0.03622913360595703, -0.03380775451660156, -0.031386375427246094, -0.028964996337890625, -0.026543617248535156, -0.024122238159179688, -0.02170085906982422, -0.01927947998046875, -0.01685810089111328, -0.014436721801757812, -0.012015342712402344, -0.009593963623046875, -0.007172584533691406, -0.0047512054443359375, -0.0023298263549804688, 9.1552734375e-05, 0.0025129318237304688, 0.0049343109130859375, 0.007355690002441406, 0.009777069091796875, 0.012198448181152344, 0.014619827270507812, 0.01704120635986328, 0.01946258544921875, 0.02188396453857422, 0.024305343627929688, 0.026726722717285156, 0.029148101806640625, 0.031569480895996094, 0.03399085998535156, 0.03641223907470703, 0.0388336181640625, 0.04125499725341797, 0.04367637634277344, 0.046097755432128906, 0.048519134521484375, 0.050940513610839844, 0.05336189270019531, 0.05578327178955078, 0.05820465087890625, 0.06062602996826172, 0.06304740905761719, 0.06546878814697266, 0.06789016723632812, 0.0703115463256836, 0.07273292541503906, 0.07515430450439453, 0.07757568359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 8.0, 173.0, 618.0, 204.0, 13.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1681140810251236, -0.1209784746170044, -0.0738428607583046, -0.026707246899604797, 0.020428359508514404, 0.0675639659166336, 0.114699587225914, 0.161835178732872, 0.2089708000421524, 0.2561064064502716, 0.303242027759552, 0.35037761926651, 0.3975132405757904, 0.4446488618850708, 0.4917844533920288, 0.5389200448989868, 0.5860556960105896, 0.6331912875175476, 0.6803269386291504, 0.7274625301361084, 0.7745981216430664, 0.8217337131500244, 0.8688693642616272, 0.9160049557685852, 0.9631405472755432, 1.010276198387146, 1.057411789894104, 1.104547381401062, 1.15168297290802, 1.198818564414978, 1.2459542751312256, 1.2930898666381836, 1.340225338935852, 1.38736093044281, 1.434496521949768, 1.4816322326660156, 1.5287678241729736, 1.5759034156799316, 1.6230390071868896, 1.6701745986938477, 1.7173101902008057, 1.7644457817077637, 1.8115813732147217, 1.8587169647216797, 1.9058526754379272, 1.9529882669448853, 2.000123977661133, 2.0472593307495117, 2.094395160675049, 2.141530752182007, 2.188666343688965, 2.235801935195923, 2.282937526702881, 2.330073118209839, 2.377208709716797, 2.424344539642334, 2.471479892730713, 2.518615484237671, 2.565751075744629, 2.612886667251587, 2.660022258758545, 2.707157850265503, 2.754293441772461, 2.801429271697998, 2.848564863204956]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 6.0, 10.0, 7.0, 17.0, 16.0, 17.0, 21.0, 29.0, 29.0, 33.0, 33.0, 28.0, 33.0, 53.0, 35.0, 39.0, 45.0, 49.0, 44.0, 28.0, 45.0, 53.0, 41.0, 31.0, 36.0, 31.0, 27.0, 26.0, 18.0, 18.0, 17.0, 23.0, 9.0, 12.0, 8.0, 7.0, 5.0, 9.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.17982804775238037, -0.17431052029132843, -0.1687929928302765, -0.16327545046806335, -0.1577579230070114, -0.15224039554595947, -0.14672285318374634, -0.1412053257226944, -0.13568779826164246, -0.13017027080059052, -0.12465273588895798, -0.11913520097732544, -0.1136176735162735, -0.10810014605522156, -0.10258261114358902, -0.09706507623195648, -0.09154754877090454, -0.0860300213098526, -0.08051248639822006, -0.07499495148658752, -0.06947742402553558, -0.06395989656448364, -0.058442361652851105, -0.052924830466508865, -0.047407299280166626, -0.04188976809382439, -0.03637223690748215, -0.030854705721139908, -0.02533717453479767, -0.01981964334845543, -0.01430211216211319, -0.00878458097577095, -0.003267049789428711, 0.0022504813969135284, 0.007768012583255768, 0.013285543769598007, 0.018803074955940247, 0.024320606142282486, 0.029838137328624725, 0.035355668514966965, 0.040873199701309204, 0.046390730887651443, 0.05190826207399368, 0.05742579326033592, 0.06294332444667816, 0.0684608519077301, 0.07397838681936264, 0.07949592173099518, 0.08501344919204712, 0.09053097665309906, 0.0960485115647316, 0.10156604647636414, 0.10708357393741608, 0.11260110139846802, 0.11811863631010056, 0.1236361712217331, 0.12915369868278503, 0.13467122614383698, 0.14018875360488892, 0.14570629596710205, 0.151223823428154, 0.15674135088920593, 0.16225889325141907, 0.167776420712471, 0.17329394817352295]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0, 5.0, 7.0, 6.0, 4.0, 10.0, 20.0, 20.0, 29.0, 50.0, 73.0, 105.0, 185.0, 293.0, 570.0, 1226.0, 2688.0, 6158.0, 15370.0, 41360.0, 118639.0, 306915.0, 336484.0, 139739.0, 47983.0, 17554.0, 7046.0, 2976.0, 1433.0, 705.0, 340.0, 170.0, 112.0, 95.0, 42.0, 36.0, 28.0, 24.0, 13.0, 15.0, 9.0, 3.0, 4.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08380126953125, -0.08081626892089844, -0.07783126831054688, -0.07484626770019531, -0.07186126708984375, -0.06887626647949219, -0.06589126586914062, -0.06290626525878906, -0.0599212646484375, -0.05693626403808594, -0.053951263427734375, -0.05096626281738281, -0.04798126220703125, -0.04499626159667969, -0.042011260986328125, -0.03902626037597656, -0.036041259765625, -0.03305625915527344, -0.030071258544921875, -0.027086257934570312, -0.02410125732421875, -0.021116256713867188, -0.018131256103515625, -0.015146255493164062, -0.0121612548828125, -0.009176254272460938, -0.006191253662109375, -0.0032062530517578125, -0.00022125244140625, 0.0027637481689453125, 0.005748748779296875, 0.008733749389648438, 0.01171875, 0.014703750610351562, 0.017688751220703125, 0.020673751831054688, 0.02365875244140625, 0.026643753051757812, 0.029628753662109375, 0.03261375427246094, 0.0355987548828125, 0.03858375549316406, 0.041568756103515625, 0.04455375671386719, 0.04753875732421875, 0.05052375793457031, 0.053508758544921875, 0.05649375915527344, 0.059478759765625, 0.06246376037597656, 0.06544876098632812, 0.06843376159667969, 0.07141876220703125, 0.07440376281738281, 0.07738876342773438, 0.08037376403808594, 0.0833587646484375, 0.08634376525878906, 0.08932876586914062, 0.09231376647949219, 0.09529876708984375, 0.09828376770019531, 0.10126876831054688, 0.10425376892089844, 0.10723876953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 4.0, 4.0, 13.0, 10.0, 17.0, 11.0, 24.0, 11.0, 17.0, 35.0, 35.0, 44.0, 44.0, 57.0, 71.0, 65.0, 61.0, 60.0, 56.0, 46.0, 54.0, 34.0, 40.0, 36.0, 30.0, 36.0, 17.0, 14.0, 9.0, 9.0, 9.0, 8.0, 6.0, 7.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036773681640625, -0.03557634353637695, -0.034379005432128906, -0.03318166732788086, -0.03198432922363281, -0.030786991119384766, -0.02958965301513672, -0.028392314910888672, -0.027194976806640625, -0.025997638702392578, -0.02480030059814453, -0.023602962493896484, -0.022405624389648438, -0.02120828628540039, -0.020010948181152344, -0.018813610076904297, -0.01761627197265625, -0.016418933868408203, -0.015221595764160156, -0.01402425765991211, -0.012826919555664062, -0.011629581451416016, -0.010432243347167969, -0.009234905242919922, -0.008037567138671875, -0.006840229034423828, -0.005642890930175781, -0.004445552825927734, -0.0032482147216796875, -0.0020508766174316406, -0.0008535385131835938, 0.0003437995910644531, 0.0015411376953125, 0.002738475799560547, 0.003935813903808594, 0.005133152008056641, 0.0063304901123046875, 0.007527828216552734, 0.008725166320800781, 0.009922504425048828, 0.011119842529296875, 0.012317180633544922, 0.013514518737792969, 0.014711856842041016, 0.015909194946289062, 0.01710653305053711, 0.018303871154785156, 0.019501209259033203, 0.02069854736328125, 0.021895885467529297, 0.023093223571777344, 0.02429056167602539, 0.025487899780273438, 0.026685237884521484, 0.02788257598876953, 0.029079914093017578, 0.030277252197265625, 0.03147459030151367, 0.03267192840576172, 0.033869266510009766, 0.03506660461425781, 0.03626394271850586, 0.037461280822753906, 0.03865861892700195, 0.03985595703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 14.0, 6.0, 10.0, 15.0, 23.0, 33.0, 61.0, 113.0, 170.0, 264.0, 643.0, 1706.0, 5596.0, 19651.0, 73882.0, 277564.0, 442791.0, 166361.0, 42778.0, 11391.0, 3295.0, 1104.0, 446.0, 260.0, 127.0, 73.0, 52.0, 38.0, 34.0, 12.0, 9.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11761474609375, -0.11345767974853516, -0.10930061340332031, -0.10514354705810547, -0.10098648071289062, -0.09682941436767578, -0.09267234802246094, -0.0885152816772461, -0.08435821533203125, -0.0802011489868164, -0.07604408264160156, -0.07188701629638672, -0.06772994995117188, -0.06357288360595703, -0.05941581726074219, -0.055258750915527344, -0.0511016845703125, -0.046944618225097656, -0.04278755187988281, -0.03863048553466797, -0.034473419189453125, -0.03031635284423828, -0.026159286499023438, -0.022002220153808594, -0.01784515380859375, -0.013688087463378906, -0.009531021118164062, -0.005373954772949219, -0.001216888427734375, 0.0029401779174804688, 0.0070972442626953125, 0.011254310607910156, 0.015411376953125, 0.019568443298339844, 0.023725509643554688, 0.02788257598876953, 0.032039642333984375, 0.03619670867919922, 0.04035377502441406, 0.044510841369628906, 0.04866790771484375, 0.052824974060058594, 0.05698204040527344, 0.06113910675048828, 0.06529617309570312, 0.06945323944091797, 0.07361030578613281, 0.07776737213134766, 0.0819244384765625, 0.08608150482177734, 0.09023857116699219, 0.09439563751220703, 0.09855270385742188, 0.10270977020263672, 0.10686683654785156, 0.1110239028930664, 0.11518096923828125, 0.1193380355834961, 0.12349510192871094, 0.12765216827392578, 0.13180923461914062, 0.13596630096435547, 0.1401233673095703, 0.14428043365478516, 0.1484375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 8.0, 10.0, 17.0, 19.0, 26.0, 25.0, 23.0, 33.0, 40.0, 26.0, 29.0, 37.0, 49.0, 46.0, 45.0, 37.0, 49.0, 49.0, 47.0, 49.0, 39.0, 44.0, 35.0, 25.0, 26.0, 31.0, 24.0, 32.0, 11.0, 8.0, 16.0, 8.0, 10.0, 9.0, 3.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.096435546875, -0.09363174438476562, -0.09082794189453125, -0.08802413940429688, -0.0852203369140625, -0.08241653442382812, -0.07961273193359375, -0.07680892944335938, -0.074005126953125, -0.07120132446289062, -0.06839752197265625, -0.06559371948242188, -0.0627899169921875, -0.059986114501953125, -0.05718231201171875, -0.054378509521484375, -0.05157470703125, -0.048770904541015625, -0.04596710205078125, -0.043163299560546875, -0.0403594970703125, -0.037555694580078125, -0.03475189208984375, -0.031948089599609375, -0.029144287109375, -0.026340484619140625, -0.02353668212890625, -0.020732879638671875, -0.0179290771484375, -0.015125274658203125, -0.01232147216796875, -0.009517669677734375, -0.0067138671875, -0.003910064697265625, -0.00110626220703125, 0.001697540283203125, 0.0045013427734375, 0.007305145263671875, 0.01010894775390625, 0.012912750244140625, 0.015716552734375, 0.018520355224609375, 0.02132415771484375, 0.024127960205078125, 0.0269317626953125, 0.029735565185546875, 0.03253936767578125, 0.035343170166015625, 0.03814697265625, 0.040950775146484375, 0.04375457763671875, 0.046558380126953125, 0.0493621826171875, 0.052165985107421875, 0.05496978759765625, 0.057773590087890625, 0.060577392578125, 0.06338119506835938, 0.06618499755859375, 0.06898880004882812, 0.0717926025390625, 0.07459640502929688, 0.07740020751953125, 0.08020401000976562, 0.0830078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 15.0, 19.0, 21.0, 46.0, 52.0, 85.0, 150.0, 321.0, 680.0, 1821.0, 6303.0, 26618.0, 136156.0, 468277.0, 320798.0, 67415.0, 13809.0, 3669.0, 1209.0, 510.0, 263.0, 130.0, 60.0, 49.0, 29.0, 16.0, 12.0, 11.0, 5.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.077392578125, -0.07503223419189453, -0.07267189025878906, -0.0703115463256836, -0.06795120239257812, -0.06559085845947266, -0.06323051452636719, -0.06087017059326172, -0.05850982666015625, -0.05614948272705078, -0.05378913879394531, -0.051428794860839844, -0.049068450927734375, -0.046708106994628906, -0.04434776306152344, -0.04198741912841797, -0.0396270751953125, -0.03726673126220703, -0.03490638732910156, -0.032546043395996094, -0.030185699462890625, -0.027825355529785156, -0.025465011596679688, -0.02310466766357422, -0.02074432373046875, -0.01838397979736328, -0.016023635864257812, -0.013663291931152344, -0.011302947998046875, -0.008942604064941406, -0.0065822601318359375, -0.004221916198730469, -0.001861572265625, 0.0004987716674804688, 0.0028591156005859375, 0.005219459533691406, 0.007579803466796875, 0.009940147399902344, 0.012300491333007812, 0.014660835266113281, 0.01702117919921875, 0.01938152313232422, 0.021741867065429688, 0.024102210998535156, 0.026462554931640625, 0.028822898864746094, 0.031183242797851562, 0.03354358673095703, 0.0359039306640625, 0.03826427459716797, 0.04062461853027344, 0.042984962463378906, 0.045345306396484375, 0.047705650329589844, 0.05006599426269531, 0.05242633819580078, 0.05478668212890625, 0.05714702606201172, 0.05950736999511719, 0.061867713928222656, 0.06422805786132812, 0.0665884017944336, 0.06894874572753906, 0.07130908966064453, 0.07366943359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 3.0, 7.0, 7.0, 9.0, 12.0, 10.0, 12.0, 7.0, 18.0, 15.0, 21.0, 17.0, 24.0, 28.0, 30.0, 45.0, 48.0, 56.0, 65.0, 73.0, 66.0, 69.0, 60.0, 43.0, 42.0, 25.0, 19.0, 31.0, 24.0, 13.0, 16.0, 8.0, 11.0, 14.0, 7.0, 2.0, 11.0, 13.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9490718841552734e-05, -1.8914230167865753e-05, -1.8337741494178772e-05, -1.776125282049179e-05, -1.718476414680481e-05, -1.660827547311783e-05, -1.6031786799430847e-05, -1.5455298125743866e-05, -1.4878809452056885e-05, -1.4302320778369904e-05, -1.3725832104682922e-05, -1.3149343430995941e-05, -1.257285475730896e-05, -1.1996366083621979e-05, -1.1419877409934998e-05, -1.0843388736248016e-05, -1.0266900062561035e-05, -9.690411388874054e-06, -9.113922715187073e-06, -8.537434041500092e-06, -7.96094536781311e-06, -7.384456694126129e-06, -6.807968020439148e-06, -6.231479346752167e-06, -5.6549906730651855e-06, -5.078501999378204e-06, -4.502013325691223e-06, -3.925524652004242e-06, -3.3490359783172607e-06, -2.7725473046302795e-06, -2.1960586309432983e-06, -1.6195699572563171e-06, -1.043081283569336e-06, -4.6659260988235474e-07, 1.0989606380462646e-07, 6.863847374916077e-07, 1.2628734111785889e-06, 1.83936208486557e-06, 2.4158507585525513e-06, 2.9923394322395325e-06, 3.5688281059265137e-06, 4.145316779613495e-06, 4.721805453300476e-06, 5.298294126987457e-06, 5.8747828006744385e-06, 6.45127147436142e-06, 7.027760148048401e-06, 7.604248821735382e-06, 8.180737495422363e-06, 8.757226169109344e-06, 9.333714842796326e-06, 9.910203516483307e-06, 1.0486692190170288e-05, 1.106318086385727e-05, 1.163966953754425e-05, 1.2216158211231232e-05, 1.2792646884918213e-05, 1.3369135558605194e-05, 1.3945624232292175e-05, 1.4522112905979156e-05, 1.5098601579666138e-05, 1.567509025335312e-05, 1.62515789270401e-05, 1.682806760072708e-05, 1.7404556274414062e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 2.0, 3.0, 8.0, 17.0, 11.0, 15.0, 28.0, 44.0, 49.0, 70.0, 132.0, 215.0, 380.0, 753.0, 1626.0, 3938.0, 9887.0, 28053.0, 86919.0, 229679.0, 343255.0, 219690.0, 81205.0, 26329.0, 9255.0, 3709.0, 1572.0, 717.0, 382.0, 212.0, 141.0, 76.0, 45.0, 43.0, 30.0, 13.0, 11.0, 8.0, 11.0, 2.0, 2.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.037506103515625, -0.03623342514038086, -0.03496074676513672, -0.03368806838989258, -0.03241539001464844, -0.031142711639404297, -0.029870033264160156, -0.028597354888916016, -0.027324676513671875, -0.026051998138427734, -0.024779319763183594, -0.023506641387939453, -0.022233963012695312, -0.020961284637451172, -0.01968860626220703, -0.01841592788696289, -0.01714324951171875, -0.01587057113647461, -0.014597892761230469, -0.013325214385986328, -0.012052536010742188, -0.010779857635498047, -0.009507179260253906, -0.008234500885009766, -0.006961822509765625, -0.005689144134521484, -0.004416465759277344, -0.003143787384033203, -0.0018711090087890625, -0.0005984306335449219, 0.0006742477416992188, 0.0019469261169433594, 0.0032196044921875, 0.004492282867431641, 0.005764961242675781, 0.007037639617919922, 0.008310317993164062, 0.009582996368408203, 0.010855674743652344, 0.012128353118896484, 0.013401031494140625, 0.014673709869384766, 0.015946388244628906, 0.017219066619873047, 0.018491744995117188, 0.019764423370361328, 0.02103710174560547, 0.02230978012084961, 0.02358245849609375, 0.02485513687133789, 0.02612781524658203, 0.027400493621826172, 0.028673171997070312, 0.029945850372314453, 0.031218528747558594, 0.032491207122802734, 0.033763885498046875, 0.035036563873291016, 0.036309242248535156, 0.0375819206237793, 0.03885459899902344, 0.04012727737426758, 0.04139995574951172, 0.04267263412475586, 0.0439453125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 10.0, 6.0, 15.0, 15.0, 21.0, 25.0, 25.0, 37.0, 26.0, 46.0, 43.0, 48.0, 73.0, 62.0, 52.0, 62.0, 55.0, 62.0, 49.0, 37.0, 40.0, 39.0, 26.0, 23.0, 18.0, 14.0, 16.0, 11.0, 13.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0313720703125, -0.03046560287475586, -0.02955913543701172, -0.028652667999267578, -0.027746200561523438, -0.026839733123779297, -0.025933265686035156, -0.025026798248291016, -0.024120330810546875, -0.023213863372802734, -0.022307395935058594, -0.021400928497314453, -0.020494461059570312, -0.019587993621826172, -0.01868152618408203, -0.01777505874633789, -0.01686859130859375, -0.01596212387084961, -0.015055656433105469, -0.014149188995361328, -0.013242721557617188, -0.012336254119873047, -0.011429786682128906, -0.010523319244384766, -0.009616851806640625, -0.008710384368896484, -0.007803916931152344, -0.006897449493408203, -0.0059909820556640625, -0.005084514617919922, -0.004178047180175781, -0.0032715797424316406, -0.0023651123046875, -0.0014586448669433594, -0.0005521774291992188, 0.0003542900085449219, 0.0012607574462890625, 0.002167224884033203, 0.0030736923217773438, 0.003980159759521484, 0.004886627197265625, 0.005793094635009766, 0.006699562072753906, 0.007606029510498047, 0.008512496948242188, 0.009418964385986328, 0.010325431823730469, 0.01123189926147461, 0.01213836669921875, 0.01304483413696289, 0.013951301574707031, 0.014857769012451172, 0.015764236450195312, 0.016670703887939453, 0.017577171325683594, 0.018483638763427734, 0.019390106201171875, 0.020296573638916016, 0.021203041076660156, 0.022109508514404297, 0.023015975952148438, 0.023922443389892578, 0.02482891082763672, 0.02573537826538086, 0.026641845703125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 12.0, 44.0, 109.0, 243.0, 294.0, 188.0, 77.0, 28.0, 9.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7279870510101318, -0.7022101879119873, -0.6764333844184875, -0.650656521320343, -0.6248797178268433, -0.5991028547286987, -0.5733259916305542, -0.5475491881370544, -0.5217723250389099, -0.49599549174308777, -0.4702186584472656, -0.4444417953491211, -0.41866496205329895, -0.3928881287574768, -0.36711129546165466, -0.3413344621658325, -0.3155576288700104, -0.28978079557418823, -0.2640039622783661, -0.23822711408138275, -0.21245026588439941, -0.18667343258857727, -0.16089659929275513, -0.1351197510957718, -0.10934291779994965, -0.0835660770535469, -0.057789240032434464, -0.03201240301132202, -0.006235562264919281, 0.01954127848148346, 0.0453181117773056, 0.07109495997428894, 0.09687179327011108, 0.12264863401651382, 0.14842547476291656, 0.1742023080587387, 0.19997915625572205, 0.2257559895515442, 0.25153282284736633, 0.2773096561431885, 0.303086519241333, 0.32886335253715515, 0.3546401858329773, 0.3804170489311218, 0.40619388222694397, 0.4319707155227661, 0.45774754881858826, 0.4835243821144104, 0.5093011856079102, 0.5350780487060547, 0.5608548521995544, 0.586631715297699, 0.6124085187911987, 0.6381853818893433, 0.6639622449874878, 0.6897390484809875, 0.7155159115791321, 0.7412927746772766, 0.7670695781707764, 0.7928464412689209, 0.8186232447624207, 0.8444001078605652, 0.8701769113540649, 0.8959537744522095, 0.921730637550354]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 8.0, 4.0, 9.0, 9.0, 11.0, 15.0, 23.0, 29.0, 28.0, 33.0, 29.0, 35.0, 33.0, 48.0, 59.0, 45.0, 53.0, 49.0, 59.0, 46.0, 57.0, 35.0, 38.0, 38.0, 29.0, 31.0, 26.0, 20.0, 23.0, 19.0, 13.0, 9.0, 8.0, 9.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30393558740615845, -0.29411283135414124, -0.2842901051044464, -0.2744673490524292, -0.2646446228027344, -0.25482186675071716, -0.24499912559986115, -0.23517638444900513, -0.2253536432981491, -0.2155309021472931, -0.20570816099643707, -0.19588541984558105, -0.18606266379356384, -0.17623993754386902, -0.1664171814918518, -0.1565944403409958, -0.14677169919013977, -0.13694895803928375, -0.12712621688842773, -0.11730346828699112, -0.1074807271361351, -0.09765798598527908, -0.08783523738384247, -0.07801249623298645, -0.06818975508213043, -0.058367013931274414, -0.0485442690551281, -0.03872152417898178, -0.028898783028125763, -0.019076041877269745, -0.009253297001123428, 0.0005694478750228882, 0.010392189025878906, 0.020214932039380074, 0.03003767505288124, 0.03986041992902756, 0.049683161079883575, 0.059505902230739594, 0.06932865083217621, 0.07915139198303223, 0.08897413313388824, 0.09879687428474426, 0.10861961543560028, 0.1184423640370369, 0.1282651126384735, 0.13808783888816833, 0.14791059494018555, 0.15773333609104156, 0.16755607724189758, 0.1773788183927536, 0.18720155954360962, 0.19702430069446564, 0.20684704184532166, 0.21666979789733887, 0.22649253904819489, 0.2363152801990509, 0.24613802134990692, 0.25596076250076294, 0.26578351855278015, 0.275606244802475, 0.2854290008544922, 0.295251727104187, 0.3050744831562042, 0.31489723920822144, 0.32471996545791626]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 13.0, 8.0, 12.0, 19.0, 27.0, 41.0, 67.0, 64.0, 112.0, 128.0, 215.0, 411.0, 965.0, 4298.0, 51935.0, 2574796.0, 1525839.0, 30615.0, 3066.0, 707.0, 316.0, 199.0, 113.0, 89.0, 69.0, 59.0, 36.0, 19.0, 15.0, 10.0, 7.0, 5.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10498046875, -0.101348876953125, -0.09771728515625, -0.094085693359375, -0.0904541015625, -0.086822509765625, -0.08319091796875, -0.079559326171875, -0.075927734375, -0.072296142578125, -0.06866455078125, -0.065032958984375, -0.0614013671875, -0.057769775390625, -0.05413818359375, -0.050506591796875, -0.046875, -0.043243408203125, -0.03961181640625, -0.035980224609375, -0.0323486328125, -0.028717041015625, -0.02508544921875, -0.021453857421875, -0.017822265625, -0.014190673828125, -0.01055908203125, -0.006927490234375, -0.0032958984375, 0.000335693359375, 0.00396728515625, 0.007598876953125, 0.01123046875, 0.014862060546875, 0.01849365234375, 0.022125244140625, 0.0257568359375, 0.029388427734375, 0.03302001953125, 0.036651611328125, 0.040283203125, 0.043914794921875, 0.04754638671875, 0.051177978515625, 0.0548095703125, 0.058441162109375, 0.06207275390625, 0.065704345703125, 0.0693359375, 0.072967529296875, 0.07659912109375, 0.080230712890625, 0.0838623046875, 0.087493896484375, 0.09112548828125, 0.094757080078125, 0.098388671875, 0.102020263671875, 0.10565185546875, 0.109283447265625, 0.1129150390625, 0.116546630859375, 0.12017822265625, 0.123809814453125, 0.12744140625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 8.0, 11.0, 10.0, 14.0, 17.0, 31.0, 21.0, 23.0, 39.0, 44.0, 61.0, 57.0, 60.0, 57.0, 68.0, 61.0, 72.0, 44.0, 45.0, 43.0, 35.0, 24.0, 38.0, 33.0, 21.0, 16.0, 12.0, 7.0, 12.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0423583984375, -0.04105567932128906, -0.039752960205078125, -0.03845024108886719, -0.03714752197265625, -0.03584480285644531, -0.034542083740234375, -0.03323936462402344, -0.0319366455078125, -0.030633926391601562, -0.029331207275390625, -0.028028488159179688, -0.02672576904296875, -0.025423049926757812, -0.024120330810546875, -0.022817611694335938, -0.021514892578125, -0.020212173461914062, -0.018909454345703125, -0.017606735229492188, -0.01630401611328125, -0.015001296997070312, -0.013698577880859375, -0.012395858764648438, -0.0110931396484375, -0.009790420532226562, -0.008487701416015625, -0.0071849822998046875, -0.00588226318359375, -0.0045795440673828125, -0.003276824951171875, -0.0019741058349609375, -0.00067138671875, 0.0006313323974609375, 0.001934051513671875, 0.0032367706298828125, 0.00453948974609375, 0.0058422088623046875, 0.007144927978515625, 0.008447647094726562, 0.0097503662109375, 0.011053085327148438, 0.012355804443359375, 0.013658523559570312, 0.01496124267578125, 0.016263961791992188, 0.017566680908203125, 0.018869400024414062, 0.020172119140625, 0.021474838256835938, 0.022777557373046875, 0.024080276489257812, 0.02538299560546875, 0.026685714721679688, 0.027988433837890625, 0.029291152954101562, 0.0305938720703125, 0.03189659118652344, 0.033199310302734375, 0.03450202941894531, 0.03580474853515625, 0.03710746765136719, 0.038410186767578125, 0.03971290588378906, 0.041015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 9.0, 12.0, 22.0, 37.0, 42.0, 65.0, 104.0, 155.0, 301.0, 664.0, 2203.0, 12934.0, 171943.0, 2570892.0, 1355762.0, 69728.0, 6822.0, 1381.0, 505.0, 286.0, 150.0, 117.0, 48.0, 27.0, 22.0, 14.0, 13.0, 5.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1270751953125, -0.1237173080444336, -0.12035942077636719, -0.11700153350830078, -0.11364364624023438, -0.11028575897216797, -0.10692787170410156, -0.10356998443603516, -0.10021209716796875, -0.09685420989990234, -0.09349632263183594, -0.09013843536376953, -0.08678054809570312, -0.08342266082763672, -0.08006477355957031, -0.0767068862915039, -0.0733489990234375, -0.0699911117553711, -0.06663322448730469, -0.06327533721923828, -0.059917449951171875, -0.05655956268310547, -0.05320167541503906, -0.049843788146972656, -0.04648590087890625, -0.043128013610839844, -0.03977012634277344, -0.03641223907470703, -0.033054351806640625, -0.02969646453857422, -0.026338577270507812, -0.022980690002441406, -0.019622802734375, -0.016264915466308594, -0.012907028198242188, -0.009549140930175781, -0.006191253662109375, -0.0028333663940429688, 0.0005245208740234375, 0.0038824081420898438, 0.00724029541015625, 0.010598182678222656, 0.013956069946289062, 0.01731395721435547, 0.020671844482421875, 0.02402973175048828, 0.027387619018554688, 0.030745506286621094, 0.0341033935546875, 0.037461280822753906, 0.04081916809082031, 0.04417705535888672, 0.047534942626953125, 0.05089282989501953, 0.05425071716308594, 0.057608604431152344, 0.06096649169921875, 0.06432437896728516, 0.06768226623535156, 0.07104015350341797, 0.07439804077148438, 0.07775592803955078, 0.08111381530761719, 0.0844717025756836, 0.08782958984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 5.0, 7.0, 8.0, 18.0, 12.0, 36.0, 26.0, 54.0, 61.0, 91.0, 144.0, 149.0, 195.0, 247.0, 301.0, 325.0, 338.0, 354.0, 350.0, 293.0, 271.0, 186.0, 162.0, 110.0, 80.0, 59.0, 55.0, 41.0, 26.0, 22.0, 16.0, 10.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.036149024963378906, -0.03470039367675781, -0.03325176239013672, -0.031803131103515625, -0.03035449981689453, -0.028905868530273438, -0.027457237243652344, -0.02600860595703125, -0.024559974670410156, -0.023111343383789062, -0.02166271209716797, -0.020214080810546875, -0.01876544952392578, -0.017316818237304688, -0.015868186950683594, -0.0144195556640625, -0.012970924377441406, -0.011522293090820312, -0.010073661804199219, -0.008625030517578125, -0.007176399230957031, -0.0057277679443359375, -0.004279136657714844, -0.00283050537109375, -0.0013818740844726562, 6.67572021484375e-05, 0.0015153884887695312, 0.002964019775390625, 0.004412651062011719, 0.0058612823486328125, 0.007309913635253906, 0.008758544921875, 0.010207176208496094, 0.011655807495117188, 0.013104438781738281, 0.014553070068359375, 0.01600170135498047, 0.017450332641601562, 0.018898963928222656, 0.02034759521484375, 0.021796226501464844, 0.023244857788085938, 0.02469348907470703, 0.026142120361328125, 0.02759075164794922, 0.029039382934570312, 0.030488014221191406, 0.0319366455078125, 0.033385276794433594, 0.03483390808105469, 0.03628253936767578, 0.037731170654296875, 0.03917980194091797, 0.04062843322753906, 0.042077064514160156, 0.04352569580078125, 0.044974327087402344, 0.04642295837402344, 0.04787158966064453, 0.049320220947265625, 0.05076885223388672, 0.05221748352050781, 0.053666114807128906, 0.05511474609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 13.0, 37.0, 111.0, 224.0, 279.0, 185.0, 105.0, 35.0, 12.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5911338925361633, -0.5739768147468567, -0.5568197965621948, -0.5396627187728882, -0.5225057005882263, -0.5053486227989197, -0.4881915748119354, -0.47103452682495117, -0.4538774788379669, -0.43672043085098267, -0.4195633828639984, -0.40240633487701416, -0.3852492570877075, -0.36809223890304565, -0.350935161113739, -0.33377811312675476, -0.3166210651397705, -0.29946401715278625, -0.282306969165802, -0.26514992117881775, -0.2479928582906723, -0.23083581030368805, -0.2136787474155426, -0.19652169942855835, -0.1793646514415741, -0.16220760345458984, -0.1450505554676056, -0.12789349257946014, -0.11073644459247589, -0.09357939660549164, -0.07642234116792679, -0.05926528573036194, -0.042108237743377686, -0.024951186031103134, -0.007794134318828583, 0.009362917393445969, 0.02651996910572052, 0.04367701709270477, 0.06083407253026962, 0.07799112796783447, 0.09514817595481873, 0.11230522394180298, 0.12946227192878723, 0.14661933481693268, 0.16377638280391693, 0.18093343079090118, 0.19809049367904663, 0.21524754166603088, 0.23240458965301514, 0.2495616376399994, 0.26671868562698364, 0.2838757336139679, 0.30103278160095215, 0.3181898593902588, 0.33534690737724304, 0.3525039553642273, 0.36966100335121155, 0.3868180513381958, 0.40397509932518005, 0.4211321473121643, 0.43828922510147095, 0.4554462432861328, 0.47260332107543945, 0.4897603690624237, 0.506917417049408]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 5.0, 4.0, 8.0, 7.0, 11.0, 11.0, 18.0, 24.0, 20.0, 25.0, 26.0, 28.0, 28.0, 33.0, 36.0, 41.0, 44.0, 55.0, 50.0, 47.0, 49.0, 44.0, 53.0, 39.0, 31.0, 49.0, 32.0, 30.0, 18.0, 27.0, 28.0, 16.0, 18.0, 8.0, 11.0, 14.0, 8.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.180620014667511, -0.17485976219177246, -0.16909950971603394, -0.1633392572402954, -0.15757900476455688, -0.15181876718997955, -0.14605851471424103, -0.1402982622385025, -0.13453800976276398, -0.12877775728702545, -0.12301750481128693, -0.117257259786129, -0.11149700731039047, -0.10573675483465195, -0.09997650980949402, -0.0942162573337555, -0.08845600485801697, -0.08269575238227844, -0.07693549990653992, -0.07117525488138199, -0.06541500240564346, -0.05965474992990494, -0.05389450117945671, -0.048134252429008484, -0.04237399995326996, -0.03661374747753143, -0.030853498727083206, -0.02509324811398983, -0.019332997500896454, -0.013572746887803078, -0.0078124962747097015, -0.0020522475242614746, 0.0037080049514770508, 0.009468255564570427, 0.015228506177663803, 0.02098875679075718, 0.026749007403850555, 0.03250925987958908, 0.03826950863003731, 0.044029757380485535, 0.04979000985622406, 0.055550262331962585, 0.06131051108241081, 0.06707075983285904, 0.07283101230859756, 0.07859126478433609, 0.08435150980949402, 0.09011176228523254, 0.09587201476097107, 0.1016322672367096, 0.10739251971244812, 0.11315276473760605, 0.11891301721334457, 0.1246732696890831, 0.13043351471424103, 0.13619376718997955, 0.14195401966571808, 0.1477142721414566, 0.15347452461719513, 0.15923477709293365, 0.164995014667511, 0.1707552671432495, 0.17651551961898804, 0.18227577209472656, 0.1880360245704651]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 14.0, 15.0, 21.0, 29.0, 43.0, 53.0, 96.0, 171.0, 309.0, 595.0, 1316.0, 2913.0, 6647.0, 15957.0, 42577.0, 136695.0, 379477.0, 309513.0, 97661.0, 31962.0, 12537.0, 5425.0, 2320.0, 995.0, 510.0, 277.0, 153.0, 91.0, 52.0, 28.0, 28.0, 22.0, 10.0, 9.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0985107421875, -0.09521198272705078, -0.09191322326660156, -0.08861446380615234, -0.08531570434570312, -0.0820169448852539, -0.07871818542480469, -0.07541942596435547, -0.07212066650390625, -0.06882190704345703, -0.06552314758300781, -0.062224388122558594, -0.058925628662109375, -0.055626869201660156, -0.05232810974121094, -0.04902935028076172, -0.0457305908203125, -0.04243183135986328, -0.03913307189941406, -0.035834312438964844, -0.032535552978515625, -0.029236793518066406, -0.025938034057617188, -0.02263927459716797, -0.01934051513671875, -0.01604175567626953, -0.012742996215820312, -0.009444236755371094, -0.006145477294921875, -0.0028467178344726562, 0.0004520416259765625, 0.0037508010864257812, 0.007049560546875, 0.010348320007324219, 0.013647079467773438, 0.016945838928222656, 0.020244598388671875, 0.023543357849121094, 0.026842117309570312, 0.03014087677001953, 0.03343963623046875, 0.03673839569091797, 0.04003715515136719, 0.043335914611816406, 0.046634674072265625, 0.049933433532714844, 0.05323219299316406, 0.05653095245361328, 0.0598297119140625, 0.06312847137451172, 0.06642723083496094, 0.06972599029541016, 0.07302474975585938, 0.0763235092163086, 0.07962226867675781, 0.08292102813720703, 0.08621978759765625, 0.08951854705810547, 0.09281730651855469, 0.0961160659790039, 0.09941482543945312, 0.10271358489990234, 0.10601234436035156, 0.10931110382080078, 0.11260986328125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 7.0, 12.0, 13.0, 31.0, 31.0, 21.0, 39.0, 44.0, 59.0, 71.0, 76.0, 69.0, 82.0, 85.0, 59.0, 43.0, 52.0, 45.0, 37.0, 30.0, 29.0, 18.0, 20.0, 8.0, 5.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04791259765625, -0.04642343521118164, -0.04493427276611328, -0.04344511032104492, -0.04195594787597656, -0.0404667854309082, -0.038977622985839844, -0.037488460540771484, -0.035999298095703125, -0.034510135650634766, -0.033020973205566406, -0.03153181076049805, -0.030042648315429688, -0.028553485870361328, -0.02706432342529297, -0.02557516098022461, -0.02408599853515625, -0.02259683609008789, -0.02110767364501953, -0.019618511199951172, -0.018129348754882812, -0.016640186309814453, -0.015151023864746094, -0.013661861419677734, -0.012172698974609375, -0.010683536529541016, -0.009194374084472656, -0.007705211639404297, -0.0062160491943359375, -0.004726886749267578, -0.0032377243041992188, -0.0017485618591308594, -0.0002593994140625, 0.0012297630310058594, 0.0027189254760742188, 0.004208087921142578, 0.0056972503662109375, 0.007186412811279297, 0.008675575256347656, 0.010164737701416016, 0.011653900146484375, 0.013143062591552734, 0.014632225036621094, 0.016121387481689453, 0.017610549926757812, 0.019099712371826172, 0.02058887481689453, 0.02207803726196289, 0.02356719970703125, 0.02505636215209961, 0.02654552459716797, 0.028034687042236328, 0.029523849487304688, 0.031013011932373047, 0.032502174377441406, 0.033991336822509766, 0.035480499267578125, 0.036969661712646484, 0.038458824157714844, 0.0399479866027832, 0.04143714904785156, 0.04292631149291992, 0.04441547393798828, 0.04590463638305664, 0.047393798828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 10.0, 5.0, 7.0, 15.0, 14.0, 18.0, 25.0, 40.0, 50.0, 64.0, 104.0, 131.0, 158.0, 240.0, 480.0, 891.0, 1811.0, 4066.0, 10197.0, 26194.0, 69384.0, 177505.0, 323421.0, 254750.0, 109509.0, 41692.0, 15890.0, 6309.0, 2608.0, 1214.0, 608.0, 337.0, 233.0, 157.0, 119.0, 86.0, 56.0, 35.0, 26.0, 26.0, 14.0, 12.0, 14.0, 9.0, 11.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0894775390625, -0.08690166473388672, -0.08432579040527344, -0.08174991607666016, -0.07917404174804688, -0.0765981674194336, -0.07402229309082031, -0.07144641876220703, -0.06887054443359375, -0.06629467010498047, -0.06371879577636719, -0.061142921447753906, -0.058567047119140625, -0.055991172790527344, -0.05341529846191406, -0.05083942413330078, -0.0482635498046875, -0.04568767547607422, -0.04311180114746094, -0.040535926818847656, -0.037960052490234375, -0.035384178161621094, -0.03280830383300781, -0.03023242950439453, -0.02765655517578125, -0.02508068084716797, -0.022504806518554688, -0.019928932189941406, -0.017353057861328125, -0.014777183532714844, -0.012201309204101562, -0.009625434875488281, -0.007049560546875, -0.004473686218261719, -0.0018978118896484375, 0.0006780624389648438, 0.003253936767578125, 0.005829811096191406, 0.008405685424804688, 0.010981559753417969, 0.01355743408203125, 0.01613330841064453, 0.018709182739257812, 0.021285057067871094, 0.023860931396484375, 0.026436805725097656, 0.029012680053710938, 0.03158855438232422, 0.0341644287109375, 0.03674030303955078, 0.03931617736816406, 0.041892051696777344, 0.044467926025390625, 0.047043800354003906, 0.04961967468261719, 0.05219554901123047, 0.05477142333984375, 0.05734729766845703, 0.05992317199707031, 0.062499046325683594, 0.06507492065429688, 0.06765079498291016, 0.07022666931152344, 0.07280254364013672, 0.07537841796875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 11.0, 10.0, 15.0, 10.0, 16.0, 18.0, 21.0, 28.0, 35.0, 27.0, 47.0, 31.0, 41.0, 35.0, 42.0, 41.0, 42.0, 50.0, 48.0, 38.0, 43.0, 43.0, 39.0, 31.0, 24.0, 28.0, 24.0, 30.0, 29.0, 16.0, 16.0, 8.0, 11.0, 9.0, 6.0, 5.0, 3.0, 7.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0743408203125, -0.07181644439697266, -0.06929206848144531, -0.06676769256591797, -0.06424331665039062, -0.06171894073486328, -0.05919456481933594, -0.056670188903808594, -0.05414581298828125, -0.051621437072753906, -0.04909706115722656, -0.04657268524169922, -0.044048309326171875, -0.04152393341064453, -0.03899955749511719, -0.036475181579589844, -0.0339508056640625, -0.031426429748535156, -0.028902053833007812, -0.02637767791748047, -0.023853302001953125, -0.02132892608642578, -0.018804550170898438, -0.016280174255371094, -0.01375579833984375, -0.011231422424316406, -0.008707046508789062, -0.006182670593261719, -0.003658294677734375, -0.0011339187622070312, 0.0013904571533203125, 0.003914833068847656, 0.006439208984375, 0.008963584899902344, 0.011487960815429688, 0.014012336730957031, 0.016536712646484375, 0.01906108856201172, 0.021585464477539062, 0.024109840393066406, 0.02663421630859375, 0.029158592224121094, 0.03168296813964844, 0.03420734405517578, 0.036731719970703125, 0.03925609588623047, 0.04178047180175781, 0.044304847717285156, 0.0468292236328125, 0.049353599548339844, 0.05187797546386719, 0.05440235137939453, 0.056926727294921875, 0.05945110321044922, 0.06197547912597656, 0.0644998550415039, 0.06702423095703125, 0.0695486068725586, 0.07207298278808594, 0.07459735870361328, 0.07712173461914062, 0.07964611053466797, 0.08217048645019531, 0.08469486236572266, 0.08721923828125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 9.0, 10.0, 10.0, 13.0, 22.0, 37.0, 53.0, 81.0, 118.0, 195.0, 282.0, 466.0, 859.0, 1329.0, 2158.0, 3531.0, 5902.0, 10179.0, 17289.0, 31390.0, 59094.0, 109642.0, 178666.0, 216322.0, 174659.0, 106569.0, 57045.0, 30835.0, 17144.0, 9747.0, 5808.0, 3502.0, 2099.0, 1314.0, 766.0, 502.0, 318.0, 208.0, 126.0, 83.0, 60.0, 44.0, 27.0, 12.0, 10.0, 13.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0218353271484375, -0.021162986755371094, -0.020490646362304688, -0.01981830596923828, -0.019145965576171875, -0.01847362518310547, -0.017801284790039062, -0.017128944396972656, -0.01645660400390625, -0.015784263610839844, -0.015111923217773438, -0.014439582824707031, -0.013767242431640625, -0.013094902038574219, -0.012422561645507812, -0.011750221252441406, -0.011077880859375, -0.010405540466308594, -0.009733200073242188, -0.009060859680175781, -0.008388519287109375, -0.007716178894042969, -0.0070438385009765625, -0.006371498107910156, -0.00569915771484375, -0.005026817321777344, -0.0043544769287109375, -0.0036821365356445312, -0.003009796142578125, -0.0023374557495117188, -0.0016651153564453125, -0.0009927749633789062, -0.0003204345703125, 0.00035190582275390625, 0.0010242462158203125, 0.0016965866088867188, 0.002368927001953125, 0.0030412673950195312, 0.0037136077880859375, 0.004385948181152344, 0.00505828857421875, 0.005730628967285156, 0.0064029693603515625, 0.007075309753417969, 0.007747650146484375, 0.008419990539550781, 0.009092330932617188, 0.009764671325683594, 0.01043701171875, 0.011109352111816406, 0.011781692504882812, 0.012454032897949219, 0.013126373291015625, 0.013798713684082031, 0.014471054077148438, 0.015143394470214844, 0.01581573486328125, 0.016488075256347656, 0.017160415649414062, 0.01783275604248047, 0.018505096435546875, 0.01917743682861328, 0.019849777221679688, 0.020522117614746094, 0.0211944580078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 7.0, 5.0, 12.0, 22.0, 17.0, 9.0, 16.0, 22.0, 24.0, 35.0, 28.0, 35.0, 53.0, 58.0, 57.0, 54.0, 47.0, 69.0, 55.0, 47.0, 58.0, 35.0, 37.0, 34.0, 24.0, 26.0, 18.0, 17.0, 19.0, 7.0, 12.0, 7.0, 10.0, 5.0, 7.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1861324310302734e-05, -1.1422671377658844e-05, -1.0984018445014954e-05, -1.0545365512371063e-05, -1.0106712579727173e-05, -9.668059647083282e-06, -9.229406714439392e-06, -8.790753781795502e-06, -8.352100849151611e-06, -7.913447916507721e-06, -7.4747949838638306e-06, -7.03614205121994e-06, -6.59748911857605e-06, -6.1588361859321594e-06, -5.720183253288269e-06, -5.281530320644379e-06, -4.842877388000488e-06, -4.404224455356598e-06, -3.9655715227127075e-06, -3.526918590068817e-06, -3.0882656574249268e-06, -2.6496127247810364e-06, -2.210959792137146e-06, -1.7723068594932556e-06, -1.3336539268493652e-06, -8.950009942054749e-07, -4.5634806156158447e-07, -1.7695128917694092e-08, 4.209578037261963e-07, 8.596107363700867e-07, 1.298263669013977e-06, 1.7369166016578674e-06, 2.175569534301758e-06, 2.614222466945648e-06, 3.0528753995895386e-06, 3.491528332233429e-06, 3.930181264877319e-06, 4.36883419752121e-06, 4.8074871301651e-06, 5.2461400628089905e-06, 5.684792995452881e-06, 6.123445928096771e-06, 6.562098860740662e-06, 7.000751793384552e-06, 7.439404726028442e-06, 7.878057658672333e-06, 8.316710591316223e-06, 8.755363523960114e-06, 9.194016456604004e-06, 9.632669389247894e-06, 1.0071322321891785e-05, 1.0509975254535675e-05, 1.0948628187179565e-05, 1.1387281119823456e-05, 1.1825934052467346e-05, 1.2264586985111237e-05, 1.2703239917755127e-05, 1.3141892850399017e-05, 1.3580545783042908e-05, 1.4019198715686798e-05, 1.4457851648330688e-05, 1.4896504580974579e-05, 1.533515751361847e-05, 1.577381044626236e-05, 1.621246337890625e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 13.0, 10.0, 15.0, 21.0, 26.0, 48.0, 52.0, 66.0, 111.0, 188.0, 251.0, 428.0, 703.0, 1211.0, 2015.0, 3760.0, 7063.0, 13620.0, 28705.0, 68020.0, 155851.0, 264503.0, 251840.0, 138730.0, 59052.0, 25629.0, 12304.0, 6199.0, 3341.0, 1863.0, 1120.0, 634.0, 370.0, 235.0, 147.0, 110.0, 73.0, 54.0, 40.0, 31.0, 25.0, 23.0, 12.0, 10.0, 7.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0253753662109375, -0.024554729461669922, -0.023734092712402344, -0.022913455963134766, -0.022092819213867188, -0.02127218246459961, -0.02045154571533203, -0.019630908966064453, -0.018810272216796875, -0.017989635467529297, -0.01716899871826172, -0.01634836196899414, -0.015527725219726562, -0.014707088470458984, -0.013886451721191406, -0.013065814971923828, -0.01224517822265625, -0.011424541473388672, -0.010603904724121094, -0.009783267974853516, -0.008962631225585938, -0.00814199447631836, -0.007321357727050781, -0.006500720977783203, -0.005680084228515625, -0.004859447479248047, -0.004038810729980469, -0.0032181739807128906, -0.0023975372314453125, -0.0015769004821777344, -0.0007562637329101562, 6.437301635742188e-05, 0.000885009765625, 0.0017056465148925781, 0.0025262832641601562, 0.0033469200134277344, 0.0041675567626953125, 0.004988193511962891, 0.005808830261230469, 0.006629467010498047, 0.007450103759765625, 0.008270740509033203, 0.009091377258300781, 0.00991201400756836, 0.010732650756835938, 0.011553287506103516, 0.012373924255371094, 0.013194561004638672, 0.01401519775390625, 0.014835834503173828, 0.015656471252441406, 0.016477108001708984, 0.017297744750976562, 0.01811838150024414, 0.01893901824951172, 0.019759654998779297, 0.020580291748046875, 0.021400928497314453, 0.02222156524658203, 0.02304220199584961, 0.023862838745117188, 0.024683475494384766, 0.025504112243652344, 0.026324748992919922, 0.0271453857421875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 5.0, 5.0, 10.0, 7.0, 12.0, 11.0, 18.0, 20.0, 23.0, 26.0, 32.0, 38.0, 47.0, 62.0, 51.0, 54.0, 57.0, 53.0, 42.0, 60.0, 59.0, 46.0, 46.0, 47.0, 32.0, 26.0, 21.0, 14.0, 10.0, 11.0, 10.0, 15.0, 3.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0229339599609375, -0.022223472595214844, -0.021512985229492188, -0.02080249786376953, -0.020092010498046875, -0.01938152313232422, -0.018671035766601562, -0.017960548400878906, -0.01725006103515625, -0.016539573669433594, -0.015829086303710938, -0.015118598937988281, -0.014408111572265625, -0.013697624206542969, -0.012987136840820312, -0.012276649475097656, -0.011566162109375, -0.010855674743652344, -0.010145187377929688, -0.009434700012207031, -0.008724212646484375, -0.008013725280761719, -0.0073032379150390625, -0.006592750549316406, -0.00588226318359375, -0.005171775817871094, -0.0044612884521484375, -0.0037508010864257812, -0.003040313720703125, -0.0023298263549804688, -0.0016193389892578125, -0.0009088516235351562, -0.0001983642578125, 0.0005121231079101562, 0.0012226104736328125, 0.0019330978393554688, 0.002643585205078125, 0.0033540725708007812, 0.0040645599365234375, 0.004775047302246094, 0.00548553466796875, 0.006196022033691406, 0.0069065093994140625, 0.007616996765136719, 0.008327484130859375, 0.009037971496582031, 0.009748458862304688, 0.010458946228027344, 0.01116943359375, 0.011879920959472656, 0.012590408325195312, 0.013300895690917969, 0.014011383056640625, 0.014721870422363281, 0.015432357788085938, 0.016142845153808594, 0.01685333251953125, 0.017563819885253906, 0.018274307250976562, 0.01898479461669922, 0.019695281982421875, 0.02040576934814453, 0.021116256713867188, 0.021826744079589844, 0.0225372314453125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 34.0, 122.0, 278.0, 321.0, 169.0, 56.0, 19.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8447647094726562, -0.8157989382743835, -0.7868331670761108, -0.7578673958778381, -0.7289016246795654, -0.699935793876648, -0.67097008228302, -0.6420042514801025, -0.6130384802818298, -0.5840727090835571, -0.5551069378852844, -0.5261411666870117, -0.4971753656864166, -0.4682095944881439, -0.4392438232898712, -0.4102780222892761, -0.3813122808933258, -0.3523465096950531, -0.3233807384967804, -0.2944149374961853, -0.2654491662979126, -0.2364833950996399, -0.2075176239013672, -0.1785518378019333, -0.14958606660366058, -0.12062028795480728, -0.09165450930595398, -0.06268873810768127, -0.03372295945882797, -0.00475718080997467, 0.024208590388298035, 0.053174376487731934, 0.08214014768600464, 0.11110592633485794, 0.14007170498371124, 0.16903747618198395, 0.19800326228141785, 0.22696903347969055, 0.25593480467796326, 0.28490060567855835, 0.31386637687683105, 0.34283214807510376, 0.37179791927337646, 0.40076369047164917, 0.42972949147224426, 0.45869526267051697, 0.4876610338687897, 0.5166268348693848, 0.5455925464630127, 0.5745583176612854, 0.6035240888595581, 0.6324898600578308, 0.6614556312561035, 0.690421462059021, 0.7193871736526489, 0.7483530044555664, 0.7773187756538391, 0.8062845468521118, 0.8352503180503845, 0.8642160892486572, 0.8931818604469299, 0.9221476316452026, 0.9511134624481201, 0.9800792336463928, 1.0090450048446655]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 7.0, 7.0, 13.0, 11.0, 8.0, 16.0, 14.0, 32.0, 38.0, 27.0, 29.0, 35.0, 31.0, 57.0, 48.0, 49.0, 56.0, 38.0, 47.0, 42.0, 36.0, 41.0, 41.0, 50.0, 29.0, 26.0, 26.0, 24.0, 24.0, 21.0, 16.0, 11.0, 14.0, 8.0, 11.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.32525014877319336, -0.31658703088760376, -0.30792391300201416, -0.29926082491874695, -0.29059770703315735, -0.28193458914756775, -0.27327150106430054, -0.26460838317871094, -0.25594526529312134, -0.24728214740753174, -0.23861904442310333, -0.22995594143867493, -0.22129282355308533, -0.21262970566749573, -0.20396660268306732, -0.19530349969863892, -0.18664038181304932, -0.17797726392745972, -0.1693141609430313, -0.1606510579586029, -0.1519879400730133, -0.1433248221874237, -0.1346617192029953, -0.1259986162185669, -0.1173354983329773, -0.10867238789796829, -0.10000927746295929, -0.09134616702795029, -0.08268305659294128, -0.07401994615793228, -0.06535683572292328, -0.056693725287914276, -0.04803061485290527, -0.03936750441789627, -0.030704393982887268, -0.022041283547878265, -0.013378173112869263, -0.00471506267786026, 0.003948047757148743, 0.012611158192157745, 0.021274268627166748, 0.02993737906217575, 0.03860048949718475, 0.047263599932193756, 0.05592671036720276, 0.06458982080221176, 0.07325293123722076, 0.08191604167222977, 0.09057915210723877, 0.09924226254224777, 0.10790537297725677, 0.11656848341226578, 0.12523159384727478, 0.13389471173286438, 0.14255781471729279, 0.1512209177017212, 0.1598840355873108, 0.1685471534729004, 0.1772102564573288, 0.1858733594417572, 0.1945364773273468, 0.2031995952129364, 0.2118626981973648, 0.2205258011817932, 0.2291889190673828]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 11.0, 13.0, 26.0, 29.0, 44.0, 93.0, 154.0, 325.0, 600.0, 1381.0, 4174.0, 16024.0, 106255.0, 1421999.0, 2381849.0, 224435.0, 27405.0, 6181.0, 1869.0, 727.0, 305.0, 159.0, 83.0, 51.0, 34.0, 24.0, 10.0, 13.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0711669921875, -0.06880664825439453, -0.06644630432128906, -0.0640859603881836, -0.061725616455078125, -0.059365272521972656, -0.05700492858886719, -0.05464458465576172, -0.05228424072265625, -0.04992389678955078, -0.04756355285644531, -0.045203208923339844, -0.042842864990234375, -0.040482521057128906, -0.03812217712402344, -0.03576183319091797, -0.0334014892578125, -0.03104114532470703, -0.028680801391601562, -0.026320457458496094, -0.023960113525390625, -0.021599769592285156, -0.019239425659179688, -0.01687908172607422, -0.01451873779296875, -0.012158393859863281, -0.009798049926757812, -0.007437705993652344, -0.005077362060546875, -0.0027170181274414062, -0.0003566741943359375, 0.0020036697387695312, 0.004364013671875, 0.006724357604980469, 0.009084701538085938, 0.011445045471191406, 0.013805389404296875, 0.016165733337402344, 0.018526077270507812, 0.02088642120361328, 0.02324676513671875, 0.02560710906982422, 0.027967453002929688, 0.030327796936035156, 0.032688140869140625, 0.035048484802246094, 0.03740882873535156, 0.03976917266845703, 0.0421295166015625, 0.04448986053466797, 0.04685020446777344, 0.049210548400878906, 0.051570892333984375, 0.053931236267089844, 0.05629158020019531, 0.05865192413330078, 0.06101226806640625, 0.06337261199951172, 0.06573295593261719, 0.06809329986572266, 0.07045364379882812, 0.0728139877319336, 0.07517433166503906, 0.07753467559814453, 0.07989501953125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 7.0, 16.0, 20.0, 20.0, 15.0, 24.0, 29.0, 35.0, 60.0, 49.0, 56.0, 73.0, 68.0, 79.0, 77.0, 48.0, 60.0, 46.0, 48.0, 28.0, 34.0, 25.0, 21.0, 16.0, 14.0, 11.0, 2.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037841796875, -0.036448001861572266, -0.03505420684814453, -0.0336604118347168, -0.03226661682128906, -0.030872821807861328, -0.029479026794433594, -0.02808523178100586, -0.026691436767578125, -0.02529764175415039, -0.023903846740722656, -0.022510051727294922, -0.021116256713867188, -0.019722461700439453, -0.01832866668701172, -0.016934871673583984, -0.01554107666015625, -0.014147281646728516, -0.012753486633300781, -0.011359691619873047, -0.009965896606445312, -0.008572101593017578, -0.007178306579589844, -0.005784511566162109, -0.004390716552734375, -0.0029969215393066406, -0.0016031265258789062, -0.00020933151245117188, 0.0011844635009765625, 0.002578258514404297, 0.003972053527832031, 0.005365848541259766, 0.0067596435546875, 0.008153438568115234, 0.009547233581542969, 0.010941028594970703, 0.012334823608398438, 0.013728618621826172, 0.015122413635253906, 0.01651620864868164, 0.017910003662109375, 0.01930379867553711, 0.020697593688964844, 0.022091388702392578, 0.023485183715820312, 0.024878978729248047, 0.02627277374267578, 0.027666568756103516, 0.02906036376953125, 0.030454158782958984, 0.03184795379638672, 0.03324174880981445, 0.03463554382324219, 0.03602933883666992, 0.037423133850097656, 0.03881692886352539, 0.040210723876953125, 0.04160451889038086, 0.042998313903808594, 0.04439210891723633, 0.04578590393066406, 0.0471796989440918, 0.04857349395751953, 0.049967288970947266, 0.051361083984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 8.0, 15.0, 15.0, 18.0, 32.0, 40.0, 73.0, 150.0, 237.0, 633.0, 1620.0, 7387.0, 76988.0, 1916373.0, 2094500.0, 85550.0, 7795.0, 1646.0, 584.0, 260.0, 128.0, 72.0, 49.0, 26.0, 23.0, 17.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1402587890625, -0.13646984100341797, -0.13268089294433594, -0.1288919448852539, -0.12510299682617188, -0.12131404876708984, -0.11752510070800781, -0.11373615264892578, -0.10994720458984375, -0.10615825653076172, -0.10236930847167969, -0.09858036041259766, -0.09479141235351562, -0.0910024642944336, -0.08721351623535156, -0.08342456817626953, -0.0796356201171875, -0.07584667205810547, -0.07205772399902344, -0.0682687759399414, -0.06447982788085938, -0.060690879821777344, -0.05690193176269531, -0.05311298370361328, -0.04932403564453125, -0.04553508758544922, -0.04174613952636719, -0.037957191467285156, -0.034168243408203125, -0.030379295349121094, -0.026590347290039062, -0.02280139923095703, -0.019012451171875, -0.015223503112792969, -0.011434555053710938, -0.007645606994628906, -0.003856658935546875, -6.771087646484375e-05, 0.0037212371826171875, 0.007510185241699219, 0.01129913330078125, 0.015088081359863281, 0.018877029418945312, 0.022665977478027344, 0.026454925537109375, 0.030243873596191406, 0.03403282165527344, 0.03782176971435547, 0.0416107177734375, 0.04539966583251953, 0.04918861389160156, 0.052977561950683594, 0.056766510009765625, 0.060555458068847656, 0.06434440612792969, 0.06813335418701172, 0.07192230224609375, 0.07571125030517578, 0.07950019836425781, 0.08328914642333984, 0.08707809448242188, 0.0908670425415039, 0.09465599060058594, 0.09844493865966797, 0.10223388671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 16.0, 18.0, 31.0, 35.0, 58.0, 62.0, 105.0, 167.0, 185.0, 307.0, 386.0, 440.0, 456.0, 438.0, 346.0, 295.0, 190.0, 152.0, 90.0, 85.0, 56.0, 32.0, 36.0, 18.0, 13.0, 12.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0416259765625, -0.03992176055908203, -0.03821754455566406, -0.036513328552246094, -0.034809112548828125, -0.033104896545410156, -0.03140068054199219, -0.02969646453857422, -0.02799224853515625, -0.02628803253173828, -0.024583816528320312, -0.022879600524902344, -0.021175384521484375, -0.019471168518066406, -0.017766952514648438, -0.01606273651123047, -0.0143585205078125, -0.012654304504394531, -0.010950088500976562, -0.009245872497558594, -0.007541656494140625, -0.005837440490722656, -0.0041332244873046875, -0.0024290084838867188, -0.00072479248046875, 0.0009794235229492188, 0.0026836395263671875, 0.004387855529785156, 0.006092071533203125, 0.007796287536621094, 0.009500503540039062, 0.011204719543457031, 0.012908935546875, 0.014613151550292969, 0.016317367553710938, 0.018021583557128906, 0.019725799560546875, 0.021430015563964844, 0.023134231567382812, 0.02483844757080078, 0.02654266357421875, 0.02824687957763672, 0.029951095581054688, 0.031655311584472656, 0.033359527587890625, 0.035063743591308594, 0.03676795959472656, 0.03847217559814453, 0.0401763916015625, 0.04188060760498047, 0.04358482360839844, 0.045289039611816406, 0.046993255615234375, 0.048697471618652344, 0.05040168762207031, 0.05210590362548828, 0.05381011962890625, 0.05551433563232422, 0.05721855163574219, 0.058922767639160156, 0.060626983642578125, 0.062331199645996094, 0.06403541564941406, 0.06573963165283203, 0.06744384765625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 7.0, 16.0, 23.0, 49.0, 102.0, 165.0, 163.0, 173.0, 120.0, 86.0, 49.0, 28.0, 15.0, 12.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5891666412353516, -0.5762376189231873, -0.563308596611023, -0.5503795742988586, -0.5374505519866943, -0.52452152967453, -0.5115925073623657, -0.4986635148525238, -0.4857344925403595, -0.4728054702281952, -0.4598764479160309, -0.4469474256038666, -0.43401840329170227, -0.42108941078186035, -0.40816038846969604, -0.39523136615753174, -0.38230234384536743, -0.3693733215332031, -0.3564442992210388, -0.3435152769088745, -0.3305862545967102, -0.3176572322845459, -0.3047282099723816, -0.2917992174625397, -0.278870165348053, -0.26594114303588867, -0.25301212072372437, -0.24008309841156006, -0.22715409100055695, -0.21422506868839264, -0.20129604637622833, -0.18836703896522522, -0.1754380166530609, -0.1625089943408966, -0.1495799720287323, -0.136650949716568, -0.12372194230556488, -0.11079291999340057, -0.09786389768123627, -0.08493488281965256, -0.07200586050748825, -0.05907684192061424, -0.046147823333740234, -0.03321880102157593, -0.02028978243470192, -0.007360763847827911, 0.005568258464336395, 0.018497273325920105, 0.03142629563808441, 0.04435531422495842, 0.05728433281183243, 0.07021335512399673, 0.08314236998558044, 0.09607139229774475, 0.10900041460990906, 0.12192942947149277, 0.13485845923423767, 0.14778748154640198, 0.16071650385856628, 0.1736455261707306, 0.1865745335817337, 0.199503555893898, 0.21243257820606232, 0.22536158561706543, 0.23829060792922974]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 5.0, 12.0, 18.0, 19.0, 20.0, 17.0, 23.0, 28.0, 33.0, 21.0, 30.0, 28.0, 31.0, 34.0, 41.0, 46.0, 40.0, 35.0, 35.0, 45.0, 41.0, 36.0, 35.0, 39.0, 28.0, 29.0, 25.0, 26.0, 22.0, 23.0, 29.0, 15.0, 12.0, 15.0, 9.0, 10.0, 3.0, 14.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.16827094554901123, -0.16324302554130554, -0.15821510553359985, -0.15318717062473297, -0.14815925061702728, -0.1431313306093216, -0.1381033957004547, -0.13307547569274902, -0.12804755568504333, -0.12301963567733765, -0.11799170821905136, -0.11296378076076508, -0.10793586075305939, -0.1029079407453537, -0.09788001328706741, -0.09285208582878113, -0.08782416582107544, -0.08279624581336975, -0.07776831835508347, -0.07274039089679718, -0.06771247088909149, -0.0626845508813858, -0.05765662342309952, -0.05262869969010353, -0.047600775957107544, -0.04257285222411156, -0.03754492849111557, -0.03251700475811958, -0.027489081025123596, -0.02246115729212761, -0.017433233559131622, -0.012405309826135635, -0.0073773860931396484, -0.0023494623601436615, 0.0026784613728523254, 0.007706385105848312, 0.0127343088388443, 0.017762232571840286, 0.022790156304836273, 0.02781808003783226, 0.03284600377082825, 0.037873927503824234, 0.04290185123682022, 0.04792977496981621, 0.052957698702812195, 0.05798562243580818, 0.06301354616880417, 0.06804147362709045, 0.07306939363479614, 0.07809731364250183, 0.08312524110078812, 0.0881531685590744, 0.09318108856678009, 0.09820900857448578, 0.10323693603277206, 0.10826486349105835, 0.11329278349876404, 0.11832070350646973, 0.12334863096475601, 0.1283765584230423, 0.13340447843074799, 0.13843239843845367, 0.14346033334732056, 0.14848825335502625, 0.15351617336273193]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 8.0, 4.0, 16.0, 15.0, 29.0, 35.0, 57.0, 93.0, 188.0, 348.0, 690.0, 1570.0, 3984.0, 10791.0, 30928.0, 96468.0, 304231.0, 390091.0, 140717.0, 44117.0, 14804.0, 5393.0, 2112.0, 941.0, 413.0, 209.0, 113.0, 57.0, 45.0, 24.0, 23.0, 13.0, 11.0, 2.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.131591796875, -0.12831497192382812, -0.12503814697265625, -0.12176132202148438, -0.1184844970703125, -0.11520767211914062, -0.11193084716796875, -0.10865402221679688, -0.105377197265625, -0.10210037231445312, -0.09882354736328125, -0.09554672241210938, -0.0922698974609375, -0.08899307250976562, -0.08571624755859375, -0.08243942260742188, -0.07916259765625, -0.07588577270507812, -0.07260894775390625, -0.06933212280273438, -0.0660552978515625, -0.06277847290039062, -0.05950164794921875, -0.056224822998046875, -0.052947998046875, -0.049671173095703125, -0.04639434814453125, -0.043117523193359375, -0.0398406982421875, -0.036563873291015625, -0.03328704833984375, -0.030010223388671875, -0.0267333984375, -0.023456573486328125, -0.02017974853515625, -0.016902923583984375, -0.0136260986328125, -0.010349273681640625, -0.00707244873046875, -0.003795623779296875, -0.000518798828125, 0.002758026123046875, 0.00603485107421875, 0.009311676025390625, 0.0125885009765625, 0.015865325927734375, 0.01914215087890625, 0.022418975830078125, 0.02569580078125, 0.028972625732421875, 0.03224945068359375, 0.035526275634765625, 0.0388031005859375, 0.042079925537109375, 0.04535675048828125, 0.048633575439453125, 0.051910400390625, 0.055187225341796875, 0.05846405029296875, 0.061740875244140625, 0.0650177001953125, 0.06829452514648438, 0.07157135009765625, 0.07484817504882812, 0.078125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 6.0, 6.0, 8.0, 17.0, 22.0, 22.0, 24.0, 30.0, 38.0, 39.0, 49.0, 67.0, 59.0, 62.0, 66.0, 75.0, 55.0, 64.0, 54.0, 33.0, 44.0, 44.0, 31.0, 15.0, 18.0, 13.0, 16.0, 10.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04296875, -0.04165077209472656, -0.040332794189453125, -0.03901481628417969, -0.03769683837890625, -0.03637886047363281, -0.035060882568359375, -0.03374290466308594, -0.0324249267578125, -0.031106948852539062, -0.029788970947265625, -0.028470993041992188, -0.02715301513671875, -0.025835037231445312, -0.024517059326171875, -0.023199081420898438, -0.021881103515625, -0.020563125610351562, -0.019245147705078125, -0.017927169799804688, -0.01660919189453125, -0.015291213989257812, -0.013973236083984375, -0.012655258178710938, -0.0113372802734375, -0.010019302368164062, -0.008701324462890625, -0.0073833465576171875, -0.00606536865234375, -0.0047473907470703125, -0.003429412841796875, -0.0021114349365234375, -0.00079345703125, 0.0005245208740234375, 0.001842498779296875, 0.0031604766845703125, 0.00447845458984375, 0.0057964324951171875, 0.007114410400390625, 0.008432388305664062, 0.0097503662109375, 0.011068344116210938, 0.012386322021484375, 0.013704299926757812, 0.01502227783203125, 0.016340255737304688, 0.017658233642578125, 0.018976211547851562, 0.020294189453125, 0.021612167358398438, 0.022930145263671875, 0.024248123168945312, 0.02556610107421875, 0.026884078979492188, 0.028202056884765625, 0.029520034790039062, 0.0308380126953125, 0.03215599060058594, 0.033473968505859375, 0.03479194641113281, 0.03610992431640625, 0.03742790222167969, 0.038745880126953125, 0.04006385803222656, 0.0413818359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 7.0, 5.0, 5.0, 14.0, 12.0, 13.0, 12.0, 9.0, 18.0, 28.0, 32.0, 42.0, 62.0, 84.0, 178.0, 323.0, 824.0, 2198.0, 5862.0, 16586.0, 46223.0, 122305.0, 289946.0, 324370.0, 150181.0, 56765.0, 20611.0, 7348.0, 2610.0, 969.0, 410.0, 173.0, 86.0, 70.0, 39.0, 26.0, 23.0, 19.0, 17.0, 14.0, 6.0, 11.0, 5.0, 8.0, 4.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0892333984375, -0.08636474609375, -0.08349609375, -0.08062744140625, -0.0777587890625, -0.07489013671875, -0.072021484375, -0.06915283203125, -0.0662841796875, -0.06341552734375, -0.060546875, -0.05767822265625, -0.0548095703125, -0.05194091796875, -0.049072265625, -0.04620361328125, -0.0433349609375, -0.04046630859375, -0.03759765625, -0.03472900390625, -0.0318603515625, -0.02899169921875, -0.026123046875, -0.02325439453125, -0.0203857421875, -0.01751708984375, -0.0146484375, -0.01177978515625, -0.0089111328125, -0.00604248046875, -0.003173828125, -0.00030517578125, 0.0025634765625, 0.00543212890625, 0.00830078125, 0.01116943359375, 0.0140380859375, 0.01690673828125, 0.019775390625, 0.02264404296875, 0.0255126953125, 0.02838134765625, 0.03125, 0.03411865234375, 0.0369873046875, 0.03985595703125, 0.042724609375, 0.04559326171875, 0.0484619140625, 0.05133056640625, 0.05419921875, 0.05706787109375, 0.0599365234375, 0.06280517578125, 0.065673828125, 0.06854248046875, 0.0714111328125, 0.07427978515625, 0.0771484375, 0.08001708984375, 0.0828857421875, 0.08575439453125, 0.088623046875, 0.09149169921875, 0.0943603515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 6.0, 6.0, 8.0, 10.0, 6.0, 16.0, 11.0, 12.0, 17.0, 17.0, 19.0, 28.0, 21.0, 28.0, 21.0, 25.0, 30.0, 33.0, 34.0, 27.0, 46.0, 47.0, 41.0, 48.0, 19.0, 39.0, 39.0, 33.0, 33.0, 25.0, 27.0, 29.0, 23.0, 30.0, 25.0, 17.0, 23.0, 20.0, 8.0, 5.0, 12.0, 14.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.078125, -0.07583045959472656, -0.07353591918945312, -0.07124137878417969, -0.06894683837890625, -0.06665229797363281, -0.06435775756835938, -0.06206321716308594, -0.0597686767578125, -0.05747413635253906, -0.055179595947265625, -0.05288505554199219, -0.05059051513671875, -0.04829597473144531, -0.046001434326171875, -0.04370689392089844, -0.041412353515625, -0.03911781311035156, -0.036823272705078125, -0.03452873229980469, -0.03223419189453125, -0.029939651489257812, -0.027645111083984375, -0.025350570678710938, -0.0230560302734375, -0.020761489868164062, -0.018466949462890625, -0.016172409057617188, -0.01387786865234375, -0.011583328247070312, -0.009288787841796875, -0.0069942474365234375, -0.00469970703125, -0.0024051666259765625, -0.000110626220703125, 0.0021839141845703125, 0.00447845458984375, 0.0067729949951171875, 0.009067535400390625, 0.011362075805664062, 0.0136566162109375, 0.015951156616210938, 0.018245697021484375, 0.020540237426757812, 0.02283477783203125, 0.025129318237304688, 0.027423858642578125, 0.029718399047851562, 0.032012939453125, 0.03430747985839844, 0.036602020263671875, 0.03889656066894531, 0.04119110107421875, 0.04348564147949219, 0.045780181884765625, 0.04807472229003906, 0.0503692626953125, 0.05266380310058594, 0.054958343505859375, 0.05725288391113281, 0.05954742431640625, 0.06184196472167969, 0.06413650512695312, 0.06643104553222656, 0.0687255859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 11.0, 8.0, 11.0, 14.0, 18.0, 28.0, 62.0, 58.0, 84.0, 163.0, 214.0, 348.0, 571.0, 996.0, 1661.0, 2743.0, 4686.0, 8425.0, 15118.0, 28022.0, 51620.0, 92884.0, 156676.0, 213101.0, 191897.0, 123294.0, 69395.0, 38615.0, 20834.0, 11466.0, 6395.0, 3695.0, 2188.0, 1252.0, 741.0, 454.0, 288.0, 165.0, 104.0, 82.0, 48.0, 34.0, 24.0, 22.0, 12.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0211639404296875, -0.02045273780822754, -0.019741535186767578, -0.019030332565307617, -0.018319129943847656, -0.017607927322387695, -0.016896724700927734, -0.016185522079467773, -0.015474319458007812, -0.014763116836547852, -0.01405191421508789, -0.01334071159362793, -0.012629508972167969, -0.011918306350708008, -0.011207103729248047, -0.010495901107788086, -0.009784698486328125, -0.009073495864868164, -0.008362293243408203, -0.007651090621948242, -0.006939888000488281, -0.00622868537902832, -0.005517482757568359, -0.0048062801361083984, -0.0040950775146484375, -0.0033838748931884766, -0.0026726722717285156, -0.0019614696502685547, -0.0012502670288085938, -0.0005390644073486328, 0.00017213821411132812, 0.0008833408355712891, 0.00159454345703125, 0.002305746078491211, 0.003016948699951172, 0.003728151321411133, 0.004439353942871094, 0.005150556564331055, 0.005861759185791016, 0.0065729618072509766, 0.0072841644287109375, 0.007995367050170898, 0.00870656967163086, 0.00941777229309082, 0.010128974914550781, 0.010840177536010742, 0.011551380157470703, 0.012262582778930664, 0.012973785400390625, 0.013684988021850586, 0.014396190643310547, 0.015107393264770508, 0.01581859588623047, 0.01652979850769043, 0.01724100112915039, 0.01795220375061035, 0.018663406372070312, 0.019374608993530273, 0.020085811614990234, 0.020797014236450195, 0.021508216857910156, 0.022219419479370117, 0.022930622100830078, 0.02364182472229004, 0.02435302734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 6.0, 2.0, 10.0, 6.0, 12.0, 12.0, 13.0, 15.0, 20.0, 26.0, 29.0, 36.0, 37.0, 58.0, 62.0, 54.0, 75.0, 72.0, 39.0, 65.0, 56.0, 52.0, 27.0, 34.0, 31.0, 21.0, 20.0, 23.0, 9.0, 11.0, 13.0, 7.0, 10.0, 7.0, 6.0, 2.0, 4.0, 6.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.519918441772461e-05, -1.4643184840679169e-05, -1.4087185263633728e-05, -1.3531185686588287e-05, -1.2975186109542847e-05, -1.2419186532497406e-05, -1.1863186955451965e-05, -1.1307187378406525e-05, -1.0751187801361084e-05, -1.0195188224315643e-05, -9.639188647270203e-06, -9.083189070224762e-06, -8.527189493179321e-06, -7.97118991613388e-06, -7.41519033908844e-06, -6.859190762042999e-06, -6.303191184997559e-06, -5.747191607952118e-06, -5.191192030906677e-06, -4.6351924538612366e-06, -4.079192876815796e-06, -3.5231932997703552e-06, -2.9671937227249146e-06, -2.411194145679474e-06, -1.8551945686340332e-06, -1.2991949915885925e-06, -7.431954145431519e-07, -1.8719583749771118e-07, 3.688037395477295e-07, 9.248033165931702e-07, 1.4808028936386108e-06, 2.0368024706840515e-06, 2.592802047729492e-06, 3.148801624774933e-06, 3.7048012018203735e-06, 4.260800778865814e-06, 4.816800355911255e-06, 5.3727999329566956e-06, 5.928799510002136e-06, 6.484799087047577e-06, 7.040798664093018e-06, 7.596798241138458e-06, 8.152797818183899e-06, 8.70879739522934e-06, 9.26479697227478e-06, 9.820796549320221e-06, 1.0376796126365662e-05, 1.0932795703411102e-05, 1.1488795280456543e-05, 1.2044794857501984e-05, 1.2600794434547424e-05, 1.3156794011592865e-05, 1.3712793588638306e-05, 1.4268793165683746e-05, 1.4824792742729187e-05, 1.5380792319774628e-05, 1.593679189682007e-05, 1.649279147386551e-05, 1.704879105091095e-05, 1.760479062795639e-05, 1.816079020500183e-05, 1.8716789782047272e-05, 1.9272789359092712e-05, 1.9828788936138153e-05, 2.0384788513183594e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 4.0, 5.0, 12.0, 7.0, 17.0, 26.0, 53.0, 81.0, 146.0, 259.0, 522.0, 1056.0, 2157.0, 4538.0, 9685.0, 21872.0, 47050.0, 101655.0, 196151.0, 264486.0, 200862.0, 106177.0, 49889.0, 22483.0, 10180.0, 4636.0, 2236.0, 1035.0, 571.0, 257.0, 154.0, 97.0, 60.0, 25.0, 25.0, 14.0, 13.0, 7.0, 6.0, 9.0, 8.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0241851806640625, -0.023392915725708008, -0.022600650787353516, -0.021808385848999023, -0.02101612091064453, -0.02022385597229004, -0.019431591033935547, -0.018639326095581055, -0.017847061157226562, -0.01705479621887207, -0.016262531280517578, -0.015470266342163086, -0.014678001403808594, -0.013885736465454102, -0.01309347152709961, -0.012301206588745117, -0.011508941650390625, -0.010716676712036133, -0.00992441177368164, -0.009132146835327148, -0.008339881896972656, -0.007547616958618164, -0.006755352020263672, -0.00596308708190918, -0.0051708221435546875, -0.004378557205200195, -0.003586292266845703, -0.002794027328491211, -0.0020017623901367188, -0.0012094974517822266, -0.0004172325134277344, 0.0003750324249267578, 0.00116729736328125, 0.001959562301635742, 0.0027518272399902344, 0.0035440921783447266, 0.004336357116699219, 0.005128622055053711, 0.005920886993408203, 0.006713151931762695, 0.0075054168701171875, 0.00829768180847168, 0.009089946746826172, 0.009882211685180664, 0.010674476623535156, 0.011466741561889648, 0.01225900650024414, 0.013051271438598633, 0.013843536376953125, 0.014635801315307617, 0.01542806625366211, 0.0162203311920166, 0.017012596130371094, 0.017804861068725586, 0.018597126007080078, 0.01938939094543457, 0.020181655883789062, 0.020973920822143555, 0.021766185760498047, 0.02255845069885254, 0.02335071563720703, 0.024142980575561523, 0.024935245513916016, 0.025727510452270508, 0.026519775390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 7.0, 6.0, 5.0, 8.0, 7.0, 9.0, 6.0, 4.0, 14.0, 15.0, 8.0, 12.0, 15.0, 18.0, 31.0, 33.0, 31.0, 28.0, 34.0, 56.0, 52.0, 61.0, 51.0, 58.0, 53.0, 55.0, 47.0, 35.0, 39.0, 40.0, 30.0, 19.0, 23.0, 19.0, 14.0, 9.0, 5.0, 6.0, 11.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.0222930908203125, -0.02165079116821289, -0.02100849151611328, -0.020366191864013672, -0.019723892211914062, -0.019081592559814453, -0.018439292907714844, -0.017796993255615234, -0.017154693603515625, -0.016512393951416016, -0.015870094299316406, -0.015227794647216797, -0.014585494995117188, -0.013943195343017578, -0.013300895690917969, -0.01265859603881836, -0.01201629638671875, -0.01137399673461914, -0.010731697082519531, -0.010089397430419922, -0.009447097778320312, -0.008804798126220703, -0.008162498474121094, -0.007520198822021484, -0.006877899169921875, -0.006235599517822266, -0.005593299865722656, -0.004951000213623047, -0.0043087005615234375, -0.003666400909423828, -0.0030241012573242188, -0.0023818016052246094, -0.001739501953125, -0.0010972023010253906, -0.00045490264892578125, 0.00018739700317382812, 0.0008296966552734375, 0.0014719963073730469, 0.0021142959594726562, 0.0027565956115722656, 0.003398895263671875, 0.004041194915771484, 0.004683494567871094, 0.005325794219970703, 0.0059680938720703125, 0.006610393524169922, 0.007252693176269531, 0.00789499282836914, 0.00853729248046875, 0.00917959213256836, 0.009821891784667969, 0.010464191436767578, 0.011106491088867188, 0.011748790740966797, 0.012391090393066406, 0.013033390045166016, 0.013675689697265625, 0.014317989349365234, 0.014960289001464844, 0.015602588653564453, 0.016244888305664062, 0.016887187957763672, 0.01752948760986328, 0.01817178726196289, 0.0188140869140625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 3.0, 7.0, 14.0, 15.0, 27.0, 20.0, 45.0, 52.0, 49.0, 61.0, 86.0, 85.0, 81.0, 69.0, 74.0, 71.0, 52.0, 53.0, 34.0, 24.0, 25.0, 7.0, 16.0, 8.0, 10.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21301813423633575, -0.20575805008411407, -0.1984979808330536, -0.1912378966808319, -0.18397781252861023, -0.17671772837638855, -0.16945765912532806, -0.16219757497310638, -0.1549375057220459, -0.14767742156982422, -0.14041735231876373, -0.13315726816654205, -0.12589718401432037, -0.11863710731267929, -0.11137703061103821, -0.10411694645881653, -0.09685686230659485, -0.08959678560495377, -0.08233670145273209, -0.075076624751091, -0.06781654059886932, -0.06055646389722824, -0.05329638719558716, -0.04603630676865578, -0.038776226341724396, -0.031516145914793015, -0.024256067350506783, -0.01699598878622055, -0.00973590835928917, -0.002475827932357788, 0.004784248769283295, 0.012044329196214676, 0.01930442452430725, 0.026564504951238632, 0.03382458537817001, 0.041084662079811096, 0.04834474250674248, 0.05560482293367386, 0.06286489963531494, 0.07012498378753662, 0.0773850604891777, 0.08464513719081879, 0.09190522134304047, 0.09916529804468155, 0.10642537474632263, 0.11368545889854431, 0.1209455356001854, 0.12820561230182648, 0.13546569645404816, 0.14272578060626984, 0.14998584985733032, 0.157245934009552, 0.16450601816177368, 0.17176610231399536, 0.17902617156505585, 0.18628625571727753, 0.193546324968338, 0.2008064091205597, 0.20806647837162018, 0.21532656252384186, 0.22258664667606354, 0.22984671592712402, 0.2371068000793457, 0.24436688423156738, 0.25162696838378906]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 5.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 12.0, 10.0, 13.0, 13.0, 17.0, 24.0, 27.0, 26.0, 31.0, 31.0, 39.0, 33.0, 35.0, 52.0, 42.0, 43.0, 42.0, 41.0, 58.0, 36.0, 42.0, 44.0, 44.0, 41.0, 24.0, 24.0, 22.0, 22.0, 27.0, 12.0, 13.0, 10.0, 5.0, 1.0, 8.0, 5.0, 3.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2907903790473938, -0.2819488048553467, -0.27310723066329956, -0.26426562666893005, -0.25542405247688293, -0.24658247828483582, -0.2377409040927887, -0.22889931499958038, -0.22005772590637207, -0.21121615171432495, -0.20237456262111664, -0.19353298842906952, -0.1846913993358612, -0.1758498251438141, -0.16700825095176697, -0.15816666185855865, -0.14932508766651154, -0.14048351347446442, -0.1316419243812561, -0.12280035018920898, -0.11395876109600067, -0.10511718690395355, -0.09627560526132584, -0.08743402361869812, -0.0785924419760704, -0.06975086033344269, -0.06090927869081497, -0.052067700773477554, -0.04322611913084984, -0.03438453748822212, -0.025542959570884705, -0.01670137792825699, -0.007859796285629272, 0.000981784425675869, 0.00982336513698101, 0.018664944916963577, 0.027506526559591293, 0.03634810820221901, 0.04518968611955643, 0.05403126776218414, 0.06287284940481186, 0.07171443104743958, 0.08055601269006729, 0.08939759433269501, 0.09823916852474213, 0.10708075761795044, 0.11592233180999756, 0.12476391345262527, 0.133605495095253, 0.1424470692873001, 0.15128865838050842, 0.16013023257255554, 0.16897182166576385, 0.17781339585781097, 0.1866549849510193, 0.1954965591430664, 0.20433813333511353, 0.21317970752716064, 0.22202129662036896, 0.23086287081241608, 0.2397044599056244, 0.2485460340976715, 0.25738760828971863, 0.26622921228408813, 0.27507078647613525]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 5.0, 10.0, 23.0, 33.0, 44.0, 72.0, 129.0, 222.0, 487.0, 1334.0, 4798.0, 24569.0, 294424.0, 3254168.0, 567447.0, 37528.0, 6345.0, 1584.0, 526.0, 229.0, 123.0, 70.0, 43.0, 25.0, 12.0, 13.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0897216796875, -0.0864706039428711, -0.08321952819824219, -0.07996845245361328, -0.07671737670898438, -0.07346630096435547, -0.07021522521972656, -0.06696414947509766, -0.06371307373046875, -0.060461997985839844, -0.05721092224121094, -0.05395984649658203, -0.050708770751953125, -0.04745769500732422, -0.04420661926269531, -0.040955543518066406, -0.0377044677734375, -0.034453392028808594, -0.031202316284179688, -0.02795124053955078, -0.024700164794921875, -0.02144908905029297, -0.018198013305664062, -0.014946937561035156, -0.01169586181640625, -0.008444786071777344, -0.0051937103271484375, -0.0019426345825195312, 0.001308441162109375, 0.004559516906738281, 0.0078105926513671875, 0.011061668395996094, 0.014312744140625, 0.017563819885253906, 0.020814895629882812, 0.02406597137451172, 0.027317047119140625, 0.03056812286376953, 0.03381919860839844, 0.037070274353027344, 0.04032135009765625, 0.043572425842285156, 0.04682350158691406, 0.05007457733154297, 0.053325653076171875, 0.05657672882080078, 0.05982780456542969, 0.0630788803100586, 0.0663299560546875, 0.0695810317993164, 0.07283210754394531, 0.07608318328857422, 0.07933425903320312, 0.08258533477783203, 0.08583641052246094, 0.08908748626708984, 0.09233856201171875, 0.09558963775634766, 0.09884071350097656, 0.10209178924560547, 0.10534286499023438, 0.10859394073486328, 0.11184501647949219, 0.1150960922241211, 0.11834716796875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 11.0, 12.0, 11.0, 24.0, 29.0, 23.0, 35.0, 49.0, 48.0, 61.0, 63.0, 66.0, 68.0, 66.0, 68.0, 62.0, 55.0, 53.0, 45.0, 37.0, 26.0, 22.0, 23.0, 12.0, 10.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044586181640625, -0.04314374923706055, -0.041701316833496094, -0.04025888442993164, -0.03881645202636719, -0.037374019622802734, -0.03593158721923828, -0.03448915481567383, -0.033046722412109375, -0.03160429000854492, -0.03016185760498047, -0.028719425201416016, -0.027276992797851562, -0.02583456039428711, -0.024392127990722656, -0.022949695587158203, -0.02150726318359375, -0.020064830780029297, -0.018622398376464844, -0.01717996597290039, -0.015737533569335938, -0.014295101165771484, -0.012852668762207031, -0.011410236358642578, -0.009967803955078125, -0.008525371551513672, -0.007082939147949219, -0.005640506744384766, -0.0041980743408203125, -0.0027556419372558594, -0.0013132095336914062, 0.00012922286987304688, 0.0015716552734375, 0.003014087677001953, 0.004456520080566406, 0.005898952484130859, 0.0073413848876953125, 0.008783817291259766, 0.010226249694824219, 0.011668682098388672, 0.013111114501953125, 0.014553546905517578, 0.01599597930908203, 0.017438411712646484, 0.018880844116210938, 0.02032327651977539, 0.021765708923339844, 0.023208141326904297, 0.02465057373046875, 0.026093006134033203, 0.027535438537597656, 0.02897787094116211, 0.030420303344726562, 0.031862735748291016, 0.03330516815185547, 0.03474760055541992, 0.036190032958984375, 0.03763246536254883, 0.03907489776611328, 0.040517330169677734, 0.04195976257324219, 0.04340219497680664, 0.044844627380371094, 0.04628705978393555, 0.0477294921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 5.0, 6.0, 9.0, 25.0, 20.0, 50.0, 41.0, 70.0, 110.0, 213.0, 405.0, 1042.0, 3419.0, 20232.0, 279823.0, 3138989.0, 702508.0, 39479.0, 5363.0, 1342.0, 518.0, 208.0, 135.0, 90.0, 55.0, 35.0, 24.0, 23.0, 16.0, 9.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.137451171875, -0.13370037078857422, -0.12994956970214844, -0.12619876861572266, -0.12244796752929688, -0.1186971664428711, -0.11494636535644531, -0.11119556427001953, -0.10744476318359375, -0.10369396209716797, -0.09994316101074219, -0.0961923599243164, -0.09244155883789062, -0.08869075775146484, -0.08493995666503906, -0.08118915557861328, -0.0774383544921875, -0.07368755340576172, -0.06993675231933594, -0.06618595123291016, -0.062435150146484375, -0.058684349060058594, -0.05493354797363281, -0.05118274688720703, -0.04743194580078125, -0.04368114471435547, -0.03993034362792969, -0.036179542541503906, -0.032428741455078125, -0.028677940368652344, -0.024927139282226562, -0.02117633819580078, -0.017425537109375, -0.013674736022949219, -0.009923934936523438, -0.006173133850097656, -0.002422332763671875, 0.0013284683227539062, 0.0050792694091796875, 0.008830070495605469, 0.01258087158203125, 0.01633167266845703, 0.020082473754882812, 0.023833274841308594, 0.027584075927734375, 0.031334877014160156, 0.03508567810058594, 0.03883647918701172, 0.0425872802734375, 0.04633808135986328, 0.05008888244628906, 0.053839683532714844, 0.057590484619140625, 0.061341285705566406, 0.06509208679199219, 0.06884288787841797, 0.07259368896484375, 0.07634449005126953, 0.08009529113769531, 0.0838460922241211, 0.08759689331054688, 0.09134769439697266, 0.09509849548339844, 0.09884929656982422, 0.10260009765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 3.0, 12.0, 14.0, 18.0, 15.0, 28.0, 48.0, 65.0, 77.0, 119.0, 171.0, 221.0, 313.0, 365.0, 462.0, 448.0, 422.0, 324.0, 267.0, 210.0, 127.0, 88.0, 69.0, 43.0, 34.0, 22.0, 25.0, 16.0, 15.0, 9.0, 5.0, 1.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039703369140625, -0.03806161880493164, -0.03641986846923828, -0.03477811813354492, -0.03313636779785156, -0.0314946174621582, -0.029852867126464844, -0.028211116790771484, -0.026569366455078125, -0.024927616119384766, -0.023285865783691406, -0.021644115447998047, -0.020002365112304688, -0.018360614776611328, -0.01671886444091797, -0.01507711410522461, -0.01343536376953125, -0.01179361343383789, -0.010151863098144531, -0.008510112762451172, -0.0068683624267578125, -0.005226612091064453, -0.0035848617553710938, -0.0019431114196777344, -0.000301361083984375, 0.0013403892517089844, 0.0029821395874023438, 0.004623889923095703, 0.0062656402587890625, 0.007907390594482422, 0.009549140930175781, 0.01119089126586914, 0.0128326416015625, 0.01447439193725586, 0.01611614227294922, 0.017757892608642578, 0.019399642944335938, 0.021041393280029297, 0.022683143615722656, 0.024324893951416016, 0.025966644287109375, 0.027608394622802734, 0.029250144958496094, 0.030891895294189453, 0.03253364562988281, 0.03417539596557617, 0.03581714630126953, 0.03745889663696289, 0.03910064697265625, 0.04074239730834961, 0.04238414764404297, 0.04402589797973633, 0.04566764831542969, 0.04730939865112305, 0.048951148986816406, 0.050592899322509766, 0.052234649658203125, 0.053876399993896484, 0.055518150329589844, 0.0571599006652832, 0.05880165100097656, 0.06044340133666992, 0.06208515167236328, 0.06372690200805664, 0.06536865234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 9.0, 16.0, 24.0, 31.0, 39.0, 75.0, 75.0, 91.0, 96.0, 113.0, 110.0, 89.0, 71.0, 57.0, 34.0, 22.0, 18.0, 13.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35860559344291687, -0.34958165884017944, -0.340557724237442, -0.3315337896347046, -0.32250985503196716, -0.31348592042922974, -0.3044620156288147, -0.29543808102607727, -0.28641414642333984, -0.2773902118206024, -0.268366277217865, -0.25934234261512756, -0.25031840801239014, -0.2412944883108139, -0.23227055370807648, -0.22324663400650024, -0.21422268450260162, -0.2051987498998642, -0.19617481529712677, -0.18715089559555054, -0.1781269609928131, -0.16910302639007568, -0.16007909178733826, -0.15105515718460083, -0.1420312225818634, -0.13300728797912598, -0.12398336082696915, -0.11495942622423172, -0.10593549907207489, -0.09691156446933746, -0.08788762986660004, -0.0788637027144432, -0.06983977556228638, -0.06081584468483925, -0.05179191380739212, -0.042767979204654694, -0.033744048327207565, -0.024720117449760437, -0.01569618284702301, -0.00667225569486618, 0.0023516789078712463, 0.01137561071664095, 0.020399542525410652, 0.02942347526550293, 0.03844740614295006, 0.047471337020397186, 0.05649527162313461, 0.06551919877529144, 0.07454313337802887, 0.0835670679807663, 0.09259099513292313, 0.10161492973566055, 0.11063885688781738, 0.11966279149055481, 0.12868672609329224, 0.13771066069602966, 0.1467345952987671, 0.15575852990150452, 0.16478246450424194, 0.17380639910697937, 0.1828303188085556, 0.19185425341129303, 0.20087818801403046, 0.2099021077156067, 0.21892604231834412]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 3.0, 3.0, 11.0, 9.0, 8.0, 10.0, 20.0, 23.0, 18.0, 24.0, 31.0, 27.0, 26.0, 26.0, 24.0, 37.0, 44.0, 41.0, 35.0, 30.0, 31.0, 35.0, 41.0, 47.0, 44.0, 34.0, 34.0, 32.0, 41.0, 18.0, 31.0, 19.0, 17.0, 16.0, 24.0, 12.0, 11.0, 6.0, 9.0, 9.0, 11.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1703234314918518, -0.16501012444496155, -0.1596968173980713, -0.15438351035118103, -0.14907020330429077, -0.14375688135623932, -0.13844357430934906, -0.1331302672624588, -0.12781696021556854, -0.12250365316867828, -0.11719034612178802, -0.11187703162431717, -0.10656372457742691, -0.10125041753053665, -0.0959371030330658, -0.09062379598617554, -0.08531048893928528, -0.07999718189239502, -0.07468387484550476, -0.0693705603480339, -0.06405725330114365, -0.05874394625425339, -0.05343063548207283, -0.04811732470989227, -0.042804017663002014, -0.037490710616111755, -0.0321773998439312, -0.02686409093439579, -0.021550782024860382, -0.016237473115324974, -0.010924164205789566, -0.005610853433609009, -0.00029754638671875, 0.005015762522816658, 0.010329071432352066, 0.015642380341887474, 0.020955689251422882, 0.02626899816095829, 0.0315823070704937, 0.036895617842674255, 0.042208924889564514, 0.04752223193645477, 0.05283554270863533, 0.05814885348081589, 0.06346216052770615, 0.0687754675745964, 0.07408878207206726, 0.07940208911895752, 0.08471539616584778, 0.09002870321273804, 0.0953420102596283, 0.10065532475709915, 0.10596863180398941, 0.11128193885087967, 0.11659525334835052, 0.12190856039524078, 0.12722186744213104, 0.1325351744890213, 0.13784848153591156, 0.14316178858280182, 0.14847511053085327, 0.15378841757774353, 0.1591017246246338, 0.16441503167152405, 0.1697283387184143]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 6.0, 3.0, 9.0, 11.0, 10.0, 15.0, 18.0, 23.0, 27.0, 43.0, 66.0, 95.0, 187.0, 282.0, 557.0, 1106.0, 2232.0, 4546.0, 10306.0, 23842.0, 59755.0, 155246.0, 324251.0, 274249.0, 114511.0, 43832.0, 18113.0, 7766.0, 3666.0, 1769.0, 863.0, 451.0, 266.0, 133.0, 83.0, 69.0, 44.0, 36.0, 23.0, 11.0, 8.0, 8.0, 5.0, 2.0, 4.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.142578125, -0.1379547119140625, -0.133331298828125, -0.1287078857421875, -0.12408447265625, -0.1194610595703125, -0.114837646484375, -0.1102142333984375, -0.1055908203125, -0.1009674072265625, -0.096343994140625, -0.0917205810546875, -0.08709716796875, -0.0824737548828125, -0.077850341796875, -0.0732269287109375, -0.068603515625, -0.0639801025390625, -0.059356689453125, -0.0547332763671875, -0.05010986328125, -0.0454864501953125, -0.040863037109375, -0.0362396240234375, -0.0316162109375, -0.0269927978515625, -0.022369384765625, -0.0177459716796875, -0.01312255859375, -0.0084991455078125, -0.003875732421875, 0.0007476806640625, 0.00537109375, 0.0099945068359375, 0.014617919921875, 0.0192413330078125, 0.02386474609375, 0.0284881591796875, 0.033111572265625, 0.0377349853515625, 0.0423583984375, 0.0469818115234375, 0.051605224609375, 0.0562286376953125, 0.06085205078125, 0.0654754638671875, 0.070098876953125, 0.0747222900390625, 0.079345703125, 0.0839691162109375, 0.088592529296875, 0.0932159423828125, 0.09783935546875, 0.1024627685546875, 0.107086181640625, 0.1117095947265625, 0.1163330078125, 0.1209564208984375, 0.125579833984375, 0.1302032470703125, 0.13482666015625, 0.1394500732421875, 0.144073486328125, 0.1486968994140625, 0.1533203125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 10.0, 5.0, 13.0, 13.0, 18.0, 23.0, 30.0, 32.0, 31.0, 31.0, 44.0, 52.0, 71.0, 60.0, 72.0, 76.0, 51.0, 47.0, 52.0, 61.0, 42.0, 31.0, 35.0, 31.0, 19.0, 18.0, 11.0, 9.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042388916015625, -0.04110145568847656, -0.039813995361328125, -0.03852653503417969, -0.03723907470703125, -0.03595161437988281, -0.034664154052734375, -0.03337669372558594, -0.0320892333984375, -0.030801773071289062, -0.029514312744140625, -0.028226852416992188, -0.02693939208984375, -0.025651931762695312, -0.024364471435546875, -0.023077011108398438, -0.02178955078125, -0.020502090454101562, -0.019214630126953125, -0.017927169799804688, -0.01663970947265625, -0.015352249145507812, -0.014064788818359375, -0.012777328491210938, -0.0114898681640625, -0.010202407836914062, -0.008914947509765625, -0.0076274871826171875, -0.00634002685546875, -0.0050525665283203125, -0.003765106201171875, -0.0024776458740234375, -0.001190185546875, 9.72747802734375e-05, 0.001384735107421875, 0.0026721954345703125, 0.00395965576171875, 0.0052471160888671875, 0.006534576416015625, 0.007822036743164062, 0.0091094970703125, 0.010396957397460938, 0.011684417724609375, 0.012971878051757812, 0.01425933837890625, 0.015546798706054688, 0.016834259033203125, 0.018121719360351562, 0.0194091796875, 0.020696640014648438, 0.021984100341796875, 0.023271560668945312, 0.02455902099609375, 0.025846481323242188, 0.027133941650390625, 0.028421401977539062, 0.0297088623046875, 0.030996322631835938, 0.032283782958984375, 0.03357124328613281, 0.03485870361328125, 0.03614616394042969, 0.037433624267578125, 0.03872108459472656, 0.040008544921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 8.0, 5.0, 5.0, 7.0, 10.0, 7.0, 20.0, 17.0, 33.0, 41.0, 67.0, 83.0, 121.0, 176.0, 288.0, 518.0, 845.0, 1443.0, 2541.0, 4738.0, 9358.0, 19102.0, 43937.0, 99899.0, 202219.0, 274672.0, 203150.0, 101202.0, 44062.0, 19680.0, 9415.0, 4643.0, 2521.0, 1507.0, 794.0, 510.0, 292.0, 187.0, 142.0, 94.0, 60.0, 42.0, 24.0, 30.0, 13.0, 9.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09136962890625, -0.0881643295288086, -0.08495903015136719, -0.08175373077392578, -0.07854843139648438, -0.07534313201904297, -0.07213783264160156, -0.06893253326416016, -0.06572723388671875, -0.06252193450927734, -0.05931663513183594, -0.05611133575439453, -0.052906036376953125, -0.04970073699951172, -0.04649543762207031, -0.043290138244628906, -0.0400848388671875, -0.036879539489746094, -0.03367424011230469, -0.03046894073486328, -0.027263641357421875, -0.02405834197998047, -0.020853042602539062, -0.017647743225097656, -0.01444244384765625, -0.011237144470214844, -0.008031845092773438, -0.004826545715332031, -0.001621246337890625, 0.0015840530395507812, 0.0047893524169921875, 0.007994651794433594, 0.011199951171875, 0.014405250549316406, 0.017610549926757812, 0.02081584930419922, 0.024021148681640625, 0.02722644805908203, 0.030431747436523438, 0.033637046813964844, 0.03684234619140625, 0.040047645568847656, 0.04325294494628906, 0.04645824432373047, 0.049663543701171875, 0.05286884307861328, 0.05607414245605469, 0.059279441833496094, 0.0624847412109375, 0.0656900405883789, 0.06889533996582031, 0.07210063934326172, 0.07530593872070312, 0.07851123809814453, 0.08171653747558594, 0.08492183685302734, 0.08812713623046875, 0.09133243560791016, 0.09453773498535156, 0.09774303436279297, 0.10094833374023438, 0.10415363311767578, 0.10735893249511719, 0.1105642318725586, 0.11376953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 9.0, 13.0, 18.0, 16.0, 21.0, 33.0, 15.0, 22.0, 29.0, 39.0, 47.0, 43.0, 61.0, 49.0, 53.0, 42.0, 64.0, 52.0, 52.0, 47.0, 38.0, 46.0, 37.0, 23.0, 27.0, 23.0, 13.0, 9.0, 9.0, 15.0, 8.0, 4.0, 6.0, 1.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09259033203125, -0.08933639526367188, -0.08608245849609375, -0.08282852172851562, -0.0795745849609375, -0.07632064819335938, -0.07306671142578125, -0.06981277465820312, -0.066558837890625, -0.06330490112304688, -0.06005096435546875, -0.056797027587890625, -0.0535430908203125, -0.050289154052734375, -0.04703521728515625, -0.043781280517578125, -0.04052734375, -0.037273406982421875, -0.03401947021484375, -0.030765533447265625, -0.0275115966796875, -0.024257659912109375, -0.02100372314453125, -0.017749786376953125, -0.014495849609375, -0.011241912841796875, -0.00798797607421875, -0.004734039306640625, -0.0014801025390625, 0.001773834228515625, 0.00502777099609375, 0.008281707763671875, 0.01153564453125, 0.014789581298828125, 0.01804351806640625, 0.021297454833984375, 0.0245513916015625, 0.027805328369140625, 0.03105926513671875, 0.034313201904296875, 0.037567138671875, 0.040821075439453125, 0.04407501220703125, 0.047328948974609375, 0.0505828857421875, 0.053836822509765625, 0.05709075927734375, 0.060344696044921875, 0.0635986328125, 0.06685256958007812, 0.07010650634765625, 0.07336044311523438, 0.0766143798828125, 0.07986831665039062, 0.08312225341796875, 0.08637619018554688, 0.089630126953125, 0.09288406372070312, 0.09613800048828125, 0.09939193725585938, 0.1026458740234375, 0.10589981079101562, 0.10915374755859375, 0.11240768432617188, 0.11566162109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 6.0, 6.0, 8.0, 16.0, 16.0, 37.0, 49.0, 67.0, 111.0, 141.0, 214.0, 353.0, 518.0, 790.0, 1248.0, 1740.0, 2879.0, 4813.0, 8514.0, 16032.0, 33851.0, 79949.0, 200075.0, 328820.0, 209552.0, 84402.0, 35345.0, 16812.0, 8783.0, 5022.0, 3060.0, 1870.0, 1145.0, 761.0, 513.0, 354.0, 212.0, 161.0, 78.0, 72.0, 45.0, 39.0, 31.0, 12.0, 13.0, 8.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.056121826171875, -0.054341793060302734, -0.05256175994873047, -0.0507817268371582, -0.04900169372558594, -0.04722166061401367, -0.045441627502441406, -0.04366159439086914, -0.041881561279296875, -0.04010152816772461, -0.038321495056152344, -0.03654146194458008, -0.03476142883300781, -0.03298139572143555, -0.03120136260986328, -0.029421329498291016, -0.02764129638671875, -0.025861263275146484, -0.02408123016357422, -0.022301197052001953, -0.020521163940429688, -0.018741130828857422, -0.016961097717285156, -0.01518106460571289, -0.013401031494140625, -0.01162099838256836, -0.009840965270996094, -0.008060932159423828, -0.0062808990478515625, -0.004500865936279297, -0.0027208328247070312, -0.0009407997131347656, 0.0008392333984375, 0.0026192665100097656, 0.004399299621582031, 0.006179332733154297, 0.007959365844726562, 0.009739398956298828, 0.011519432067871094, 0.01329946517944336, 0.015079498291015625, 0.01685953140258789, 0.018639564514160156, 0.020419597625732422, 0.022199630737304688, 0.023979663848876953, 0.02575969696044922, 0.027539730072021484, 0.02931976318359375, 0.031099796295166016, 0.03287982940673828, 0.03465986251831055, 0.03643989562988281, 0.03821992874145508, 0.039999961853027344, 0.04177999496459961, 0.043560028076171875, 0.04534006118774414, 0.047120094299316406, 0.04890012741088867, 0.05068016052246094, 0.0524601936340332, 0.05424022674560547, 0.056020259857177734, 0.05780029296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 4.0, 11.0, 9.0, 12.0, 18.0, 29.0, 30.0, 38.0, 53.0, 71.0, 67.0, 85.0, 70.0, 81.0, 87.0, 72.0, 66.0, 41.0, 35.0, 25.0, 27.0, 15.0, 13.0, 10.0, 8.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.62396240234375e-05, -3.532692790031433e-05, -3.441423177719116e-05, -3.350153565406799e-05, -3.2588839530944824e-05, -3.1676143407821655e-05, -3.0763447284698486e-05, -2.9850751161575317e-05, -2.893805503845215e-05, -2.802535891532898e-05, -2.711266279220581e-05, -2.619996666908264e-05, -2.5287270545959473e-05, -2.4374574422836304e-05, -2.3461878299713135e-05, -2.2549182176589966e-05, -2.1636486053466797e-05, -2.0723789930343628e-05, -1.981109380722046e-05, -1.889839768409729e-05, -1.798570156097412e-05, -1.7073005437850952e-05, -1.6160309314727783e-05, -1.5247613191604614e-05, -1.4334917068481445e-05, -1.3422220945358276e-05, -1.2509524822235107e-05, -1.1596828699111938e-05, -1.068413257598877e-05, -9.7714364528656e-06, -8.858740329742432e-06, -7.946044206619263e-06, -7.033348083496094e-06, -6.120651960372925e-06, -5.207955837249756e-06, -4.295259714126587e-06, -3.382563591003418e-06, -2.469867467880249e-06, -1.55717134475708e-06, -6.444752216339111e-07, 2.682209014892578e-07, 1.1809170246124268e-06, 2.0936131477355957e-06, 3.0063092708587646e-06, 3.919005393981934e-06, 4.8317015171051025e-06, 5.7443976402282715e-06, 6.6570937633514404e-06, 7.569789886474609e-06, 8.482486009597778e-06, 9.395182132720947e-06, 1.0307878255844116e-05, 1.1220574378967285e-05, 1.2133270502090454e-05, 1.3045966625213623e-05, 1.3958662748336792e-05, 1.4871358871459961e-05, 1.578405499458313e-05, 1.66967511177063e-05, 1.7609447240829468e-05, 1.8522143363952637e-05, 1.9434839487075806e-05, 2.0347535610198975e-05, 2.1260231733322144e-05, 2.2172927856445312e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 2.0, 4.0, 8.0, 16.0, 11.0, 23.0, 33.0, 50.0, 73.0, 129.0, 229.0, 357.0, 707.0, 1238.0, 2254.0, 5083.0, 12562.0, 37163.0, 155998.0, 504557.0, 244669.0, 53912.0, 16704.0, 6487.0, 2969.0, 1454.0, 745.0, 400.0, 267.0, 151.0, 100.0, 58.0, 51.0, 25.0, 13.0, 15.0, 7.0, 4.0, 4.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.072998046875, -0.0703573226928711, -0.06771659851074219, -0.06507587432861328, -0.062435150146484375, -0.05979442596435547, -0.05715370178222656, -0.054512977600097656, -0.05187225341796875, -0.049231529235839844, -0.04659080505371094, -0.04395008087158203, -0.041309356689453125, -0.03866863250732422, -0.03602790832519531, -0.033387184143066406, -0.0307464599609375, -0.028105735778808594, -0.025465011596679688, -0.02282428741455078, -0.020183563232421875, -0.01754283905029297, -0.014902114868164062, -0.012261390686035156, -0.00962066650390625, -0.006979942321777344, -0.0043392181396484375, -0.0016984939575195312, 0.000942230224609375, 0.0035829544067382812, 0.0062236785888671875, 0.008864402770996094, 0.011505126953125, 0.014145851135253906, 0.016786575317382812, 0.01942729949951172, 0.022068023681640625, 0.02470874786376953, 0.027349472045898438, 0.029990196228027344, 0.03263092041015625, 0.035271644592285156, 0.03791236877441406, 0.04055309295654297, 0.043193817138671875, 0.04583454132080078, 0.04847526550292969, 0.051115989685058594, 0.0537567138671875, 0.056397438049316406, 0.05903816223144531, 0.06167888641357422, 0.06431961059570312, 0.06696033477783203, 0.06960105895996094, 0.07224178314208984, 0.07488250732421875, 0.07752323150634766, 0.08016395568847656, 0.08280467987060547, 0.08544540405273438, 0.08808612823486328, 0.09072685241699219, 0.0933675765991211, 0.09600830078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 2.0, 5.0, 7.0, 13.0, 9.0, 14.0, 30.0, 53.0, 69.0, 100.0, 153.0, 142.0, 109.0, 100.0, 62.0, 35.0, 28.0, 25.0, 7.0, 9.0, 10.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0787353515625, -0.07645606994628906, -0.07417678833007812, -0.07189750671386719, -0.06961822509765625, -0.06733894348144531, -0.06505966186523438, -0.06278038024902344, -0.0605010986328125, -0.05822181701660156, -0.055942535400390625, -0.05366325378417969, -0.05138397216796875, -0.04910469055175781, -0.046825408935546875, -0.04454612731933594, -0.042266845703125, -0.03998756408691406, -0.037708282470703125, -0.03542900085449219, -0.03314971923828125, -0.030870437622070312, -0.028591156005859375, -0.026311874389648438, -0.0240325927734375, -0.021753311157226562, -0.019474029541015625, -0.017194747924804688, -0.01491546630859375, -0.012636184692382812, -0.010356903076171875, -0.008077621459960938, -0.00579833984375, -0.0035190582275390625, -0.001239776611328125, 0.0010395050048828125, 0.00331878662109375, 0.0055980682373046875, 0.007877349853515625, 0.010156631469726562, 0.0124359130859375, 0.014715194702148438, 0.016994476318359375, 0.019273757934570312, 0.02155303955078125, 0.023832321166992188, 0.026111602783203125, 0.028390884399414062, 0.030670166015625, 0.03294944763183594, 0.035228729248046875, 0.03750801086425781, 0.03978729248046875, 0.04206657409667969, 0.044345855712890625, 0.04662513732910156, 0.0489044189453125, 0.05118370056152344, 0.053462982177734375, 0.05574226379394531, 0.05802154541015625, 0.06030082702636719, 0.06258010864257812, 0.06485939025878906, 0.067138671875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 4.0, 11.0, 12.0, 42.0, 67.0, 78.0, 98.0, 129.0, 132.0, 94.0, 108.0, 73.0, 51.0, 39.0, 34.0, 18.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.1436989307403564, -1.1205778121948242, -1.0974565744400024, -1.0743354558944702, -1.0512142181396484, -1.0280930995941162, -1.0049718618392944, -0.9818507432937622, -0.9587295055389404, -0.9356083273887634, -0.9124871492385864, -0.8893659710884094, -0.8662447929382324, -0.8431236147880554, -0.8200024366378784, -0.7968813180923462, -0.7737601399421692, -0.7506389617919922, -0.7275177836418152, -0.7043966054916382, -0.6812754273414612, -0.6581542491912842, -0.635033130645752, -0.6119118928909302, -0.588790774345398, -0.565669596195221, -0.542548418045044, -0.5194272398948669, -0.49630606174468994, -0.47318488359451294, -0.4500637352466583, -0.4269425570964813, -0.40382134914398193, -0.38070017099380493, -0.35757899284362793, -0.3344578146934509, -0.3113366365432739, -0.2882154583930969, -0.2650943100452423, -0.2419731318950653, -0.2188519537448883, -0.1957307755947113, -0.1726095974445343, -0.1494884341955185, -0.1263672560453415, -0.10324607789516449, -0.08012491464614868, -0.05700373649597168, -0.03388255834579468, -0.010761383920907974, 0.01235979050397873, 0.035480961203575134, 0.058602139353752136, 0.08172331750392914, 0.10484448075294495, 0.12796565890312195, 0.15108683705329895, 0.17420801520347595, 0.19732919335365295, 0.22045035660266876, 0.24357153475284576, 0.2666926980018616, 0.2898138761520386, 0.3129350543022156, 0.3360562324523926]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 4.0, 11.0, 14.0, 15.0, 15.0, 15.0, 26.0, 11.0, 22.0, 28.0, 27.0, 31.0, 27.0, 42.0, 36.0, 46.0, 46.0, 42.0, 34.0, 49.0, 36.0, 40.0, 34.0, 33.0, 39.0, 30.0, 36.0, 32.0, 19.0, 16.0, 18.0, 26.0, 17.0, 11.0, 9.0, 12.0, 8.0, 10.0, 6.0, 3.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3224431872367859, -0.3119032084941864, -0.3013632297515869, -0.2908232510089874, -0.28028327226638794, -0.26974329352378845, -0.25920331478118896, -0.24866333603858948, -0.23812335729599, -0.2275833785533905, -0.21704339981079102, -0.20650342106819153, -0.19596344232559204, -0.18542346358299255, -0.17488348484039307, -0.16434350609779358, -0.15380354225635529, -0.1432635635137558, -0.1327235847711563, -0.12218360602855682, -0.11164362728595734, -0.10110364854335785, -0.09056367725133896, -0.08002369850873947, -0.06948371976613998, -0.0589437410235405, -0.04840376228094101, -0.03786378726363182, -0.027323808521032333, -0.016783829778432846, -0.006243854761123657, 0.00429612398147583, 0.014836102724075317, 0.025376081466674805, 0.03591606020927429, 0.04645603522658348, 0.05699601396918297, 0.06753599643707275, 0.07807596772909164, 0.08861594647169113, 0.09915592521429062, 0.1096959039568901, 0.1202358826994896, 0.13077585399150848, 0.14131583273410797, 0.15185581147670746, 0.16239579021930695, 0.17293576896190643, 0.18347574770450592, 0.1940157264471054, 0.2045557051897049, 0.21509568393230438, 0.22563566267490387, 0.23617564141750336, 0.24671560525894165, 0.25725558400154114, 0.2677955627441406, 0.2783355414867401, 0.2888755202293396, 0.2994154989719391, 0.3099554777145386, 0.32049545645713806, 0.33103543519973755, 0.34157541394233704, 0.3521153926849365]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 9.0, 15.0, 15.0, 23.0, 29.0, 64.0, 107.0, 173.0, 281.0, 542.0, 1040.0, 2524.0, 6466.0, 19596.0, 77477.0, 510437.0, 2471629.0, 935573.0, 125440.0, 28446.0, 8601.0, 3085.0, 1333.0, 613.0, 318.0, 179.0, 95.0, 57.0, 28.0, 31.0, 17.0, 8.0, 7.0, 6.0, 5.0, 6.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08843994140625, -0.08588695526123047, -0.08333396911621094, -0.0807809829711914, -0.07822799682617188, -0.07567501068115234, -0.07312202453613281, -0.07056903839111328, -0.06801605224609375, -0.06546306610107422, -0.06291007995605469, -0.060357093811035156, -0.057804107666015625, -0.055251121520996094, -0.05269813537597656, -0.05014514923095703, -0.0475921630859375, -0.04503917694091797, -0.04248619079589844, -0.039933204650878906, -0.037380218505859375, -0.034827232360839844, -0.03227424621582031, -0.02972126007080078, -0.02716827392578125, -0.02461528778076172, -0.022062301635742188, -0.019509315490722656, -0.016956329345703125, -0.014403343200683594, -0.011850357055664062, -0.009297370910644531, -0.006744384765625, -0.004191398620605469, -0.0016384124755859375, 0.0009145736694335938, 0.003467559814453125, 0.006020545959472656, 0.008573532104492188, 0.011126518249511719, 0.01367950439453125, 0.01623249053955078, 0.018785476684570312, 0.021338462829589844, 0.023891448974609375, 0.026444435119628906, 0.028997421264648438, 0.03155040740966797, 0.0341033935546875, 0.03665637969970703, 0.03920936584472656, 0.041762351989746094, 0.044315338134765625, 0.046868324279785156, 0.04942131042480469, 0.05197429656982422, 0.05452728271484375, 0.05708026885986328, 0.05963325500488281, 0.062186241149902344, 0.06473922729492188, 0.0672922134399414, 0.06984519958496094, 0.07239818572998047, 0.074951171875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 9.0, 7.0, 14.0, 17.0, 20.0, 23.0, 33.0, 25.0, 37.0, 42.0, 51.0, 68.0, 63.0, 51.0, 62.0, 59.0, 53.0, 50.0, 48.0, 62.0, 43.0, 37.0, 31.0, 22.0, 17.0, 18.0, 12.0, 10.0, 7.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0535888671875, -0.051993370056152344, -0.05039787292480469, -0.04880237579345703, -0.047206878662109375, -0.04561138153076172, -0.04401588439941406, -0.042420387268066406, -0.04082489013671875, -0.039229393005371094, -0.03763389587402344, -0.03603839874267578, -0.034442901611328125, -0.03284740447998047, -0.03125190734863281, -0.029656410217285156, -0.0280609130859375, -0.026465415954589844, -0.024869918823242188, -0.02327442169189453, -0.021678924560546875, -0.02008342742919922, -0.018487930297851562, -0.016892433166503906, -0.01529693603515625, -0.013701438903808594, -0.012105941772460938, -0.010510444641113281, -0.008914947509765625, -0.007319450378417969, -0.0057239532470703125, -0.004128456115722656, -0.002532958984375, -0.0009374618530273438, 0.0006580352783203125, 0.0022535324096679688, 0.003849029541015625, 0.005444526672363281, 0.0070400238037109375, 0.008635520935058594, 0.01023101806640625, 0.011826515197753906, 0.013422012329101562, 0.015017509460449219, 0.016613006591796875, 0.01820850372314453, 0.019804000854492188, 0.021399497985839844, 0.0229949951171875, 0.024590492248535156, 0.026185989379882812, 0.02778148651123047, 0.029376983642578125, 0.03097248077392578, 0.03256797790527344, 0.034163475036621094, 0.03575897216796875, 0.037354469299316406, 0.03894996643066406, 0.04054546356201172, 0.042140960693359375, 0.04373645782470703, 0.04533195495605469, 0.046927452087402344, 0.04852294921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 17.0, 7.0, 23.0, 41.0, 59.0, 120.0, 188.0, 302.0, 599.0, 1293.0, 2805.0, 7604.0, 24441.0, 112993.0, 852593.0, 2582129.0, 505662.0, 75021.0, 17975.0, 5856.0, 2287.0, 1038.0, 521.0, 315.0, 168.0, 85.0, 51.0, 33.0, 19.0, 13.0, 9.0, 9.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1346435546875, -0.13138961791992188, -0.12813568115234375, -0.12488174438476562, -0.1216278076171875, -0.11837387084960938, -0.11511993408203125, -0.11186599731445312, -0.108612060546875, -0.10535812377929688, -0.10210418701171875, -0.09885025024414062, -0.0955963134765625, -0.09234237670898438, -0.08908843994140625, -0.08583450317382812, -0.08258056640625, -0.07932662963867188, -0.07607269287109375, -0.07281875610351562, -0.0695648193359375, -0.06631088256835938, -0.06305694580078125, -0.059803009033203125, -0.056549072265625, -0.053295135498046875, -0.05004119873046875, -0.046787261962890625, -0.0435333251953125, -0.040279388427734375, -0.03702545166015625, -0.033771514892578125, -0.030517578125, -0.027263641357421875, -0.02400970458984375, -0.020755767822265625, -0.0175018310546875, -0.014247894287109375, -0.01099395751953125, -0.007740020751953125, -0.004486083984375, -0.001232147216796875, 0.00202178955078125, 0.005275726318359375, 0.0085296630859375, 0.011783599853515625, 0.01503753662109375, 0.018291473388671875, 0.02154541015625, 0.024799346923828125, 0.02805328369140625, 0.031307220458984375, 0.0345611572265625, 0.037815093994140625, 0.04106903076171875, 0.044322967529296875, 0.047576904296875, 0.050830841064453125, 0.05408477783203125, 0.057338714599609375, 0.0605926513671875, 0.06384658813476562, 0.06710052490234375, 0.07035446166992188, 0.0736083984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 12.0, 5.0, 28.0, 28.0, 50.0, 55.0, 88.0, 161.0, 255.0, 391.0, 633.0, 703.0, 581.0, 387.0, 264.0, 161.0, 76.0, 66.0, 40.0, 24.0, 16.0, 15.0, 10.0, 5.0, 8.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062347412109375, -0.05931520462036133, -0.056282997131347656, -0.053250789642333984, -0.05021858215332031, -0.04718637466430664, -0.04415416717529297, -0.0411219596862793, -0.038089752197265625, -0.03505754470825195, -0.03202533721923828, -0.02899312973022461, -0.025960922241210938, -0.022928714752197266, -0.019896507263183594, -0.016864299774169922, -0.01383209228515625, -0.010799884796142578, -0.007767677307128906, -0.004735469818115234, -0.0017032623291015625, 0.0013289451599121094, 0.004361152648925781, 0.007393360137939453, 0.010425567626953125, 0.013457775115966797, 0.01648998260498047, 0.01952219009399414, 0.022554397583007812, 0.025586605072021484, 0.028618812561035156, 0.03165102005004883, 0.0346832275390625, 0.03771543502807617, 0.040747642517089844, 0.043779850006103516, 0.04681205749511719, 0.04984426498413086, 0.05287647247314453, 0.0559086799621582, 0.058940887451171875, 0.06197309494018555, 0.06500530242919922, 0.06803750991821289, 0.07106971740722656, 0.07410192489624023, 0.0771341323852539, 0.08016633987426758, 0.08319854736328125, 0.08623075485229492, 0.0892629623413086, 0.09229516983032227, 0.09532737731933594, 0.09835958480834961, 0.10139179229736328, 0.10442399978637695, 0.10745620727539062, 0.1104884147644043, 0.11352062225341797, 0.11655282974243164, 0.11958503723144531, 0.12261724472045898, 0.12564945220947266, 0.12868165969848633, 0.1317138671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 12.0, 16.0, 15.0, 26.0, 29.0, 39.0, 39.0, 47.0, 71.0, 64.0, 79.0, 83.0, 82.0, 82.0, 59.0, 50.0, 34.0, 48.0, 32.0, 26.0, 17.0, 14.0, 10.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2281726896762848, -0.2185133844614029, -0.2088540941476822, -0.1991947889328003, -0.1895354986190796, -0.1798761934041977, -0.1702168881893158, -0.1605575978755951, -0.1508982926607132, -0.1412389874458313, -0.1315796971321106, -0.1219203919172287, -0.1122610941529274, -0.1026017963886261, -0.0929424911737442, -0.0832831934094429, -0.0736238956451416, -0.0639645978808403, -0.0543052963912487, -0.044645994901657104, -0.034986697137355804, -0.025327399373054504, -0.015668097883462906, -0.006008796393871307, 0.0036505013704299927, 0.013309800997376442, 0.02296910062432289, 0.03262840211391449, 0.04228769987821579, 0.05194699764251709, 0.06160629913210869, 0.07126560062170029, 0.0809248685836792, 0.0905841663479805, 0.1002434641122818, 0.1099027693271637, 0.119562067091465, 0.1292213648557663, 0.1388806700706482, 0.1485399603843689, 0.1581992655992508, 0.1678585708141327, 0.1775178611278534, 0.1871771663427353, 0.1968364715576172, 0.2064957618713379, 0.2161550670862198, 0.22581437230110168, 0.2354736626148224, 0.24513296782970428, 0.2547922730445862, 0.2644515633583069, 0.2741108536720276, 0.2837701439857483, 0.2934294641017914, 0.3030887544155121, 0.3127480745315552, 0.3224073648452759, 0.33206668496131897, 0.3417259752750397, 0.3513852655887604, 0.36104458570480347, 0.37070387601852417, 0.3803631663322449, 0.3900224566459656]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 10.0, 8.0, 5.0, 20.0, 14.0, 15.0, 25.0, 19.0, 20.0, 21.0, 43.0, 39.0, 34.0, 50.0, 40.0, 45.0, 48.0, 35.0, 56.0, 43.0, 27.0, 52.0, 49.0, 44.0, 37.0, 26.0, 28.0, 29.0, 25.0, 20.0, 12.0, 13.0, 17.0, 10.0, 7.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3033410310745239, -0.2945897579193115, -0.2858384847640991, -0.2770872116088867, -0.2683359384536743, -0.2595846652984619, -0.2508333921432495, -0.24208210408687592, -0.2333308309316635, -0.2245795577764511, -0.2158282846212387, -0.2070770114660263, -0.1983257234096527, -0.1895744502544403, -0.1808231770992279, -0.1720719039440155, -0.1633206307888031, -0.1545693576335907, -0.1458180844783783, -0.1370668113231659, -0.1283155381679535, -0.11956425756216049, -0.11081297695636749, -0.10206170380115509, -0.09331043064594269, -0.08455915749073029, -0.07580788433551788, -0.06705660372972488, -0.05830533057451248, -0.04955405741930008, -0.04080278053879738, -0.03205150365829468, -0.023300230503082275, -0.014548955485224724, -0.005797680467367172, 0.0029535945504903793, 0.011704869568347931, 0.020456142723560333, 0.029207419604063034, 0.037958696484565735, 0.04670996963977814, 0.05546124279499054, 0.06421251595020294, 0.07296379655599594, 0.08171506971120834, 0.09046634286642075, 0.09921762347221375, 0.10796889662742615, 0.11672016978263855, 0.12547144293785095, 0.13422271609306335, 0.14297398924827576, 0.15172526240348816, 0.16047653555870056, 0.16922782361507416, 0.17797909677028656, 0.18673036992549896, 0.19548164308071136, 0.20423291623592377, 0.21298418939113617, 0.22173547744750977, 0.23048675060272217, 0.23923802375793457, 0.24798929691314697, 0.2567405700683594]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 13.0, 9.0, 11.0, 22.0, 27.0, 40.0, 63.0, 69.0, 126.0, 208.0, 291.0, 684.0, 1241.0, 2307.0, 4890.0, 9884.0, 20999.0, 45868.0, 114073.0, 295207.0, 323825.0, 131328.0, 51927.0, 23162.0, 11097.0, 5481.0, 2595.0, 1393.0, 706.0, 408.0, 217.0, 151.0, 78.0, 44.0, 36.0, 22.0, 20.0, 6.0, 6.0, 4.0, 3.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11968994140625, -0.11557292938232422, -0.11145591735839844, -0.10733890533447266, -0.10322189331054688, -0.0991048812866211, -0.09498786926269531, -0.09087085723876953, -0.08675384521484375, -0.08263683319091797, -0.07851982116699219, -0.0744028091430664, -0.07028579711914062, -0.06616878509521484, -0.06205177307128906, -0.05793476104736328, -0.0538177490234375, -0.04970073699951172, -0.04558372497558594, -0.041466712951660156, -0.037349700927734375, -0.033232688903808594, -0.029115676879882812, -0.02499866485595703, -0.02088165283203125, -0.01676464080810547, -0.012647628784179688, -0.008530616760253906, -0.004413604736328125, -0.00029659271240234375, 0.0038204193115234375, 0.007937431335449219, 0.012054443359375, 0.01617145538330078, 0.020288467407226562, 0.024405479431152344, 0.028522491455078125, 0.032639503479003906, 0.03675651550292969, 0.04087352752685547, 0.04499053955078125, 0.04910755157470703, 0.05322456359863281, 0.057341575622558594, 0.061458587646484375, 0.06557559967041016, 0.06969261169433594, 0.07380962371826172, 0.0779266357421875, 0.08204364776611328, 0.08616065979003906, 0.09027767181396484, 0.09439468383789062, 0.0985116958618164, 0.10262870788574219, 0.10674571990966797, 0.11086273193359375, 0.11497974395751953, 0.11909675598144531, 0.1232137680053711, 0.12733078002929688, 0.13144779205322266, 0.13556480407714844, 0.13968181610107422, 0.143798828125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 13.0, 20.0, 23.0, 20.0, 26.0, 39.0, 38.0, 39.0, 43.0, 49.0, 70.0, 65.0, 50.0, 55.0, 64.0, 61.0, 44.0, 54.0, 42.0, 35.0, 31.0, 26.0, 15.0, 24.0, 11.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05029296875, -0.048707008361816406, -0.04712104797363281, -0.04553508758544922, -0.043949127197265625, -0.04236316680908203, -0.04077720642089844, -0.039191246032714844, -0.03760528564453125, -0.036019325256347656, -0.03443336486816406, -0.03284740447998047, -0.031261444091796875, -0.02967548370361328, -0.028089523315429688, -0.026503562927246094, -0.0249176025390625, -0.023331642150878906, -0.021745681762695312, -0.02015972137451172, -0.018573760986328125, -0.01698780059814453, -0.015401840209960938, -0.013815879821777344, -0.01222991943359375, -0.010643959045410156, -0.009057998657226562, -0.007472038269042969, -0.005886077880859375, -0.004300117492675781, -0.0027141571044921875, -0.0011281967163085938, 0.000457763671875, 0.0020437240600585938, 0.0036296844482421875, 0.005215644836425781, 0.006801605224609375, 0.008387565612792969, 0.009973526000976562, 0.011559486389160156, 0.01314544677734375, 0.014731407165527344, 0.016317367553710938, 0.01790332794189453, 0.019489288330078125, 0.02107524871826172, 0.022661209106445312, 0.024247169494628906, 0.0258331298828125, 0.027419090270996094, 0.029005050659179688, 0.03059101104736328, 0.032176971435546875, 0.03376293182373047, 0.03534889221191406, 0.036934852600097656, 0.03852081298828125, 0.040106773376464844, 0.04169273376464844, 0.04327869415283203, 0.044864654541015625, 0.04645061492919922, 0.04803657531738281, 0.049622535705566406, 0.05120849609375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 18.0, 10.0, 22.0, 31.0, 37.0, 59.0, 93.0, 157.0, 256.0, 510.0, 1221.0, 3766.0, 12665.0, 45684.0, 184837.0, 519534.0, 208342.0, 50578.0, 13993.0, 4091.0, 1374.0, 550.0, 283.0, 133.0, 97.0, 55.0, 48.0, 34.0, 16.0, 17.0, 16.0, 10.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.17942237854003906, -0.17390823364257812, -0.1683940887451172, -0.16287994384765625, -0.1573657989501953, -0.15185165405273438, -0.14633750915527344, -0.1408233642578125, -0.13530921936035156, -0.12979507446289062, -0.12428092956542969, -0.11876678466796875, -0.11325263977050781, -0.10773849487304688, -0.10222434997558594, -0.096710205078125, -0.09119606018066406, -0.08568191528320312, -0.08016777038574219, -0.07465362548828125, -0.06913948059082031, -0.06362533569335938, -0.05811119079589844, -0.0525970458984375, -0.04708290100097656, -0.041568756103515625, -0.03605461120605469, -0.03054046630859375, -0.025026321411132812, -0.019512176513671875, -0.013998031616210938, -0.00848388671875, -0.0029697418212890625, 0.002544403076171875, 0.008058547973632812, 0.01357269287109375, 0.019086837768554688, 0.024600982666015625, 0.030115127563476562, 0.0356292724609375, 0.04114341735839844, 0.046657562255859375, 0.05217170715332031, 0.05768585205078125, 0.06319999694824219, 0.06871414184570312, 0.07422828674316406, 0.079742431640625, 0.08525657653808594, 0.09077072143554688, 0.09628486633300781, 0.10179901123046875, 0.10731315612792969, 0.11282730102539062, 0.11834144592285156, 0.1238555908203125, 0.12936973571777344, 0.13488388061523438, 0.1403980255126953, 0.14591217041015625, 0.1514263153076172, 0.15694046020507812, 0.16245460510253906, 0.16796875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 4.0, 12.0, 11.0, 12.0, 12.0, 19.0, 30.0, 28.0, 29.0, 33.0, 45.0, 44.0, 48.0, 52.0, 52.0, 60.0, 52.0, 52.0, 57.0, 43.0, 46.0, 44.0, 27.0, 42.0, 33.0, 21.0, 22.0, 15.0, 9.0, 8.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.130615234375, -0.12652969360351562, -0.12244415283203125, -0.11835861206054688, -0.1142730712890625, -0.11018753051757812, -0.10610198974609375, -0.10201644897460938, -0.097930908203125, -0.09384536743164062, -0.08975982666015625, -0.08567428588867188, -0.0815887451171875, -0.07750320434570312, -0.07341766357421875, -0.06933212280273438, -0.06524658203125, -0.061161041259765625, -0.05707550048828125, -0.052989959716796875, -0.0489044189453125, -0.044818878173828125, -0.04073333740234375, -0.036647796630859375, -0.032562255859375, -0.028476715087890625, -0.02439117431640625, -0.020305633544921875, -0.0162200927734375, -0.012134552001953125, -0.00804901123046875, -0.003963470458984375, 0.0001220703125, 0.004207611083984375, 0.00829315185546875, 0.012378692626953125, 0.0164642333984375, 0.020549774169921875, 0.02463531494140625, 0.028720855712890625, 0.032806396484375, 0.036891937255859375, 0.04097747802734375, 0.045063018798828125, 0.0491485595703125, 0.053234100341796875, 0.05731964111328125, 0.061405181884765625, 0.06549072265625, 0.06957626342773438, 0.07366180419921875, 0.07774734497070312, 0.0818328857421875, 0.08591842651367188, 0.09000396728515625, 0.09408950805664062, 0.098175048828125, 0.10226058959960938, 0.10634613037109375, 0.11043167114257812, 0.1145172119140625, 0.11860275268554688, 0.12268829345703125, 0.12677383422851562, 0.130859375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 18.0, 6.0, 15.0, 29.0, 47.0, 83.0, 114.0, 167.0, 211.0, 322.0, 583.0, 926.0, 1486.0, 2343.0, 3844.0, 5849.0, 9797.0, 15463.0, 24937.0, 40096.0, 71270.0, 139067.0, 230764.0, 218134.0, 122582.0, 63701.0, 36597.0, 22319.0, 14241.0, 8830.0, 5508.0, 3393.0, 2215.0, 1326.0, 807.0, 524.0, 334.0, 235.0, 127.0, 81.0, 45.0, 46.0, 29.0, 13.0, 11.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04400634765625, -0.04274559020996094, -0.041484832763671875, -0.04022407531738281, -0.03896331787109375, -0.03770256042480469, -0.036441802978515625, -0.03518104553222656, -0.0339202880859375, -0.03265953063964844, -0.031398773193359375, -0.030138015747070312, -0.02887725830078125, -0.027616500854492188, -0.026355743408203125, -0.025094985961914062, -0.023834228515625, -0.022573471069335938, -0.021312713623046875, -0.020051956176757812, -0.01879119873046875, -0.017530441284179688, -0.016269683837890625, -0.015008926391601562, -0.0137481689453125, -0.012487411499023438, -0.011226654052734375, -0.009965896606445312, -0.00870513916015625, -0.0074443817138671875, -0.006183624267578125, -0.0049228668212890625, -0.003662109375, -0.0024013519287109375, -0.001140594482421875, 0.0001201629638671875, 0.00138092041015625, 0.0026416778564453125, 0.003902435302734375, 0.0051631927490234375, 0.0064239501953125, 0.0076847076416015625, 0.008945465087890625, 0.010206222534179688, 0.01146697998046875, 0.012727737426757812, 0.013988494873046875, 0.015249252319335938, 0.016510009765625, 0.017770767211914062, 0.019031524658203125, 0.020292282104492188, 0.02155303955078125, 0.022813796997070312, 0.024074554443359375, 0.025335311889648438, 0.0265960693359375, 0.027856826782226562, 0.029117584228515625, 0.030378341674804688, 0.03163909912109375, 0.03289985656738281, 0.034160614013671875, 0.03542137145996094, 0.03668212890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 8.0, 6.0, 3.0, 8.0, 15.0, 16.0, 19.0, 22.0, 28.0, 34.0, 39.0, 45.0, 56.0, 71.0, 59.0, 65.0, 65.0, 53.0, 58.0, 44.0, 67.0, 48.0, 36.0, 24.0, 13.0, 23.0, 19.0, 8.0, 12.0, 5.0, 3.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0623207092285156e-05, -1.9931234419345856e-05, -1.9239261746406555e-05, -1.8547289073467255e-05, -1.7855316400527954e-05, -1.7163343727588654e-05, -1.6471371054649353e-05, -1.5779398381710052e-05, -1.5087425708770752e-05, -1.4395453035831451e-05, -1.3703480362892151e-05, -1.301150768995285e-05, -1.231953501701355e-05, -1.162756234407425e-05, -1.0935589671134949e-05, -1.0243616998195648e-05, -9.551644325256348e-06, -8.859671652317047e-06, -8.167698979377747e-06, -7.475726306438446e-06, -6.7837536334991455e-06, -6.091780960559845e-06, -5.3998082876205444e-06, -4.707835614681244e-06, -4.015862941741943e-06, -3.323890268802643e-06, -2.6319175958633423e-06, -1.9399449229240417e-06, -1.2479722499847412e-06, -5.559995770454407e-07, 1.3597309589385986e-07, 8.279457688331604e-07, 1.519918441772461e-06, 2.2118911147117615e-06, 2.903863787651062e-06, 3.5958364605903625e-06, 4.287809133529663e-06, 4.979781806468964e-06, 5.671754479408264e-06, 6.363727152347565e-06, 7.055699825286865e-06, 7.747672498226166e-06, 8.439645171165466e-06, 9.131617844104767e-06, 9.823590517044067e-06, 1.0515563189983368e-05, 1.1207535862922668e-05, 1.1899508535861969e-05, 1.259148120880127e-05, 1.328345388174057e-05, 1.397542655467987e-05, 1.4667399227619171e-05, 1.535937190055847e-05, 1.6051344573497772e-05, 1.6743317246437073e-05, 1.7435289919376373e-05, 1.8127262592315674e-05, 1.8819235265254974e-05, 1.9511207938194275e-05, 2.0203180611133575e-05, 2.0895153284072876e-05, 2.1587125957012177e-05, 2.2279098629951477e-05, 2.2971071302890778e-05, 2.3663043975830078e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 9.0, 10.0, 12.0, 8.0, 36.0, 51.0, 64.0, 93.0, 144.0, 250.0, 416.0, 883.0, 1853.0, 4021.0, 9198.0, 20894.0, 47399.0, 120804.0, 359506.0, 309233.0, 100177.0, 40700.0, 18021.0, 7708.0, 3548.0, 1636.0, 823.0, 424.0, 238.0, 138.0, 102.0, 66.0, 26.0, 17.0, 12.0, 10.0, 6.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052215576171875, -0.050275325775146484, -0.04833507537841797, -0.04639482498168945, -0.04445457458496094, -0.04251432418823242, -0.040574073791503906, -0.03863382339477539, -0.036693572998046875, -0.03475332260131836, -0.032813072204589844, -0.030872821807861328, -0.028932571411132812, -0.026992321014404297, -0.02505207061767578, -0.023111820220947266, -0.02117156982421875, -0.019231319427490234, -0.01729106903076172, -0.015350818634033203, -0.013410568237304688, -0.011470317840576172, -0.009530067443847656, -0.007589817047119141, -0.005649566650390625, -0.0037093162536621094, -0.0017690658569335938, 0.00017118453979492188, 0.0021114349365234375, 0.004051685333251953, 0.005991935729980469, 0.007932186126708984, 0.0098724365234375, 0.011812686920166016, 0.013752937316894531, 0.015693187713623047, 0.017633438110351562, 0.019573688507080078, 0.021513938903808594, 0.02345418930053711, 0.025394439697265625, 0.02733469009399414, 0.029274940490722656, 0.031215190887451172, 0.03315544128417969, 0.0350956916809082, 0.03703594207763672, 0.038976192474365234, 0.04091644287109375, 0.042856693267822266, 0.04479694366455078, 0.0467371940612793, 0.04867744445800781, 0.05061769485473633, 0.052557945251464844, 0.05449819564819336, 0.056438446044921875, 0.05837869644165039, 0.060318946838378906, 0.06225919723510742, 0.06419944763183594, 0.06613969802856445, 0.06807994842529297, 0.07002019882202148, 0.07196044921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 5.0, 8.0, 6.0, 5.0, 11.0, 11.0, 11.0, 16.0, 17.0, 25.0, 21.0, 23.0, 35.0, 57.0, 72.0, 82.0, 90.0, 86.0, 73.0, 63.0, 49.0, 44.0, 42.0, 23.0, 26.0, 20.0, 12.0, 10.0, 10.0, 8.0, 7.0, 8.0, 6.0, 6.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.052093505859375, -0.050559043884277344, -0.04902458190917969, -0.04749011993408203, -0.045955657958984375, -0.04442119598388672, -0.04288673400878906, -0.041352272033691406, -0.03981781005859375, -0.038283348083496094, -0.03674888610839844, -0.03521442413330078, -0.033679962158203125, -0.03214550018310547, -0.030611038208007812, -0.029076576232910156, -0.0275421142578125, -0.026007652282714844, -0.024473190307617188, -0.02293872833251953, -0.021404266357421875, -0.01986980438232422, -0.018335342407226562, -0.016800880432128906, -0.01526641845703125, -0.013731956481933594, -0.012197494506835938, -0.010663032531738281, -0.009128570556640625, -0.007594108581542969, -0.0060596466064453125, -0.004525184631347656, -0.00299072265625, -0.0014562606811523438, 7.82012939453125e-05, 0.0016126632690429688, 0.003147125244140625, 0.004681587219238281, 0.0062160491943359375, 0.007750511169433594, 0.00928497314453125, 0.010819435119628906, 0.012353897094726562, 0.013888359069824219, 0.015422821044921875, 0.01695728302001953, 0.018491744995117188, 0.020026206970214844, 0.0215606689453125, 0.023095130920410156, 0.024629592895507812, 0.02616405487060547, 0.027698516845703125, 0.02923297882080078, 0.030767440795898438, 0.032301902770996094, 0.03383636474609375, 0.035370826721191406, 0.03690528869628906, 0.03843975067138672, 0.039974212646484375, 0.04150867462158203, 0.04304313659667969, 0.044577598571777344, 0.046112060546875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 26.0, 121.0, 264.0, 293.0, 180.0, 78.0, 32.0, 13.0, 4.0, 1.0, 1.0], "bins": [-2.8056085109710693, -2.755821943283081, -2.7060351371765137, -2.6562485694885254, -2.606462001800537, -2.556675434112549, -2.5068886280059814, -2.457102060317993, -2.407315492630005, -2.3575289249420166, -2.307742118835449, -2.257955551147461, -2.2081689834594727, -2.1583824157714844, -2.108595609664917, -2.0588090419769287, -2.0090224742889404, -1.9592357873916626, -1.9094492197036743, -1.8596625328063965, -1.8098759651184082, -1.7600892782211304, -1.710302710533142, -1.6605160236358643, -1.6107293367385864, -1.5609426498413086, -1.5111560821533203, -1.4613693952560425, -1.4115828275680542, -1.3617961406707764, -1.312009572982788, -1.2622228860855103, -1.2124361991882324, -1.1626495122909546, -1.1128629446029663, -1.0630762577056885, -1.0132896900177002, -0.9635030627250671, -0.9137164354324341, -0.8639297485351562, -0.814143180847168, -0.7643565535545349, -0.7145699262619019, -0.6647832989692688, -0.6149966716766357, -0.5652100443840027, -0.5154234170913696, -0.4656367599964142, -0.4158501625061035, -0.36606353521347046, -0.3162769079208374, -0.26649028062820435, -0.2167036384344101, -0.16691701114177704, -0.11713036894798279, -0.06734374165534973, -0.017557114362716675, 0.03222951665520668, 0.08201614767313004, 0.1318027824163437, 0.18158940970897675, 0.2313760370016098, 0.28116267919540405, 0.3309493064880371, 0.38073593378067017]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 15.0, 17.0, 11.0, 18.0, 18.0, 18.0, 27.0, 31.0, 29.0, 30.0, 43.0, 43.0, 46.0, 43.0, 47.0, 44.0, 57.0, 46.0, 34.0, 45.0, 40.0, 40.0, 22.0, 34.0, 29.0, 25.0, 32.0, 18.0, 19.0, 13.0, 15.0, 11.0, 6.0, 7.0, 5.0, 6.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3697403073310852, -0.3588676154613495, -0.34799495339393616, -0.33712226152420044, -0.3262495696544647, -0.315376877784729, -0.3045042157173157, -0.29363152384757996, -0.28275883197784424, -0.2718861401081085, -0.2610134780406952, -0.2501407861709595, -0.23926809430122375, -0.22839541733264923, -0.2175227403640747, -0.206650048494339, -0.19577738642692566, -0.18490470945835114, -0.17403201758861542, -0.1631593406200409, -0.15228664875030518, -0.14141397178173065, -0.13054129481315613, -0.11966861039400101, -0.10879592597484589, -0.09792324155569077, -0.08705055713653564, -0.07617788016796112, -0.065305195748806, -0.05443251132965088, -0.043559834361076355, -0.032687149941921234, -0.021814465522766113, -0.010941782966256142, -6.910040974617004e-05, 0.010803580284118652, 0.021676264703273773, 0.032548949122428894, 0.04342162609100342, 0.05429431051015854, 0.06516699492931366, 0.07603967934846878, 0.0869123637676239, 0.09778504073619843, 0.10865772515535355, 0.11953040957450867, 0.1304030865430832, 0.14127576351165771, 0.15214845538139343, 0.16302113234996796, 0.17389382421970367, 0.1847665011882782, 0.19563919305801392, 0.20651187002658844, 0.21738454699516296, 0.22825723886489868, 0.2391299158334732, 0.25000259280204773, 0.26087528467178345, 0.2717479467391968, 0.2826206386089325, 0.2934933304786682, 0.30436599254608154, 0.31523868441581726, 0.326111376285553]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 9.0, 18.0, 24.0, 46.0, 74.0, 87.0, 155.0, 257.0, 458.0, 871.0, 1637.0, 3173.0, 7169.0, 18760.0, 59948.0, 266926.0, 1458100.0, 1864577.0, 390333.0, 81018.0, 24049.0, 8856.0, 3788.0, 1787.0, 933.0, 530.0, 268.0, 171.0, 88.0, 65.0, 43.0, 24.0, 12.0, 10.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.09527587890625, -0.09283971786499023, -0.09040355682373047, -0.0879673957824707, -0.08553123474121094, -0.08309507369995117, -0.0806589126586914, -0.07822275161743164, -0.07578659057617188, -0.07335042953491211, -0.07091426849365234, -0.06847810745239258, -0.06604194641113281, -0.06360578536987305, -0.06116962432861328, -0.058733463287353516, -0.05629730224609375, -0.053861141204833984, -0.05142498016357422, -0.04898881912231445, -0.04655265808105469, -0.04411649703979492, -0.041680335998535156, -0.03924417495727539, -0.036808013916015625, -0.03437185287475586, -0.031935691833496094, -0.029499530792236328, -0.027063369750976562, -0.024627208709716797, -0.02219104766845703, -0.019754886627197266, -0.0173187255859375, -0.014882564544677734, -0.012446403503417969, -0.010010242462158203, -0.0075740814208984375, -0.005137920379638672, -0.0027017593383789062, -0.0002655982971191406, 0.002170562744140625, 0.004606723785400391, 0.007042884826660156, 0.009479045867919922, 0.011915206909179688, 0.014351367950439453, 0.01678752899169922, 0.019223690032958984, 0.02165985107421875, 0.024096012115478516, 0.02653217315673828, 0.028968334197998047, 0.03140449523925781, 0.03384065628051758, 0.036276817321777344, 0.03871297836303711, 0.041149139404296875, 0.04358530044555664, 0.046021461486816406, 0.04845762252807617, 0.05089378356933594, 0.0533299446105957, 0.05576610565185547, 0.058202266693115234, 0.060638427734375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 4.0, 7.0, 13.0, 16.0, 20.0, 23.0, 34.0, 43.0, 32.0, 53.0, 39.0, 47.0, 58.0, 41.0, 51.0, 43.0, 55.0, 54.0, 44.0, 47.0, 45.0, 38.0, 27.0, 37.0, 31.0, 23.0, 10.0, 21.0, 7.0, 18.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05517578125, -0.05360746383666992, -0.052039146423339844, -0.050470829010009766, -0.04890251159667969, -0.04733419418334961, -0.04576587677001953, -0.04419755935668945, -0.042629241943359375, -0.0410609245300293, -0.03949260711669922, -0.03792428970336914, -0.03635597229003906, -0.034787654876708984, -0.033219337463378906, -0.03165102005004883, -0.03008270263671875, -0.028514385223388672, -0.026946067810058594, -0.025377750396728516, -0.023809432983398438, -0.02224111557006836, -0.02067279815673828, -0.019104480743408203, -0.017536163330078125, -0.015967845916748047, -0.014399528503417969, -0.01283121109008789, -0.011262893676757812, -0.009694576263427734, -0.008126258850097656, -0.006557941436767578, -0.0049896240234375, -0.003421306610107422, -0.0018529891967773438, -0.0002846717834472656, 0.0012836456298828125, 0.0028519630432128906, 0.004420280456542969, 0.005988597869873047, 0.007556915283203125, 0.009125232696533203, 0.010693550109863281, 0.01226186752319336, 0.013830184936523438, 0.015398502349853516, 0.016966819763183594, 0.018535137176513672, 0.02010345458984375, 0.021671772003173828, 0.023240089416503906, 0.024808406829833984, 0.026376724243164062, 0.02794504165649414, 0.02951335906982422, 0.031081676483154297, 0.032649993896484375, 0.03421831130981445, 0.03578662872314453, 0.03735494613647461, 0.03892326354980469, 0.040491580963134766, 0.042059898376464844, 0.04362821578979492, 0.045196533203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 11.0, 27.0, 35.0, 53.0, 84.0, 162.0, 237.0, 388.0, 722.0, 1389.0, 2884.0, 6544.0, 18048.0, 63976.0, 346163.0, 2094329.0, 1388322.0, 204601.0, 42848.0, 13369.0, 5213.0, 2318.0, 1127.0, 595.0, 317.0, 197.0, 116.0, 72.0, 46.0, 26.0, 12.0, 19.0, 12.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11126708984375, -0.10741138458251953, -0.10355567932128906, -0.0996999740600586, -0.09584426879882812, -0.09198856353759766, -0.08813285827636719, -0.08427715301513672, -0.08042144775390625, -0.07656574249267578, -0.07271003723144531, -0.06885433197021484, -0.06499862670898438, -0.061142921447753906, -0.05728721618652344, -0.05343151092529297, -0.0495758056640625, -0.04572010040283203, -0.04186439514160156, -0.038008689880371094, -0.034152984619140625, -0.030297279357910156, -0.026441574096679688, -0.02258586883544922, -0.01873016357421875, -0.014874458312988281, -0.011018753051757812, -0.007163047790527344, -0.003307342529296875, 0.0005483627319335938, 0.0044040679931640625, 0.008259773254394531, 0.012115478515625, 0.01597118377685547, 0.019826889038085938, 0.023682594299316406, 0.027538299560546875, 0.031394004821777344, 0.03524971008300781, 0.03910541534423828, 0.04296112060546875, 0.04681682586669922, 0.05067253112792969, 0.054528236389160156, 0.058383941650390625, 0.062239646911621094, 0.06609535217285156, 0.06995105743408203, 0.0738067626953125, 0.07766246795654297, 0.08151817321777344, 0.0853738784790039, 0.08922958374023438, 0.09308528900146484, 0.09694099426269531, 0.10079669952392578, 0.10465240478515625, 0.10850811004638672, 0.11236381530761719, 0.11621952056884766, 0.12007522583007812, 0.1239309310913086, 0.12778663635253906, 0.13164234161376953, 0.135498046875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 9.0, 18.0, 33.0, 33.0, 32.0, 73.0, 147.0, 194.0, 305.0, 504.0, 653.0, 698.0, 498.0, 330.0, 201.0, 108.0, 78.0, 47.0, 36.0, 16.0, 17.0, 13.0, 8.0, 2.0, 7.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.07871246337890625, -0.0747833251953125, -0.07085418701171875, -0.066925048828125, -0.06299591064453125, -0.0590667724609375, -0.05513763427734375, -0.05120849609375, -0.04727935791015625, -0.0433502197265625, -0.03942108154296875, -0.035491943359375, -0.03156280517578125, -0.0276336669921875, -0.02370452880859375, -0.019775390625, -0.01584625244140625, -0.0119171142578125, -0.00798797607421875, -0.004058837890625, -0.00012969970703125, 0.0037994384765625, 0.00772857666015625, 0.01165771484375, 0.01558685302734375, 0.0195159912109375, 0.02344512939453125, 0.027374267578125, 0.03130340576171875, 0.0352325439453125, 0.03916168212890625, 0.0430908203125, 0.04701995849609375, 0.0509490966796875, 0.05487823486328125, 0.058807373046875, 0.06273651123046875, 0.0666656494140625, 0.07059478759765625, 0.07452392578125, 0.07845306396484375, 0.0823822021484375, 0.08631134033203125, 0.090240478515625, 0.09416961669921875, 0.0980987548828125, 0.10202789306640625, 0.10595703125, 0.10988616943359375, 0.1138153076171875, 0.11774444580078125, 0.121673583984375, 0.12560272216796875, 0.1295318603515625, 0.13346099853515625, 0.13739013671875, 0.14131927490234375, 0.1452484130859375, 0.14917755126953125, 0.153106689453125, 0.15703582763671875, 0.1609649658203125, 0.16489410400390625, 0.1688232421875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 8.0, 9.0, 20.0, 52.0, 55.0, 125.0, 134.0, 161.0, 161.0, 115.0, 78.0, 53.0, 18.0, 9.0, 7.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1258838176727295, -1.0969610214233398, -1.0680381059646606, -1.039115309715271, -1.0101925134658813, -0.9812695980072021, -0.9523468017578125, -0.9234239459037781, -0.8945010900497437, -0.8655782341957092, -0.8366554379463196, -0.8077325820922852, -0.7788097262382507, -0.7498868703842163, -0.7209640741348267, -0.6920412182807922, -0.6631183624267578, -0.6341955065727234, -0.6052727103233337, -0.5763498544692993, -0.5474269986152649, -0.5185041427612305, -0.4895813465118408, -0.4606584906578064, -0.43173569440841675, -0.4028128683567047, -0.3738900125026703, -0.34496718645095825, -0.31604433059692383, -0.2871215045452118, -0.25819867849349976, -0.22927582263946533, -0.2003529667854309, -0.17143012583255768, -0.14250728487968445, -0.11358445137739182, -0.08466161042451859, -0.05573877692222595, -0.026815935969352722, 0.002106904983520508, 0.031029745936393738, 0.05995258688926697, 0.0888754278421402, 0.11779826134443283, 0.14672109484672546, 0.1756439357995987, 0.20456677675247192, 0.23348961770534515, 0.2624124586582184, 0.2913352847099304, 0.32025814056396484, 0.3491809666156769, 0.3781038224697113, 0.40702664852142334, 0.43594950437545776, 0.4648723304271698, 0.49379515647888184, 0.5227180123329163, 0.5516408085823059, 0.5805636644363403, 0.6094865202903748, 0.6384093761444092, 0.6673321723937988, 0.6962550282478333, 0.7251778841018677]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 9.0, 10.0, 4.0, 12.0, 9.0, 12.0, 13.0, 11.0, 16.0, 19.0, 23.0, 24.0, 36.0, 39.0, 39.0, 38.0, 38.0, 54.0, 43.0, 56.0, 44.0, 51.0, 31.0, 42.0, 39.0, 47.0, 38.0, 23.0, 37.0, 23.0, 31.0, 17.0, 18.0, 13.0, 13.0, 14.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.4480839967727661, -0.43620961904525757, -0.424335241317749, -0.4124608635902405, -0.40058648586273193, -0.3887121081352234, -0.37683773040771484, -0.3649633526802063, -0.35308897495269775, -0.3412145972251892, -0.32934021949768066, -0.3174658417701721, -0.3055914640426636, -0.29371708631515503, -0.2818427085876465, -0.26996833086013794, -0.2580939531326294, -0.24621957540512085, -0.2343451976776123, -0.22247081995010376, -0.21059644222259521, -0.19872206449508667, -0.18684768676757812, -0.17497330904006958, -0.16309893131256104, -0.1512245535850525, -0.13935017585754395, -0.1274757981300354, -0.11560142040252686, -0.10372704267501831, -0.09185266494750977, -0.07997828722000122, -0.06810390949249268, -0.05622953176498413, -0.044355154037475586, -0.03248077630996704, -0.020606398582458496, -0.008732020854949951, 0.0031423568725585938, 0.015016734600067139, 0.026891112327575684, 0.03876549005508423, 0.05063986778259277, 0.06251424551010132, 0.07438862323760986, 0.08626300096511841, 0.09813737869262695, 0.1100117564201355, 0.12188613414764404, 0.1337605118751526, 0.14563488960266113, 0.15750926733016968, 0.16938364505767822, 0.18125802278518677, 0.1931324005126953, 0.20500677824020386, 0.2168811559677124, 0.22875553369522095, 0.2406299114227295, 0.25250428915023804, 0.2643786668777466, 0.2762530446052551, 0.28812742233276367, 0.3000018000602722, 0.31187617778778076]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 5.0, 18.0, 14.0, 17.0, 24.0, 56.0, 60.0, 110.0, 152.0, 314.0, 432.0, 790.0, 1401.0, 2408.0, 4229.0, 7405.0, 13126.0, 22796.0, 40306.0, 71674.0, 131119.0, 224158.0, 226836.0, 133300.0, 72697.0, 40775.0, 23293.0, 13157.0, 7656.0, 4281.0, 2429.0, 1417.0, 810.0, 480.0, 275.0, 192.0, 113.0, 76.0, 47.0, 20.0, 19.0, 14.0, 16.0, 10.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.1134033203125, -0.11006927490234375, -0.1067352294921875, -0.10340118408203125, -0.100067138671875, -0.09673309326171875, -0.0933990478515625, -0.09006500244140625, -0.08673095703125, -0.08339691162109375, -0.0800628662109375, -0.07672882080078125, -0.073394775390625, -0.07006072998046875, -0.0667266845703125, -0.06339263916015625, -0.06005859375, -0.05672454833984375, -0.0533905029296875, -0.05005645751953125, -0.046722412109375, -0.04338836669921875, -0.0400543212890625, -0.03672027587890625, -0.03338623046875, -0.03005218505859375, -0.0267181396484375, -0.02338409423828125, -0.020050048828125, -0.01671600341796875, -0.0133819580078125, -0.01004791259765625, -0.0067138671875, -0.00337982177734375, -4.57763671875e-05, 0.00328826904296875, 0.006622314453125, 0.00995635986328125, 0.0132904052734375, 0.01662445068359375, 0.01995849609375, 0.02329254150390625, 0.0266265869140625, 0.02996063232421875, 0.033294677734375, 0.03662872314453125, 0.0399627685546875, 0.04329681396484375, 0.046630859375, 0.04996490478515625, 0.0532989501953125, 0.05663299560546875, 0.059967041015625, 0.06330108642578125, 0.0666351318359375, 0.06996917724609375, 0.07330322265625, 0.07663726806640625, 0.0799713134765625, 0.08330535888671875, 0.086639404296875, 0.08997344970703125, 0.0933074951171875, 0.09664154052734375, 0.0999755859375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 11.0, 7.0, 15.0, 18.0, 24.0, 26.0, 22.0, 32.0, 31.0, 41.0, 66.0, 48.0, 51.0, 46.0, 62.0, 54.0, 53.0, 64.0, 61.0, 46.0, 31.0, 29.0, 31.0, 22.0, 25.0, 20.0, 16.0, 17.0, 11.0, 5.0, 12.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0623779296875, -0.0605926513671875, -0.058807373046875, -0.0570220947265625, -0.05523681640625, -0.0534515380859375, -0.051666259765625, -0.0498809814453125, -0.048095703125, -0.0463104248046875, -0.044525146484375, -0.0427398681640625, -0.04095458984375, -0.0391693115234375, -0.037384033203125, -0.0355987548828125, -0.0338134765625, -0.0320281982421875, -0.030242919921875, -0.0284576416015625, -0.02667236328125, -0.0248870849609375, -0.023101806640625, -0.0213165283203125, -0.01953125, -0.0177459716796875, -0.015960693359375, -0.0141754150390625, -0.01239013671875, -0.0106048583984375, -0.008819580078125, -0.0070343017578125, -0.0052490234375, -0.0034637451171875, -0.001678466796875, 0.0001068115234375, 0.00189208984375, 0.0036773681640625, 0.005462646484375, 0.0072479248046875, 0.009033203125, 0.0108184814453125, 0.012603759765625, 0.0143890380859375, 0.01617431640625, 0.0179595947265625, 0.019744873046875, 0.0215301513671875, 0.0233154296875, 0.0251007080078125, 0.026885986328125, 0.0286712646484375, 0.03045654296875, 0.0322418212890625, 0.034027099609375, 0.0358123779296875, 0.03759765625, 0.0393829345703125, 0.041168212890625, 0.0429534912109375, 0.04473876953125, 0.0465240478515625, 0.048309326171875, 0.0500946044921875, 0.0518798828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 13.0, 10.0, 12.0, 13.0, 17.0, 30.0, 45.0, 78.0, 78.0, 135.0, 187.0, 311.0, 559.0, 1109.0, 2176.0, 4480.0, 9333.0, 20327.0, 44982.0, 106326.0, 278852.0, 336461.0, 138776.0, 56205.0, 25128.0, 11844.0, 5356.0, 2707.0, 1316.0, 651.0, 358.0, 226.0, 109.0, 94.0, 73.0, 51.0, 46.0, 21.0, 11.0, 5.0, 10.0, 5.0, 9.0, 5.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1510009765625, -0.14581871032714844, -0.14063644409179688, -0.1354541778564453, -0.13027191162109375, -0.1250896453857422, -0.11990737915039062, -0.11472511291503906, -0.1095428466796875, -0.10436058044433594, -0.09917831420898438, -0.09399604797363281, -0.08881378173828125, -0.08363151550292969, -0.07844924926757812, -0.07326698303222656, -0.068084716796875, -0.06290245056152344, -0.057720184326171875, -0.05253791809082031, -0.04735565185546875, -0.04217338562011719, -0.036991119384765625, -0.03180885314941406, -0.0266265869140625, -0.021444320678710938, -0.016262054443359375, -0.011079788208007812, -0.00589752197265625, -0.0007152557373046875, 0.004467010498046875, 0.009649276733398438, 0.01483154296875, 0.020013809204101562, 0.025196075439453125, 0.030378341674804688, 0.03556060791015625, 0.04074287414550781, 0.045925140380859375, 0.05110740661621094, 0.0562896728515625, 0.06147193908691406, 0.06665420532226562, 0.07183647155761719, 0.07701873779296875, 0.08220100402832031, 0.08738327026367188, 0.09256553649902344, 0.097747802734375, 0.10293006896972656, 0.10811233520507812, 0.11329460144042969, 0.11847686767578125, 0.12365913391113281, 0.12884140014648438, 0.13402366638183594, 0.1392059326171875, 0.14438819885253906, 0.14957046508789062, 0.1547527313232422, 0.15993499755859375, 0.1651172637939453, 0.17029953002929688, 0.17548179626464844, 0.1806640625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 8.0, 17.0, 12.0, 20.0, 22.0, 22.0, 23.0, 28.0, 34.0, 33.0, 36.0, 49.0, 36.0, 52.0, 48.0, 62.0, 32.0, 50.0, 59.0, 46.0, 33.0, 52.0, 43.0, 24.0, 26.0, 29.0, 23.0, 16.0, 14.0, 7.0, 8.0, 4.0, 5.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.20556640625, -0.20009231567382812, -0.19461822509765625, -0.18914413452148438, -0.1836700439453125, -0.17819595336914062, -0.17272186279296875, -0.16724777221679688, -0.161773681640625, -0.15629959106445312, -0.15082550048828125, -0.14535140991210938, -0.1398773193359375, -0.13440322875976562, -0.12892913818359375, -0.12345504760742188, -0.11798095703125, -0.11250686645507812, -0.10703277587890625, -0.10155868530273438, -0.0960845947265625, -0.09061050415039062, -0.08513641357421875, -0.07966232299804688, -0.074188232421875, -0.06871414184570312, -0.06324005126953125, -0.057765960693359375, -0.0522918701171875, -0.046817779541015625, -0.04134368896484375, -0.035869598388671875, -0.0303955078125, -0.024921417236328125, -0.01944732666015625, -0.013973236083984375, -0.0084991455078125, -0.003025054931640625, 0.00244903564453125, 0.007923126220703125, 0.013397216796875, 0.018871307373046875, 0.02434539794921875, 0.029819488525390625, 0.0352935791015625, 0.040767669677734375, 0.04624176025390625, 0.051715850830078125, 0.05718994140625, 0.06266403198242188, 0.06813812255859375, 0.07361221313476562, 0.0790863037109375, 0.08456039428710938, 0.09003448486328125, 0.09550857543945312, 0.100982666015625, 0.10645675659179688, 0.11193084716796875, 0.11740493774414062, 0.1228790283203125, 0.12835311889648438, 0.13382720947265625, 0.13930130004882812, 0.144775390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 5.0, 15.0, 12.0, 22.0, 38.0, 73.0, 96.0, 135.0, 244.0, 383.0, 630.0, 1031.0, 1963.0, 3486.0, 6593.0, 12323.0, 23111.0, 43940.0, 84038.0, 160456.0, 258611.0, 211459.0, 113235.0, 59503.0, 31028.0, 16586.0, 8864.0, 4604.0, 2612.0, 1365.0, 873.0, 472.0, 275.0, 169.0, 108.0, 62.0, 42.0, 21.0, 20.0, 15.0, 11.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05731201171875, -0.05544710159301758, -0.053582191467285156, -0.051717281341552734, -0.04985237121582031, -0.04798746109008789, -0.04612255096435547, -0.04425764083862305, -0.042392730712890625, -0.0405278205871582, -0.03866291046142578, -0.03679800033569336, -0.03493309020996094, -0.033068180084228516, -0.031203269958496094, -0.029338359832763672, -0.02747344970703125, -0.025608539581298828, -0.023743629455566406, -0.021878719329833984, -0.020013809204101562, -0.01814889907836914, -0.01628398895263672, -0.014419078826904297, -0.012554168701171875, -0.010689258575439453, -0.008824348449707031, -0.006959438323974609, -0.0050945281982421875, -0.0032296180725097656, -0.0013647079467773438, 0.0005002021789550781, 0.0023651123046875, 0.004230022430419922, 0.006094932556152344, 0.007959842681884766, 0.009824752807617188, 0.01168966293334961, 0.013554573059082031, 0.015419483184814453, 0.017284393310546875, 0.019149303436279297, 0.02101421356201172, 0.02287912368774414, 0.024744033813476562, 0.026608943939208984, 0.028473854064941406, 0.030338764190673828, 0.03220367431640625, 0.03406858444213867, 0.035933494567871094, 0.037798404693603516, 0.03966331481933594, 0.04152822494506836, 0.04339313507080078, 0.0452580451965332, 0.047122955322265625, 0.04898786544799805, 0.05085277557373047, 0.05271768569946289, 0.05458259582519531, 0.056447505950927734, 0.058312416076660156, 0.06017732620239258, 0.062042236328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 5.0, 5.0, 8.0, 7.0, 8.0, 6.0, 15.0, 11.0, 23.0, 14.0, 29.0, 30.0, 46.0, 49.0, 58.0, 58.0, 60.0, 61.0, 72.0, 78.0, 46.0, 52.0, 51.0, 34.0, 22.0, 33.0, 33.0, 18.0, 17.0, 7.0, 5.0, 5.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4080276489257812e-05, -2.3369677364826202e-05, -2.2659078240394592e-05, -2.1948479115962982e-05, -2.1237879991531372e-05, -2.0527280867099762e-05, -1.9816681742668152e-05, -1.9106082618236542e-05, -1.839548349380493e-05, -1.768488436937332e-05, -1.697428524494171e-05, -1.62636861205101e-05, -1.555308699607849e-05, -1.4842487871646881e-05, -1.4131888747215271e-05, -1.3421289622783661e-05, -1.271069049835205e-05, -1.200009137392044e-05, -1.128949224948883e-05, -1.057889312505722e-05, -9.86829400062561e-06, -9.157694876194e-06, -8.44709575176239e-06, -7.73649662733078e-06, -7.02589750289917e-06, -6.31529837846756e-06, -5.60469925403595e-06, -4.89410012960434e-06, -4.1835010051727295e-06, -3.4729018807411194e-06, -2.7623027563095093e-06, -2.051703631877899e-06, -1.341104507446289e-06, -6.30505383014679e-07, 8.009374141693115e-08, 7.906928658485413e-07, 1.5012919902801514e-06, 2.2118911147117615e-06, 2.9224902391433716e-06, 3.6330893635749817e-06, 4.343688488006592e-06, 5.054287612438202e-06, 5.764886736869812e-06, 6.475485861301422e-06, 7.186084985733032e-06, 7.896684110164642e-06, 8.607283234596252e-06, 9.317882359027863e-06, 1.0028481483459473e-05, 1.0739080607891083e-05, 1.1449679732322693e-05, 1.2160278856754303e-05, 1.2870877981185913e-05, 1.3581477105617523e-05, 1.4292076230049133e-05, 1.5002675354480743e-05, 1.5713274478912354e-05, 1.6423873603343964e-05, 1.7134472727775574e-05, 1.7845071852207184e-05, 1.8555670976638794e-05, 1.9266270101070404e-05, 1.9976869225502014e-05, 2.0687468349933624e-05, 2.1398067474365234e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 8.0, 9.0, 11.0, 24.0, 24.0, 30.0, 57.0, 106.0, 154.0, 248.0, 464.0, 950.0, 2109.0, 5032.0, 12388.0, 31797.0, 78623.0, 191012.0, 347893.0, 222585.0, 92592.0, 37144.0, 14579.0, 5923.0, 2477.0, 1084.0, 527.0, 258.0, 177.0, 91.0, 62.0, 33.0, 32.0, 16.0, 7.0, 8.0, 10.0, 11.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07501220703125, -0.07263755798339844, -0.07026290893554688, -0.06788825988769531, -0.06551361083984375, -0.06313896179199219, -0.060764312744140625, -0.05838966369628906, -0.0560150146484375, -0.05364036560058594, -0.051265716552734375, -0.04889106750488281, -0.04651641845703125, -0.04414176940917969, -0.041767120361328125, -0.03939247131347656, -0.037017822265625, -0.03464317321777344, -0.032268524169921875, -0.029893875122070312, -0.02751922607421875, -0.025144577026367188, -0.022769927978515625, -0.020395278930664062, -0.0180206298828125, -0.015645980834960938, -0.013271331787109375, -0.010896682739257812, -0.00852203369140625, -0.0061473846435546875, -0.003772735595703125, -0.0013980865478515625, 0.0009765625, 0.0033512115478515625, 0.005725860595703125, 0.008100509643554688, 0.01047515869140625, 0.012849807739257812, 0.015224456787109375, 0.017599105834960938, 0.0199737548828125, 0.022348403930664062, 0.024723052978515625, 0.027097702026367188, 0.02947235107421875, 0.03184700012207031, 0.034221649169921875, 0.03659629821777344, 0.038970947265625, 0.04134559631347656, 0.043720245361328125, 0.04609489440917969, 0.04846954345703125, 0.05084419250488281, 0.053218841552734375, 0.05559349060058594, 0.0579681396484375, 0.06034278869628906, 0.06271743774414062, 0.06509208679199219, 0.06746673583984375, 0.06984138488769531, 0.07221603393554688, 0.07459068298339844, 0.07696533203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 8.0, 3.0, 8.0, 17.0, 12.0, 30.0, 25.0, 35.0, 31.0, 50.0, 66.0, 68.0, 73.0, 75.0, 100.0, 83.0, 64.0, 54.0, 37.0, 38.0, 30.0, 21.0, 16.0, 12.0, 6.0, 7.0, 6.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049652099609375, -0.047335147857666016, -0.04501819610595703, -0.04270124435424805, -0.04038429260253906, -0.03806734085083008, -0.035750389099121094, -0.03343343734741211, -0.031116485595703125, -0.02879953384399414, -0.026482582092285156, -0.024165630340576172, -0.021848678588867188, -0.019531726837158203, -0.01721477508544922, -0.014897823333740234, -0.01258087158203125, -0.010263919830322266, -0.007946968078613281, -0.005630016326904297, -0.0033130645751953125, -0.0009961128234863281, 0.0013208389282226562, 0.0036377906799316406, 0.005954742431640625, 0.00827169418334961, 0.010588645935058594, 0.012905597686767578, 0.015222549438476562, 0.017539501190185547, 0.01985645294189453, 0.022173404693603516, 0.0244903564453125, 0.026807308197021484, 0.02912425994873047, 0.03144121170043945, 0.03375816345214844, 0.03607511520385742, 0.038392066955566406, 0.04070901870727539, 0.043025970458984375, 0.04534292221069336, 0.047659873962402344, 0.04997682571411133, 0.05229377746582031, 0.0546107292175293, 0.05692768096923828, 0.059244632720947266, 0.06156158447265625, 0.06387853622436523, 0.06619548797607422, 0.0685124397277832, 0.07082939147949219, 0.07314634323120117, 0.07546329498291016, 0.07778024673461914, 0.08009719848632812, 0.08241415023803711, 0.0847311019897461, 0.08704805374145508, 0.08936500549316406, 0.09168195724487305, 0.09399890899658203, 0.09631586074829102, 0.0986328125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 20.0, 52.0, 79.0, 106.0, 163.0, 159.0, 149.0, 110.0, 61.0, 52.0, 26.0, 8.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-1.876379132270813, -1.836872935295105, -1.7973666191101074, -1.7578604221343994, -1.7183542251586914, -1.6788479089736938, -1.6393417119979858, -1.5998353958129883, -1.5603291988372803, -1.5208230018615723, -1.4813166856765747, -1.4418104887008667, -1.4023041725158691, -1.3627979755401611, -1.3232917785644531, -1.2837855815887451, -1.2442792654037476, -1.2047730684280396, -1.165266752243042, -1.125760555267334, -1.086254358291626, -1.0467480421066284, -1.0072418451309204, -0.9677355885505676, -0.9282293319702148, -0.8887230753898621, -0.8492168188095093, -0.8097106218338013, -0.7702043652534485, -0.7306981086730957, -0.6911919116973877, -0.6516856551170349, -0.6121794581413269, -0.5726732015609741, -0.5331670045852661, -0.49366074800491333, -0.45415449142456055, -0.41464823484420776, -0.37514200806617737, -0.335635781288147, -0.2961295247077942, -0.2566232681274414, -0.217117041349411, -0.17761079967021942, -0.13810455799102783, -0.09859831631183624, -0.05909207463264465, -0.019585847854614258, 0.019920408725738525, 0.059426650404930115, 0.0989328920841217, 0.1384391337633133, 0.17794537544250488, 0.21745161712169647, 0.25695785880088806, 0.29646408557891846, 0.33597034215927124, 0.375476598739624, 0.4149828255176544, 0.4544890522956848, 0.4939953088760376, 0.5335015654563904, 0.5730078220367432, 0.6125140190124512, 0.652020275592804]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 10.0, 8.0, 6.0, 13.0, 11.0, 13.0, 13.0, 20.0, 16.0, 24.0, 30.0, 28.0, 31.0, 38.0, 34.0, 33.0, 41.0, 31.0, 38.0, 32.0, 56.0, 39.0, 54.0, 29.0, 30.0, 37.0, 29.0, 31.0, 33.0, 27.0, 27.0, 20.0, 12.0, 17.0, 18.0, 11.0, 7.0, 11.0, 8.0, 7.0, 6.0, 3.0, 3.0, 0.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36016714572906494, -0.34839215874671936, -0.3366171717643738, -0.3248422145843506, -0.313067227602005, -0.3012922406196594, -0.28951725363731384, -0.27774226665496826, -0.26596730947494507, -0.2541923224925995, -0.2424173504114151, -0.23064236342906952, -0.21886739134788513, -0.20709240436553955, -0.19531741738319397, -0.18354244530200958, -0.171767458319664, -0.15999247133731842, -0.14821749925613403, -0.13644251227378845, -0.12466754019260406, -0.11289255321025848, -0.1011175736784935, -0.08934259414672852, -0.07756761461496353, -0.06579263508319855, -0.05401765555143356, -0.04224267229437828, -0.030467692762613297, -0.018692713230848312, -0.00691772997379303, 0.004857249557971954, 0.01663222908973694, 0.028407208621501923, 0.04018218815326691, 0.05195717141032219, 0.06373214721679688, 0.07550713419914246, 0.08728211373090744, 0.09905709326267242, 0.11083207279443741, 0.12260705232620239, 0.13438203930854797, 0.14615701138973236, 0.15793199837207794, 0.16970697045326233, 0.1814819574356079, 0.1932569444179535, 0.20503191649913788, 0.21680690348148346, 0.22858187556266785, 0.24035686254501343, 0.252131849527359, 0.2639068067073822, 0.2756817936897278, 0.28745678067207336, 0.29923176765441895, 0.3110067546367645, 0.3227817416191101, 0.3345566987991333, 0.3463316857814789, 0.35810667276382446, 0.36988165974617004, 0.3816566467285156, 0.3934316039085388]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 3.0, 11.0, 10.0, 13.0, 10.0, 19.0, 14.0, 26.0, 48.0, 75.0, 126.0, 209.0, 478.0, 1007.0, 2323.0, 6017.0, 17763.0, 64381.0, 334061.0, 2176434.0, 1336445.0, 192625.0, 42501.0, 12225.0, 4357.0, 1626.0, 674.0, 348.0, 165.0, 88.0, 44.0, 35.0, 25.0, 24.0, 16.0, 12.0, 15.0, 5.0, 11.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.130615234375, -0.12707042694091797, -0.12352561950683594, -0.1199808120727539, -0.11643600463867188, -0.11289119720458984, -0.10934638977050781, -0.10580158233642578, -0.10225677490234375, -0.09871196746826172, -0.09516716003417969, -0.09162235260009766, -0.08807754516601562, -0.0845327377319336, -0.08098793029785156, -0.07744312286376953, -0.0738983154296875, -0.07035350799560547, -0.06680870056152344, -0.0632638931274414, -0.059719085693359375, -0.056174278259277344, -0.05262947082519531, -0.04908466339111328, -0.04553985595703125, -0.04199504852294922, -0.03845024108886719, -0.034905433654785156, -0.031360626220703125, -0.027815818786621094, -0.024271011352539062, -0.02072620391845703, -0.017181396484375, -0.013636589050292969, -0.010091781616210938, -0.006546974182128906, -0.003002166748046875, 0.0005426406860351562, 0.0040874481201171875, 0.007632255554199219, 0.01117706298828125, 0.014721870422363281, 0.018266677856445312, 0.021811485290527344, 0.025356292724609375, 0.028901100158691406, 0.03244590759277344, 0.03599071502685547, 0.0395355224609375, 0.04308032989501953, 0.04662513732910156, 0.050169944763183594, 0.053714752197265625, 0.057259559631347656, 0.06080436706542969, 0.06434917449951172, 0.06789398193359375, 0.07143878936767578, 0.07498359680175781, 0.07852840423583984, 0.08207321166992188, 0.0856180191040039, 0.08916282653808594, 0.09270763397216797, 0.09625244140625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 4.0, 10.0, 12.0, 11.0, 16.0, 10.0, 27.0, 15.0, 23.0, 26.0, 35.0, 39.0, 38.0, 46.0, 53.0, 38.0, 64.0, 51.0, 50.0, 43.0, 52.0, 33.0, 43.0, 37.0, 53.0, 31.0, 21.0, 29.0, 19.0, 12.0, 15.0, 13.0, 8.0, 10.0, 7.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.06805419921875, -0.0662994384765625, -0.064544677734375, -0.0627899169921875, -0.06103515625, -0.0592803955078125, -0.057525634765625, -0.0557708740234375, -0.05401611328125, -0.0522613525390625, -0.050506591796875, -0.0487518310546875, -0.0469970703125, -0.0452423095703125, -0.043487548828125, -0.0417327880859375, -0.03997802734375, -0.0382232666015625, -0.036468505859375, -0.0347137451171875, -0.032958984375, -0.0312042236328125, -0.029449462890625, -0.0276947021484375, -0.02593994140625, -0.0241851806640625, -0.022430419921875, -0.0206756591796875, -0.0189208984375, -0.0171661376953125, -0.015411376953125, -0.0136566162109375, -0.01190185546875, -0.0101470947265625, -0.008392333984375, -0.0066375732421875, -0.0048828125, -0.0031280517578125, -0.001373291015625, 0.0003814697265625, 0.00213623046875, 0.0038909912109375, 0.005645751953125, 0.0074005126953125, 0.0091552734375, 0.0109100341796875, 0.012664794921875, 0.0144195556640625, 0.01617431640625, 0.0179290771484375, 0.019683837890625, 0.0214385986328125, 0.023193359375, 0.0249481201171875, 0.026702880859375, 0.0284576416015625, 0.03021240234375, 0.0319671630859375, 0.033721923828125, 0.0354766845703125, 0.0372314453125, 0.0389862060546875, 0.040740966796875, 0.0424957275390625, 0.04425048828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 8.0, 8.0, 9.0, 17.0, 24.0, 44.0, 60.0, 89.0, 114.0, 162.0, 252.0, 398.0, 623.0, 998.0, 1782.0, 2986.0, 5552.0, 10992.0, 24198.0, 58323.0, 163626.0, 534667.0, 1626158.0, 1211139.0, 356928.0, 114281.0, 42825.0, 18369.0, 8641.0, 4608.0, 2505.0, 1483.0, 887.0, 503.0, 345.0, 212.0, 151.0, 105.0, 52.0, 41.0, 39.0, 28.0, 13.0, 13.0, 7.0, 4.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10205078125, -0.0985116958618164, -0.09497261047363281, -0.09143352508544922, -0.08789443969726562, -0.08435535430908203, -0.08081626892089844, -0.07727718353271484, -0.07373809814453125, -0.07019901275634766, -0.06665992736816406, -0.06312084197998047, -0.059581756591796875, -0.05604267120361328, -0.05250358581542969, -0.048964500427246094, -0.0454254150390625, -0.041886329650878906, -0.03834724426269531, -0.03480815887451172, -0.031269073486328125, -0.02772998809814453, -0.024190902709960938, -0.020651817321777344, -0.01711273193359375, -0.013573646545410156, -0.010034561157226562, -0.006495475769042969, -0.002956390380859375, 0.0005826950073242188, 0.0041217803955078125, 0.007660865783691406, 0.011199951171875, 0.014739036560058594, 0.018278121948242188, 0.02181720733642578, 0.025356292724609375, 0.02889537811279297, 0.03243446350097656, 0.035973548889160156, 0.03951263427734375, 0.043051719665527344, 0.04659080505371094, 0.05012989044189453, 0.053668975830078125, 0.05720806121826172, 0.06074714660644531, 0.0642862319946289, 0.0678253173828125, 0.0713644027709961, 0.07490348815917969, 0.07844257354736328, 0.08198165893554688, 0.08552074432373047, 0.08905982971191406, 0.09259891510009766, 0.09613800048828125, 0.09967708587646484, 0.10321617126464844, 0.10675525665283203, 0.11029434204101562, 0.11383342742919922, 0.11737251281738281, 0.1209115982055664, 0.12445068359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 3.0, 8.0, 10.0, 20.0, 22.0, 36.0, 61.0, 60.0, 112.0, 143.0, 206.0, 335.0, 477.0, 646.0, 598.0, 424.0, 285.0, 188.0, 137.0, 102.0, 69.0, 39.0, 25.0, 14.0, 10.0, 14.0, 7.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1026611328125, -0.09851646423339844, -0.09437179565429688, -0.09022712707519531, -0.08608245849609375, -0.08193778991699219, -0.07779312133789062, -0.07364845275878906, -0.0695037841796875, -0.06535911560058594, -0.061214447021484375, -0.05706977844238281, -0.05292510986328125, -0.04878044128417969, -0.044635772705078125, -0.04049110412597656, -0.036346435546875, -0.03220176696777344, -0.028057098388671875, -0.023912429809570312, -0.01976776123046875, -0.015623092651367188, -0.011478424072265625, -0.0073337554931640625, -0.0031890869140625, 0.0009555816650390625, 0.005100250244140625, 0.009244918823242188, 0.01338958740234375, 0.017534255981445312, 0.021678924560546875, 0.025823593139648438, 0.02996826171875, 0.03411293029785156, 0.038257598876953125, 0.04240226745605469, 0.04654693603515625, 0.05069160461425781, 0.054836273193359375, 0.05898094177246094, 0.0631256103515625, 0.06727027893066406, 0.07141494750976562, 0.07555961608886719, 0.07970428466796875, 0.08384895324707031, 0.08799362182617188, 0.09213829040527344, 0.096282958984375, 0.10042762756347656, 0.10457229614257812, 0.10871696472167969, 0.11286163330078125, 0.11700630187988281, 0.12115097045898438, 0.12529563903808594, 0.1294403076171875, 0.13358497619628906, 0.13772964477539062, 0.1418743133544922, 0.14601898193359375, 0.1501636505126953, 0.15430831909179688, 0.15845298767089844, 0.16259765625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 8.0, 19.0, 18.0, 29.0, 49.0, 51.0, 60.0, 69.0, 73.0, 90.0, 83.0, 96.0, 81.0, 73.0, 56.0, 41.0, 34.0, 25.0, 14.0, 9.0, 8.0, 8.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.8232011795043945, -0.8040823340415955, -0.7849634289741516, -0.7658445835113525, -0.7467256784439087, -0.7276068329811096, -0.7084879875183105, -0.6893690824508667, -0.6702502369880676, -0.6511313915252686, -0.6320124864578247, -0.6128936409950256, -0.5937747359275818, -0.5746558904647827, -0.5555369853973389, -0.5364181399345398, -0.5172992944717407, -0.49818041920661926, -0.4790615439414978, -0.45994269847869873, -0.44082382321357727, -0.4217049479484558, -0.40258607268333435, -0.3834671974182129, -0.36434829235076904, -0.3452294170856476, -0.3261105418205261, -0.30699169635772705, -0.2878728210926056, -0.26875394582748413, -0.24963507056236267, -0.2305162101984024, -0.21139734983444214, -0.19227847456932068, -0.1731596142053604, -0.15404073894023895, -0.1349218785762787, -0.11580300331115723, -0.09668412804603577, -0.0775652676820755, -0.05844639241695404, -0.03932752460241318, -0.020208653062582016, -0.0010897815227508545, 0.01802908629179001, 0.03714795410633087, 0.05626682937145233, 0.0753856897354126, 0.09450456500053406, 0.11362343281507492, 0.13274230062961578, 0.15186117589473724, 0.1709800362586975, 0.19009891152381897, 0.20921778678894043, 0.2283366471529007, 0.24745552241802216, 0.2665743827819824, 0.2856932580471039, 0.30481213331222534, 0.3239310085773468, 0.34304988384246826, 0.36216872930526733, 0.3812876045703888, 0.40040647983551025]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 3.0, 7.0, 10.0, 7.0, 13.0, 14.0, 11.0, 19.0, 13.0, 18.0, 30.0, 28.0, 33.0, 38.0, 29.0, 42.0, 34.0, 41.0, 43.0, 39.0, 57.0, 45.0, 39.0, 37.0, 43.0, 42.0, 39.0, 34.0, 24.0, 27.0, 23.0, 19.0, 17.0, 13.0, 11.0, 17.0, 7.0, 13.0, 5.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.3826666474342346, -0.3711805045604706, -0.35969439148902893, -0.3482082486152649, -0.33672213554382324, -0.3252359926700592, -0.31374984979629517, -0.3022637367248535, -0.29077762365341187, -0.2792914807796478, -0.2678053677082062, -0.25631922483444214, -0.2448331117630005, -0.23334696888923645, -0.2218608409166336, -0.21037471294403076, -0.19888857007026672, -0.18740244209766388, -0.17591631412506104, -0.164430171251297, -0.15294405817985535, -0.1414579153060913, -0.12997178733348846, -0.11848565936088562, -0.10699953138828278, -0.09551340341567993, -0.08402727544307709, -0.07254114001989365, -0.0610550120472908, -0.04956888407468796, -0.03808274865150452, -0.026596620678901672, -0.015110492706298828, -0.0036243628710508347, 0.007861766964197159, 0.0193478986620903, 0.030834026634693146, 0.04232015460729599, 0.05380629003047943, 0.06529241800308228, 0.07677854597568512, 0.08826467394828796, 0.09975080192089081, 0.11123693734407425, 0.1227230653166771, 0.13420918583869934, 0.14569532871246338, 0.15718145668506622, 0.16866758465766907, 0.1801537126302719, 0.19163984060287476, 0.2031259834766388, 0.21461209654808044, 0.22609823942184448, 0.23758436739444733, 0.24907049536705017, 0.2605566382408142, 0.27204278111457825, 0.2835288941860199, 0.29501503705978394, 0.3065011501312256, 0.3179872930049896, 0.32947343587875366, 0.3409595489501953, 0.35244566202163696]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 9.0, 10.0, 20.0, 42.0, 42.0, 53.0, 85.0, 137.0, 181.0, 282.0, 472.0, 707.0, 1053.0, 1579.0, 2543.0, 4000.0, 6296.0, 9928.0, 16204.0, 26603.0, 44987.0, 82914.0, 161702.0, 246216.0, 198117.0, 105128.0, 55431.0, 31856.0, 19438.0, 11940.0, 7411.0, 4654.0, 2951.0, 1936.0, 1221.0, 830.0, 520.0, 345.0, 232.0, 171.0, 97.0, 76.0, 46.0, 27.0, 16.0, 12.0, 14.0, 7.0, 6.0, 1.0, 4.0, 1.0], "bins": [-0.09912109375, -0.0963430404663086, -0.09356498718261719, -0.09078693389892578, -0.08800888061523438, -0.08523082733154297, -0.08245277404785156, -0.07967472076416016, -0.07689666748046875, -0.07411861419677734, -0.07134056091308594, -0.06856250762939453, -0.06578445434570312, -0.06300640106201172, -0.06022834777832031, -0.057450294494628906, -0.0546722412109375, -0.051894187927246094, -0.04911613464355469, -0.04633808135986328, -0.043560028076171875, -0.04078197479248047, -0.03800392150878906, -0.035225868225097656, -0.03244781494140625, -0.029669761657714844, -0.026891708374023438, -0.02411365509033203, -0.021335601806640625, -0.01855754852294922, -0.015779495239257812, -0.013001441955566406, -0.010223388671875, -0.007445335388183594, -0.0046672821044921875, -0.0018892288208007812, 0.000888824462890625, 0.0036668777465820312, 0.0064449310302734375, 0.009222984313964844, 0.01200103759765625, 0.014779090881347656, 0.017557144165039062, 0.02033519744873047, 0.023113250732421875, 0.02589130401611328, 0.028669357299804688, 0.031447410583496094, 0.0342254638671875, 0.037003517150878906, 0.03978157043457031, 0.04255962371826172, 0.045337677001953125, 0.04811573028564453, 0.05089378356933594, 0.053671836853027344, 0.05644989013671875, 0.059227943420410156, 0.06200599670410156, 0.06478404998779297, 0.06756210327148438, 0.07034015655517578, 0.07311820983886719, 0.0758962631225586, 0.07867431640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 8.0, 8.0, 5.0, 13.0, 16.0, 19.0, 18.0, 27.0, 27.0, 25.0, 33.0, 40.0, 39.0, 32.0, 53.0, 51.0, 44.0, 57.0, 50.0, 52.0, 38.0, 45.0, 40.0, 34.0, 43.0, 27.0, 31.0, 22.0, 17.0, 19.0, 13.0, 9.0, 13.0, 13.0, 6.0, 5.0, 2.0, 0.0, 6.0, 1.0, 0.0, 0.0, 3.0, 3.0], "bins": [-0.07257080078125, -0.07063865661621094, -0.06870651245117188, -0.06677436828613281, -0.06484222412109375, -0.06291007995605469, -0.060977935791015625, -0.05904579162597656, -0.0571136474609375, -0.05518150329589844, -0.053249359130859375, -0.05131721496582031, -0.04938507080078125, -0.04745292663574219, -0.045520782470703125, -0.04358863830566406, -0.041656494140625, -0.03972434997558594, -0.037792205810546875, -0.03586006164550781, -0.03392791748046875, -0.03199577331542969, -0.030063629150390625, -0.028131484985351562, -0.0261993408203125, -0.024267196655273438, -0.022335052490234375, -0.020402908325195312, -0.01847076416015625, -0.016538619995117188, -0.014606475830078125, -0.012674331665039062, -0.0107421875, -0.008810043334960938, -0.006877899169921875, -0.0049457550048828125, -0.00301361083984375, -0.0010814666748046875, 0.000850677490234375, 0.0027828216552734375, 0.0047149658203125, 0.0066471099853515625, 0.008579254150390625, 0.010511398315429688, 0.01244354248046875, 0.014375686645507812, 0.016307830810546875, 0.018239974975585938, 0.020172119140625, 0.022104263305664062, 0.024036407470703125, 0.025968551635742188, 0.02790069580078125, 0.029832839965820312, 0.031764984130859375, 0.03369712829589844, 0.0356292724609375, 0.03756141662597656, 0.039493560791015625, 0.04142570495605469, 0.04335784912109375, 0.04528999328613281, 0.047222137451171875, 0.04915428161621094, 0.05108642578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 9.0, 9.0, 14.0, 11.0, 14.0, 14.0, 32.0, 41.0, 57.0, 92.0, 149.0, 347.0, 693.0, 1447.0, 3552.0, 8818.0, 22861.0, 64423.0, 260619.0, 496327.0, 125211.0, 39030.0, 14531.0, 5806.0, 2362.0, 973.0, 470.0, 228.0, 142.0, 71.0, 55.0, 37.0, 26.0, 14.0, 20.0, 9.0, 6.0, 10.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.22900390625, -0.222320556640625, -0.21563720703125, -0.208953857421875, -0.2022705078125, -0.195587158203125, -0.18890380859375, -0.182220458984375, -0.175537109375, -0.168853759765625, -0.16217041015625, -0.155487060546875, -0.1488037109375, -0.142120361328125, -0.13543701171875, -0.128753662109375, -0.1220703125, -0.115386962890625, -0.10870361328125, -0.102020263671875, -0.0953369140625, -0.088653564453125, -0.08197021484375, -0.075286865234375, -0.068603515625, -0.061920166015625, -0.05523681640625, -0.048553466796875, -0.0418701171875, -0.035186767578125, -0.02850341796875, -0.021820068359375, -0.01513671875, -0.008453369140625, -0.00177001953125, 0.004913330078125, 0.0115966796875, 0.018280029296875, 0.02496337890625, 0.031646728515625, 0.038330078125, 0.045013427734375, 0.05169677734375, 0.058380126953125, 0.0650634765625, 0.071746826171875, 0.07843017578125, 0.085113525390625, 0.091796875, 0.098480224609375, 0.10516357421875, 0.111846923828125, 0.1185302734375, 0.125213623046875, 0.13189697265625, 0.138580322265625, 0.145263671875, 0.151947021484375, 0.15863037109375, 0.165313720703125, 0.1719970703125, 0.178680419921875, 0.18536376953125, 0.192047119140625, 0.19873046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 4.0, 6.0, 10.0, 11.0, 5.0, 8.0, 10.0, 26.0, 29.0, 45.0, 30.0, 45.0, 48.0, 54.0, 43.0, 43.0, 64.0, 61.0, 60.0, 65.0, 67.0, 43.0, 43.0, 24.0, 25.0, 32.0, 15.0, 16.0, 12.0, 15.0, 7.0, 4.0, 7.0, 6.0, 5.0, 4.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2078857421875, -0.20049095153808594, -0.19309616088867188, -0.1857013702392578, -0.17830657958984375, -0.1709117889404297, -0.16351699829101562, -0.15612220764160156, -0.1487274169921875, -0.14133262634277344, -0.13393783569335938, -0.1265430450439453, -0.11914825439453125, -0.11175346374511719, -0.10435867309570312, -0.09696388244628906, -0.089569091796875, -0.08217430114746094, -0.07477951049804688, -0.06738471984863281, -0.05998992919921875, -0.05259513854980469, -0.045200347900390625, -0.03780555725097656, -0.0304107666015625, -0.023015975952148438, -0.015621185302734375, -0.008226394653320312, -0.00083160400390625, 0.0065631866455078125, 0.013957977294921875, 0.021352767944335938, 0.02874755859375, 0.03614234924316406, 0.043537139892578125, 0.05093193054199219, 0.05832672119140625, 0.06572151184082031, 0.07311630249023438, 0.08051109313964844, 0.0879058837890625, 0.09530067443847656, 0.10269546508789062, 0.11009025573730469, 0.11748504638671875, 0.12487983703613281, 0.13227462768554688, 0.13966941833496094, 0.147064208984375, 0.15445899963378906, 0.16185379028320312, 0.1692485809326172, 0.17664337158203125, 0.1840381622314453, 0.19143295288085938, 0.19882774353027344, 0.2062225341796875, 0.21361732482910156, 0.22101211547851562, 0.2284069061279297, 0.23580169677734375, 0.2431964874267578, 0.2505912780761719, 0.25798606872558594, 0.265380859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 8.0, 13.0, 21.0, 30.0, 32.0, 43.0, 70.0, 105.0, 153.0, 224.0, 354.0, 532.0, 871.0, 1310.0, 2021.0, 3167.0, 4944.0, 8166.0, 13470.0, 22677.0, 39856.0, 75505.0, 167063.0, 306790.0, 201776.0, 88587.0, 45367.0, 25479.0, 15181.0, 9123.0, 5709.0, 3553.0, 2165.0, 1477.0, 944.0, 620.0, 391.0, 239.0, 173.0, 100.0, 78.0, 53.0, 37.0, 27.0, 12.0, 13.0, 11.0, 10.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.07012939453125, -0.0681600570678711, -0.06619071960449219, -0.06422138214111328, -0.062252044677734375, -0.06028270721435547, -0.05831336975097656, -0.056344032287597656, -0.05437469482421875, -0.052405357360839844, -0.05043601989746094, -0.04846668243408203, -0.046497344970703125, -0.04452800750732422, -0.04255867004394531, -0.040589332580566406, -0.0386199951171875, -0.036650657653808594, -0.03468132019042969, -0.03271198272705078, -0.030742645263671875, -0.02877330780029297, -0.026803970336914062, -0.024834632873535156, -0.02286529541015625, -0.020895957946777344, -0.018926620483398438, -0.01695728302001953, -0.014987945556640625, -0.013018608093261719, -0.011049270629882812, -0.009079933166503906, -0.007110595703125, -0.005141258239746094, -0.0031719207763671875, -0.0012025833129882812, 0.000766754150390625, 0.0027360916137695312, 0.0047054290771484375, 0.006674766540527344, 0.00864410400390625, 0.010613441467285156, 0.012582778930664062, 0.014552116394042969, 0.016521453857421875, 0.01849079132080078, 0.020460128784179688, 0.022429466247558594, 0.0243988037109375, 0.026368141174316406, 0.028337478637695312, 0.03030681610107422, 0.032276153564453125, 0.03424549102783203, 0.03621482849121094, 0.038184165954589844, 0.04015350341796875, 0.042122840881347656, 0.04409217834472656, 0.04606151580810547, 0.048030853271484375, 0.05000019073486328, 0.05196952819824219, 0.053938865661621094, 0.055908203125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 14.0, 8.0, 19.0, 24.0, 32.0, 32.0, 48.0, 51.0, 53.0, 85.0, 78.0, 88.0, 88.0, 57.0, 52.0, 56.0, 41.0, 29.0, 20.0, 22.0, 12.0, 12.0, 6.0, 7.0, 8.0, 1.0, 3.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.4437904357910156e-05, -2.37245112657547e-05, -2.3011118173599243e-05, -2.2297725081443787e-05, -2.158433198928833e-05, -2.0870938897132874e-05, -2.0157545804977417e-05, -1.944415271282196e-05, -1.8730759620666504e-05, -1.8017366528511047e-05, -1.730397343635559e-05, -1.6590580344200134e-05, -1.5877187252044678e-05, -1.5163794159889221e-05, -1.4450401067733765e-05, -1.3737007975578308e-05, -1.3023614883422852e-05, -1.2310221791267395e-05, -1.1596828699111938e-05, -1.0883435606956482e-05, -1.0170042514801025e-05, -9.456649422645569e-06, -8.743256330490112e-06, -8.029863238334656e-06, -7.316470146179199e-06, -6.603077054023743e-06, -5.889683961868286e-06, -5.17629086971283e-06, -4.462897777557373e-06, -3.7495046854019165e-06, -3.03611159324646e-06, -2.3227185010910034e-06, -1.6093254089355469e-06, -8.959323167800903e-07, -1.825392246246338e-07, 5.308538675308228e-07, 1.2442469596862793e-06, 1.957640051841736e-06, 2.6710331439971924e-06, 3.384426236152649e-06, 4.0978193283081055e-06, 4.811212420463562e-06, 5.5246055126190186e-06, 6.237998604774475e-06, 6.951391696929932e-06, 7.664784789085388e-06, 8.378177881240845e-06, 9.091570973396301e-06, 9.804964065551758e-06, 1.0518357157707214e-05, 1.1231750249862671e-05, 1.1945143342018127e-05, 1.2658536434173584e-05, 1.337192952632904e-05, 1.4085322618484497e-05, 1.4798715710639954e-05, 1.551210880279541e-05, 1.6225501894950867e-05, 1.6938894987106323e-05, 1.765228807926178e-05, 1.8365681171417236e-05, 1.9079074263572693e-05, 1.979246735572815e-05, 2.0505860447883606e-05, 2.1219253540039062e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 5.0, 6.0, 10.0, 15.0, 24.0, 25.0, 29.0, 75.0, 116.0, 193.0, 347.0, 633.0, 1274.0, 2703.0, 5910.0, 13300.0, 30946.0, 76158.0, 223986.0, 425502.0, 163162.0, 59762.0, 24659.0, 10529.0, 4700.0, 2199.0, 1052.0, 561.0, 251.0, 159.0, 87.0, 53.0, 43.0, 22.0, 11.0, 9.0, 8.0, 8.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08685302734375, -0.08399295806884766, -0.08113288879394531, -0.07827281951904297, -0.07541275024414062, -0.07255268096923828, -0.06969261169433594, -0.0668325424194336, -0.06397247314453125, -0.061112403869628906, -0.05825233459472656, -0.05539226531982422, -0.052532196044921875, -0.04967212677001953, -0.04681205749511719, -0.043951988220214844, -0.0410919189453125, -0.038231849670410156, -0.03537178039550781, -0.03251171112060547, -0.029651641845703125, -0.02679157257080078, -0.023931503295898438, -0.021071434020996094, -0.01821136474609375, -0.015351295471191406, -0.012491226196289062, -0.009631156921386719, -0.006771087646484375, -0.003911018371582031, -0.0010509490966796875, 0.0018091201782226562, 0.004669189453125, 0.007529258728027344, 0.010389328002929688, 0.013249397277832031, 0.016109466552734375, 0.01896953582763672, 0.021829605102539062, 0.024689674377441406, 0.02754974365234375, 0.030409812927246094, 0.03326988220214844, 0.03612995147705078, 0.038990020751953125, 0.04185009002685547, 0.04471015930175781, 0.047570228576660156, 0.0504302978515625, 0.053290367126464844, 0.05615043640136719, 0.05901050567626953, 0.061870574951171875, 0.06473064422607422, 0.06759071350097656, 0.0704507827758789, 0.07331085205078125, 0.0761709213256836, 0.07903099060058594, 0.08189105987548828, 0.08475112915039062, 0.08761119842529297, 0.09047126770019531, 0.09333133697509766, 0.09619140625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 8.0, 4.0, 7.0, 6.0, 11.0, 15.0, 13.0, 19.0, 19.0, 29.0, 36.0, 49.0, 83.0, 99.0, 120.0, 109.0, 85.0, 67.0, 38.0, 40.0, 25.0, 20.0, 14.0, 17.0, 9.0, 13.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.060333251953125, -0.057569026947021484, -0.05480480194091797, -0.05204057693481445, -0.04927635192871094, -0.04651212692260742, -0.043747901916503906, -0.04098367691040039, -0.038219451904296875, -0.03545522689819336, -0.032691001892089844, -0.029926776885986328, -0.027162551879882812, -0.024398326873779297, -0.02163410186767578, -0.018869876861572266, -0.01610565185546875, -0.013341426849365234, -0.010577201843261719, -0.007812976837158203, -0.0050487518310546875, -0.002284526824951172, 0.00047969818115234375, 0.0032439231872558594, 0.006008148193359375, 0.00877237319946289, 0.011536598205566406, 0.014300823211669922, 0.017065048217773438, 0.019829273223876953, 0.02259349822998047, 0.025357723236083984, 0.0281219482421875, 0.030886173248291016, 0.03365039825439453, 0.03641462326049805, 0.03917884826660156, 0.04194307327270508, 0.044707298278808594, 0.04747152328491211, 0.050235748291015625, 0.05299997329711914, 0.055764198303222656, 0.05852842330932617, 0.06129264831542969, 0.0640568733215332, 0.06682109832763672, 0.06958532333374023, 0.07234954833984375, 0.07511377334594727, 0.07787799835205078, 0.0806422233581543, 0.08340644836425781, 0.08617067337036133, 0.08893489837646484, 0.09169912338256836, 0.09446334838867188, 0.09722757339477539, 0.0999917984008789, 0.10275602340698242, 0.10552024841308594, 0.10828447341918945, 0.11104869842529297, 0.11381292343139648, 0.1165771484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 11.0, 48.0, 203.0, 387.0, 256.0, 89.0, 19.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7232165336608887, -1.6262346506118774, -1.5292527675628662, -1.432270884513855, -1.3352890014648438, -1.2383071184158325, -1.1413252353668213, -1.0443432331085205, -0.947361409664154, -0.8503795266151428, -0.7533976435661316, -0.6564157009124756, -0.5594338178634644, -0.4624519646167755, -0.3654700517654419, -0.26848816871643066, -0.17150628566741943, -0.0745243951678276, 0.02245749533176422, 0.11943939328193665, 0.21642127633094788, 0.3134031593799591, 0.4103850722312927, 0.507366955280304, 0.6043488383293152, 0.7013307213783264, 0.7983126044273376, 0.8952945470809937, 0.9922764301300049, 1.0892583131790161, 1.1862401962280273, 1.2832220792770386, 1.3802039623260498, 1.477185845375061, 1.5741677284240723, 1.6711496114730835, 1.7681314945220947, 1.865113377571106, 1.9620952606201172, 2.059077262878418, 2.1560590267181396, 2.2530410289764404, 2.350022792816162, 2.447004795074463, 2.5439865589141846, 2.6409685611724854, 2.737950325012207, 2.834932327270508, 2.9319143295288086, 3.0288963317871094, 3.125878095626831, 3.222860097885132, 3.3198418617248535, 3.4168238639831543, 3.513805627822876, 3.6107876300811768, 3.7077693939208984, 3.804751396179199, 3.901733160018921, 3.9987151622772217, 4.095696926116943, 4.192678928375244, 4.289660930633545, 4.3866424560546875, 4.483624458312988]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 5.0, 3.0, 5.0, 15.0, 17.0, 4.0, 13.0, 16.0, 15.0, 13.0, 17.0, 20.0, 28.0, 20.0, 36.0, 28.0, 39.0, 31.0, 40.0, 32.0, 43.0, 25.0, 44.0, 30.0, 39.0, 38.0, 27.0, 38.0, 50.0, 26.0, 25.0, 21.0, 34.0, 29.0, 19.0, 19.0, 22.0, 10.0, 11.0, 13.0, 5.0, 9.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.5647876262664795, -0.5483518242835999, -0.5319159626960754, -0.5154801607131958, -0.4990442991256714, -0.48260849714279175, -0.4661726653575897, -0.4497368335723877, -0.43330100178718567, -0.41686517000198364, -0.4004293382167816, -0.3839935064315796, -0.36755770444869995, -0.35112184286117554, -0.3346860408782959, -0.31825020909309387, -0.30181437730789185, -0.2853785455226898, -0.2689427137374878, -0.25250688195228577, -0.23607106506824493, -0.2196352332830429, -0.20319941639900208, -0.18676358461380005, -0.17032775282859802, -0.153891921043396, -0.13745608925819397, -0.12102027237415314, -0.10458444058895111, -0.08814860880374908, -0.07171278446912766, -0.055276960134506226, -0.038841068744659424, -0.022405240684747696, -0.005969412624835968, 0.01046641543507576, 0.026902243494987488, 0.043338075280189514, 0.059773899614810944, 0.07620972394943237, 0.0926455557346344, 0.10908138751983643, 0.12551721930503845, 0.14195303618907928, 0.1583888679742813, 0.17482469975948334, 0.19126051664352417, 0.2076963484287262, 0.22413218021392822, 0.24056801199913025, 0.2570038437843323, 0.2734396755695343, 0.28987550735473633, 0.30631130933761597, 0.322747141122818, 0.33918297290802, 0.35561880469322205, 0.3720546364784241, 0.3884904682636261, 0.4049263000488281, 0.42136210203170776, 0.4377979636192322, 0.4542337656021118, 0.47066959738731384, 0.48710542917251587]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 2.0, 10.0, 11.0, 11.0, 17.0, 28.0, 31.0, 48.0, 68.0, 88.0, 137.0, 240.0, 344.0, 552.0, 981.0, 1705.0, 3319.0, 6527.0, 14564.0, 36182.0, 108271.0, 429539.0, 2203014.0, 1061639.0, 219963.0, 63884.0, 23217.0, 9868.0, 4614.0, 2241.0, 1220.0, 708.0, 442.0, 254.0, 172.0, 116.0, 74.0, 57.0, 23.0, 34.0, 20.0, 14.0, 7.0, 10.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.11846923828125, -0.1151571273803711, -0.11184501647949219, -0.10853290557861328, -0.10522079467773438, -0.10190868377685547, -0.09859657287597656, -0.09528446197509766, -0.09197235107421875, -0.08866024017333984, -0.08534812927246094, -0.08203601837158203, -0.07872390747070312, -0.07541179656982422, -0.07209968566894531, -0.0687875747680664, -0.0654754638671875, -0.062163352966308594, -0.05885124206542969, -0.05553913116455078, -0.052227020263671875, -0.04891490936279297, -0.04560279846191406, -0.042290687561035156, -0.03897857666015625, -0.035666465759277344, -0.03235435485839844, -0.02904224395751953, -0.025730133056640625, -0.02241802215576172, -0.019105911254882812, -0.015793800354003906, -0.012481689453125, -0.009169578552246094, -0.0058574676513671875, -0.0025453567504882812, 0.000766754150390625, 0.004078865051269531, 0.0073909759521484375, 0.010703086853027344, 0.01401519775390625, 0.017327308654785156, 0.020639419555664062, 0.02395153045654297, 0.027263641357421875, 0.03057575225830078, 0.03388786315917969, 0.037199974060058594, 0.0405120849609375, 0.043824195861816406, 0.04713630676269531, 0.05044841766357422, 0.053760528564453125, 0.05707263946533203, 0.06038475036621094, 0.06369686126708984, 0.06700897216796875, 0.07032108306884766, 0.07363319396972656, 0.07694530487060547, 0.08025741577148438, 0.08356952667236328, 0.08688163757324219, 0.0901937484741211, 0.093505859375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 8.0, 3.0, 11.0, 6.0, 12.0, 7.0, 10.0, 14.0, 22.0, 16.0, 19.0, 28.0, 26.0, 46.0, 34.0, 46.0, 37.0, 50.0, 44.0, 51.0, 60.0, 37.0, 48.0, 40.0, 40.0, 43.0, 33.0, 27.0, 31.0, 26.0, 20.0, 23.0, 21.0, 19.0, 10.0, 12.0, 5.0, 3.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.0762939453125, -0.07423210144042969, -0.07217025756835938, -0.07010841369628906, -0.06804656982421875, -0.06598472595214844, -0.06392288208007812, -0.06186103820800781, -0.0597991943359375, -0.05773735046386719, -0.055675506591796875, -0.05361366271972656, -0.05155181884765625, -0.04948997497558594, -0.047428131103515625, -0.04536628723144531, -0.043304443359375, -0.04124259948730469, -0.039180755615234375, -0.03711891174316406, -0.03505706787109375, -0.03299522399902344, -0.030933380126953125, -0.028871536254882812, -0.0268096923828125, -0.024747848510742188, -0.022686004638671875, -0.020624160766601562, -0.01856231689453125, -0.016500473022460938, -0.014438629150390625, -0.012376785278320312, -0.01031494140625, -0.008253097534179688, -0.006191253662109375, -0.0041294097900390625, -0.00206756591796875, -5.7220458984375e-06, 0.002056121826171875, 0.0041179656982421875, 0.0061798095703125, 0.008241653442382812, 0.010303497314453125, 0.012365341186523438, 0.01442718505859375, 0.016489028930664062, 0.018550872802734375, 0.020612716674804688, 0.022674560546875, 0.024736404418945312, 0.026798248291015625, 0.028860092163085938, 0.03092193603515625, 0.03298377990722656, 0.035045623779296875, 0.03710746765136719, 0.0391693115234375, 0.04123115539550781, 0.043292999267578125, 0.04535484313964844, 0.04741668701171875, 0.04947853088378906, 0.051540374755859375, 0.05360221862792969, 0.0556640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 5.0, 8.0, 5.0, 13.0, 21.0, 23.0, 35.0, 66.0, 82.0, 118.0, 173.0, 325.0, 575.0, 1046.0, 2078.0, 4545.0, 11217.0, 33856.0, 128198.0, 722717.0, 2600350.0, 538612.0, 103484.0, 28825.0, 9686.0, 3985.0, 1882.0, 964.0, 515.0, 309.0, 193.0, 110.0, 65.0, 47.0, 41.0, 37.0, 17.0, 12.0, 9.0, 5.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2301025390625, -0.2227802276611328, -0.21545791625976562, -0.20813560485839844, -0.20081329345703125, -0.19349098205566406, -0.18616867065429688, -0.1788463592529297, -0.1715240478515625, -0.1642017364501953, -0.15687942504882812, -0.14955711364746094, -0.14223480224609375, -0.13491249084472656, -0.12759017944335938, -0.12026786804199219, -0.112945556640625, -0.10562324523925781, -0.09830093383789062, -0.09097862243652344, -0.08365631103515625, -0.07633399963378906, -0.06901168823242188, -0.06168937683105469, -0.0543670654296875, -0.04704475402832031, -0.039722442626953125, -0.03240013122558594, -0.02507781982421875, -0.017755508422851562, -0.010433197021484375, -0.0031108856201171875, 0.00421142578125, 0.011533737182617188, 0.018856048583984375, 0.026178359985351562, 0.03350067138671875, 0.04082298278808594, 0.048145294189453125, 0.05546760559082031, 0.0627899169921875, 0.07011222839355469, 0.07743453979492188, 0.08475685119628906, 0.09207916259765625, 0.09940147399902344, 0.10672378540039062, 0.11404609680175781, 0.121368408203125, 0.1286907196044922, 0.13601303100585938, 0.14333534240722656, 0.15065765380859375, 0.15797996520996094, 0.16530227661132812, 0.1726245880126953, 0.1799468994140625, 0.1872692108154297, 0.19459152221679688, 0.20191383361816406, 0.20923614501953125, 0.21655845642089844, 0.22388076782226562, 0.2312030792236328, 0.238525390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 12.0, 9.0, 21.0, 20.0, 45.0, 63.0, 79.0, 145.0, 269.0, 490.0, 792.0, 884.0, 510.0, 275.0, 152.0, 105.0, 71.0, 38.0, 31.0, 16.0, 16.0, 7.0, 5.0, 2.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125, -0.11875152587890625, -0.1125030517578125, -0.10625457763671875, -0.100006103515625, -0.09375762939453125, -0.0875091552734375, -0.08126068115234375, -0.07501220703125, -0.06876373291015625, -0.0625152587890625, -0.05626678466796875, -0.050018310546875, -0.04376983642578125, -0.0375213623046875, -0.03127288818359375, -0.0250244140625, -0.01877593994140625, -0.0125274658203125, -0.00627899169921875, -3.0517578125e-05, 0.00621795654296875, 0.0124664306640625, 0.01871490478515625, 0.02496337890625, 0.03121185302734375, 0.0374603271484375, 0.04370880126953125, 0.049957275390625, 0.05620574951171875, 0.0624542236328125, 0.06870269775390625, 0.074951171875, 0.08119964599609375, 0.0874481201171875, 0.09369659423828125, 0.099945068359375, 0.10619354248046875, 0.1124420166015625, 0.11869049072265625, 0.12493896484375, 0.13118743896484375, 0.1374359130859375, 0.14368438720703125, 0.149932861328125, 0.15618133544921875, 0.1624298095703125, 0.16867828369140625, 0.1749267578125, 0.18117523193359375, 0.1874237060546875, 0.19367218017578125, 0.199920654296875, 0.20616912841796875, 0.2124176025390625, 0.21866607666015625, 0.22491455078125, 0.23116302490234375, 0.2374114990234375, 0.24365997314453125, 0.249908447265625, 0.25615692138671875, 0.2624053955078125, 0.26865386962890625, 0.27490234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 8.0, 7.0, 17.0, 37.0, 52.0, 86.0, 113.0, 119.0, 135.0, 130.0, 95.0, 89.0, 41.0, 33.0, 18.0, 15.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7478920221328735, -0.7160083651542664, -0.6841246485710144, -0.6522409915924072, -0.6203572750091553, -0.5884736180305481, -0.5565899610519409, -0.524706244468689, -0.4928225576877594, -0.46093887090682983, -0.42905518412590027, -0.3971714973449707, -0.3652878403663635, -0.3334041237831116, -0.3015204668045044, -0.26963678002357483, -0.23775309324264526, -0.2058694064617157, -0.17398571968078613, -0.14210204780101776, -0.1102183610200882, -0.07833467423915863, -0.04645100235939026, -0.014567315578460693, 0.017316371202468872, 0.04920005425810814, 0.0810837373137474, 0.11296741664409637, 0.14485110342502594, 0.1767347902059555, 0.20861846208572388, 0.24050214886665344, 0.272385835647583, 0.3042695224285126, 0.33615320920944214, 0.3680368661880493, 0.39992058277130127, 0.43180423974990845, 0.463687926530838, 0.4955716133117676, 0.5274553298950195, 0.5593389868736267, 0.5912227034568787, 0.6231063604354858, 0.6549900770187378, 0.686873733997345, 0.7187573909759521, 0.7506411075592041, 0.7825247645378113, 0.8144084215164185, 0.8462921380996704, 0.8781757950782776, 0.9100595116615295, 0.9419431686401367, 0.9738268852233887, 1.0057106018066406, 1.037594199180603, 1.069477915763855, 1.1013615131378174, 1.1332452297210693, 1.1651289463043213, 1.1970126628875732, 1.2288962602615356, 1.2607799768447876, 1.2926636934280396]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 6.0, 0.0, 5.0, 6.0, 9.0, 11.0, 11.0, 10.0, 19.0, 18.0, 18.0, 32.0, 17.0, 17.0, 36.0, 22.0, 41.0, 36.0, 32.0, 40.0, 33.0, 36.0, 30.0, 46.0, 34.0, 41.0, 33.0, 42.0, 34.0, 36.0, 28.0, 22.0, 41.0, 15.0, 28.0, 24.0, 14.0, 13.0, 7.0, 16.0, 10.0, 8.0, 6.0, 10.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.38295233249664307, -0.37084120512008667, -0.3587300479412079, -0.3466189205646515, -0.3345077931880951, -0.3223966658115387, -0.3102855086326599, -0.2981743812561035, -0.2860632538795471, -0.2739521265029907, -0.26184096932411194, -0.24972984194755554, -0.23761871457099915, -0.22550757229328156, -0.21339643001556396, -0.20128530263900757, -0.18917416036128998, -0.1770630180835724, -0.164951890707016, -0.1528407484292984, -0.140729621052742, -0.12861847877502441, -0.11650734394788742, -0.10439620912075043, -0.09228507429361343, -0.08017393946647644, -0.06806280463933945, -0.055951666086912155, -0.04384053125977516, -0.03172939643263817, -0.019618257880210876, -0.007507123053073883, 0.00460401177406311, 0.016715146601200104, 0.028826283290982246, 0.04093741998076439, 0.05304855480790138, 0.06515969336032867, 0.07727082818746567, 0.08938196301460266, 0.10149309784173965, 0.11360423266887665, 0.12571537494659424, 0.13782650232315063, 0.14993764460086823, 0.16204877197742462, 0.1741599142551422, 0.1862710416316986, 0.1983821839094162, 0.2104933261871338, 0.22260445356369019, 0.23471559584140778, 0.24682672321796417, 0.25893786549568176, 0.27104899287223816, 0.28316015005111694, 0.29527127742767334, 0.30738240480422974, 0.3194935619831085, 0.3316046893596649, 0.3437158167362213, 0.3558269441127777, 0.3679381012916565, 0.3800492286682129, 0.3921603560447693]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 21.0, 20.0, 26.0, 51.0, 76.0, 111.0, 161.0, 232.0, 358.0, 576.0, 826.0, 1185.0, 1934.0, 2961.0, 4413.0, 6689.0, 10454.0, 16067.0, 25925.0, 44720.0, 87275.0, 189924.0, 282622.0, 178359.0, 81994.0, 42251.0, 24828.0, 15469.0, 10092.0, 6472.0, 4187.0, 2834.0, 1900.0, 1151.0, 817.0, 511.0, 326.0, 246.0, 158.0, 114.0, 76.0, 37.0, 42.0, 25.0, 8.0, 10.0, 12.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.098876953125, -0.09592151641845703, -0.09296607971191406, -0.0900106430053711, -0.08705520629882812, -0.08409976959228516, -0.08114433288574219, -0.07818889617919922, -0.07523345947265625, -0.07227802276611328, -0.06932258605957031, -0.06636714935302734, -0.06341171264648438, -0.060456275939941406, -0.05750083923339844, -0.05454540252685547, -0.0515899658203125, -0.04863452911376953, -0.04567909240722656, -0.042723655700683594, -0.039768218994140625, -0.036812782287597656, -0.03385734558105469, -0.03090190887451172, -0.02794647216796875, -0.02499103546142578, -0.022035598754882812, -0.019080162048339844, -0.016124725341796875, -0.013169288635253906, -0.010213851928710938, -0.007258415222167969, -0.004302978515625, -0.0013475418090820312, 0.0016078948974609375, 0.004563331604003906, 0.007518768310546875, 0.010474205017089844, 0.013429641723632812, 0.01638507843017578, 0.01934051513671875, 0.02229595184326172, 0.025251388549804688, 0.028206825256347656, 0.031162261962890625, 0.034117698669433594, 0.03707313537597656, 0.04002857208251953, 0.0429840087890625, 0.04593944549560547, 0.04889488220214844, 0.051850318908691406, 0.054805755615234375, 0.057761192321777344, 0.06071662902832031, 0.06367206573486328, 0.06662750244140625, 0.06958293914794922, 0.07253837585449219, 0.07549381256103516, 0.07844924926757812, 0.0814046859741211, 0.08436012268066406, 0.08731555938720703, 0.09027099609375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 8.0, 4.0, 7.0, 10.0, 10.0, 7.0, 13.0, 17.0, 26.0, 25.0, 23.0, 18.0, 32.0, 31.0, 29.0, 33.0, 33.0, 37.0, 45.0, 50.0, 38.0, 34.0, 53.0, 49.0, 37.0, 36.0, 26.0, 38.0, 29.0, 25.0, 23.0, 26.0, 34.0, 13.0, 12.0, 17.0, 13.0, 9.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.07305908203125, -0.07106924057006836, -0.06907939910888672, -0.06708955764770508, -0.06509971618652344, -0.0631098747253418, -0.061120033264160156, -0.059130191802978516, -0.057140350341796875, -0.055150508880615234, -0.053160667419433594, -0.05117082595825195, -0.04918098449707031, -0.04719114303588867, -0.04520130157470703, -0.04321146011352539, -0.04122161865234375, -0.03923177719116211, -0.03724193572998047, -0.03525209426879883, -0.03326225280761719, -0.03127241134643555, -0.029282569885253906, -0.027292728424072266, -0.025302886962890625, -0.023313045501708984, -0.021323204040527344, -0.019333362579345703, -0.017343521118164062, -0.015353679656982422, -0.013363838195800781, -0.01137399673461914, -0.0093841552734375, -0.007394313812255859, -0.005404472351074219, -0.003414630889892578, -0.0014247894287109375, 0.0005650520324707031, 0.0025548934936523438, 0.004544734954833984, 0.006534576416015625, 0.008524417877197266, 0.010514259338378906, 0.012504100799560547, 0.014493942260742188, 0.016483783721923828, 0.01847362518310547, 0.02046346664428711, 0.02245330810546875, 0.02444314956665039, 0.02643299102783203, 0.028422832489013672, 0.030412673950195312, 0.03240251541137695, 0.034392356872558594, 0.036382198333740234, 0.038372039794921875, 0.040361881256103516, 0.042351722717285156, 0.0443415641784668, 0.04633140563964844, 0.04832124710083008, 0.05031108856201172, 0.05230093002319336, 0.054290771484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 10.0, 8.0, 3.0, 7.0, 6.0, 13.0, 17.0, 28.0, 45.0, 45.0, 63.0, 99.0, 183.0, 289.0, 592.0, 1203.0, 2802.0, 6994.0, 18253.0, 52629.0, 259388.0, 556116.0, 101375.0, 29639.0, 10971.0, 4238.0, 1739.0, 785.0, 376.0, 223.0, 130.0, 84.0, 53.0, 36.0, 28.0, 26.0, 12.0, 13.0, 7.0, 7.0, 7.0, 6.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.281982421875, -0.2742023468017578, -0.2664222717285156, -0.25864219665527344, -0.25086212158203125, -0.24308204650878906, -0.23530197143554688, -0.2275218963623047, -0.2197418212890625, -0.2119617462158203, -0.20418167114257812, -0.19640159606933594, -0.18862152099609375, -0.18084144592285156, -0.17306137084960938, -0.1652812957763672, -0.157501220703125, -0.1497211456298828, -0.14194107055664062, -0.13416099548339844, -0.12638092041015625, -0.11860084533691406, -0.11082077026367188, -0.10304069519042969, -0.0952606201171875, -0.08748054504394531, -0.07970046997070312, -0.07192039489746094, -0.06414031982421875, -0.05636024475097656, -0.048580169677734375, -0.04080009460449219, -0.03302001953125, -0.025239944458007812, -0.017459869384765625, -0.009679794311523438, -0.00189971923828125, 0.0058803558349609375, 0.013660430908203125, 0.021440505981445312, 0.0292205810546875, 0.03700065612792969, 0.044780731201171875, 0.05256080627441406, 0.06034088134765625, 0.06812095642089844, 0.07590103149414062, 0.08368110656738281, 0.091461181640625, 0.09924125671386719, 0.10702133178710938, 0.11480140686035156, 0.12258148193359375, 0.13036155700683594, 0.13814163208007812, 0.1459217071533203, 0.1537017822265625, 0.1614818572998047, 0.16926193237304688, 0.17704200744628906, 0.18482208251953125, 0.19260215759277344, 0.20038223266601562, 0.2081623077392578, 0.2159423828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 10.0, 9.0, 20.0, 21.0, 24.0, 28.0, 33.0, 36.0, 45.0, 53.0, 66.0, 58.0, 59.0, 65.0, 53.0, 64.0, 44.0, 48.0, 50.0, 41.0, 40.0, 30.0, 26.0, 18.0, 11.0, 11.0, 4.0, 8.0, 3.0, 6.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2685546875, -0.25923919677734375, -0.2499237060546875, -0.24060821533203125, -0.231292724609375, -0.22197723388671875, -0.2126617431640625, -0.20334625244140625, -0.19403076171875, -0.18471527099609375, -0.1753997802734375, -0.16608428955078125, -0.156768798828125, -0.14745330810546875, -0.1381378173828125, -0.12882232666015625, -0.1195068359375, -0.11019134521484375, -0.1008758544921875, -0.09156036376953125, -0.082244873046875, -0.07292938232421875, -0.0636138916015625, -0.05429840087890625, -0.04498291015625, -0.03566741943359375, -0.0263519287109375, -0.01703643798828125, -0.007720947265625, 0.00159454345703125, 0.0109100341796875, 0.02022552490234375, 0.029541015625, 0.03885650634765625, 0.0481719970703125, 0.05748748779296875, 0.066802978515625, 0.07611846923828125, 0.0854339599609375, 0.09474945068359375, 0.10406494140625, 0.11338043212890625, 0.1226959228515625, 0.13201141357421875, 0.141326904296875, 0.15064239501953125, 0.1599578857421875, 0.16927337646484375, 0.1785888671875, 0.18790435791015625, 0.1972198486328125, 0.20653533935546875, 0.215850830078125, 0.22516632080078125, 0.2344818115234375, 0.24379730224609375, 0.25311279296875, 0.26242828369140625, 0.2717437744140625, 0.28105926513671875, 0.290374755859375, 0.29969024658203125, 0.3090057373046875, 0.31832122802734375, 0.32763671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 1.0, 9.0, 3.0, 14.0, 23.0, 19.0, 30.0, 31.0, 53.0, 76.0, 97.0, 137.0, 178.0, 300.0, 337.0, 541.0, 804.0, 1159.0, 2007.0, 3658.0, 7836.0, 18212.0, 48207.0, 245363.0, 569405.0, 96074.0, 29087.0, 12062.0, 5483.0, 2670.0, 1549.0, 888.0, 609.0, 448.0, 352.0, 237.0, 150.0, 126.0, 87.0, 72.0, 44.0, 37.0, 22.0, 16.0, 14.0, 14.0, 3.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.130126953125, -0.12609291076660156, -0.12205886840820312, -0.11802482604980469, -0.11399078369140625, -0.10995674133300781, -0.10592269897460938, -0.10188865661621094, -0.0978546142578125, -0.09382057189941406, -0.08978652954101562, -0.08575248718261719, -0.08171844482421875, -0.07768440246582031, -0.07365036010742188, -0.06961631774902344, -0.065582275390625, -0.06154823303222656, -0.057514190673828125, -0.05348014831542969, -0.04944610595703125, -0.04541206359863281, -0.041378021240234375, -0.03734397888183594, -0.0333099365234375, -0.029275894165039062, -0.025241851806640625, -0.021207809448242188, -0.01717376708984375, -0.013139724731445312, -0.009105682373046875, -0.0050716400146484375, -0.00103759765625, 0.0029964447021484375, 0.007030487060546875, 0.011064529418945312, 0.01509857177734375, 0.019132614135742188, 0.023166656494140625, 0.027200698852539062, 0.0312347412109375, 0.03526878356933594, 0.039302825927734375, 0.04333686828613281, 0.04737091064453125, 0.05140495300292969, 0.055438995361328125, 0.05947303771972656, 0.063507080078125, 0.06754112243652344, 0.07157516479492188, 0.07560920715332031, 0.07964324951171875, 0.08367729187011719, 0.08771133422851562, 0.09174537658691406, 0.0957794189453125, 0.09981346130371094, 0.10384750366210938, 0.10788154602050781, 0.11191558837890625, 0.11594963073730469, 0.11998367309570312, 0.12401771545410156, 0.1280517578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 6.0, 2.0, 3.0, 12.0, 13.0, 15.0, 31.0, 31.0, 33.0, 43.0, 67.0, 79.0, 83.0, 98.0, 91.0, 71.0, 80.0, 62.0, 41.0, 24.0, 14.0, 17.0, 7.0, 14.0, 10.0, 5.0, 4.0, 3.0, 1.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5570392608642578e-05, -2.4809502065181732e-05, -2.4048611521720886e-05, -2.328772097826004e-05, -2.2526830434799194e-05, -2.176593989133835e-05, -2.1005049347877502e-05, -2.0244158804416656e-05, -1.948326826095581e-05, -1.8722377717494965e-05, -1.796148717403412e-05, -1.7200596630573273e-05, -1.6439706087112427e-05, -1.567881554365158e-05, -1.4917925000190735e-05, -1.4157034456729889e-05, -1.3396143913269043e-05, -1.2635253369808197e-05, -1.1874362826347351e-05, -1.1113472282886505e-05, -1.035258173942566e-05, -9.591691195964813e-06, -8.830800652503967e-06, -8.069910109043121e-06, -7.309019565582275e-06, -6.5481290221214294e-06, -5.7872384786605835e-06, -5.0263479351997375e-06, -4.265457391738892e-06, -3.5045668482780457e-06, -2.7436763048171997e-06, -1.9827857613563538e-06, -1.2218952178955078e-06, -4.6100467443466187e-07, 2.998858690261841e-07, 1.06077641248703e-06, 1.821666955947876e-06, 2.582557499408722e-06, 3.343448042869568e-06, 4.104338586330414e-06, 4.86522912979126e-06, 5.626119673252106e-06, 6.387010216712952e-06, 7.147900760173798e-06, 7.908791303634644e-06, 8.66968184709549e-06, 9.430572390556335e-06, 1.0191462934017181e-05, 1.0952353477478027e-05, 1.1713244020938873e-05, 1.247413456439972e-05, 1.3235025107860565e-05, 1.3995915651321411e-05, 1.4756806194782257e-05, 1.5517696738243103e-05, 1.627858728170395e-05, 1.7039477825164795e-05, 1.780036836862564e-05, 1.8561258912086487e-05, 1.9322149455547333e-05, 2.008303999900818e-05, 2.0843930542469025e-05, 2.160482108592987e-05, 2.2365711629390717e-05, 2.3126602172851562e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 3.0, 9.0, 8.0, 7.0, 8.0, 12.0, 13.0, 26.0, 35.0, 46.0, 81.0, 203.0, 379.0, 836.0, 2051.0, 4915.0, 13506.0, 39555.0, 189694.0, 639068.0, 111589.0, 29452.0, 10104.0, 3917.0, 1556.0, 677.0, 349.0, 191.0, 95.0, 37.0, 26.0, 27.0, 17.0, 13.0, 15.0, 9.0, 5.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1514892578125, -0.1470813751220703, -0.14267349243164062, -0.13826560974121094, -0.13385772705078125, -0.12944984436035156, -0.12504196166992188, -0.12063407897949219, -0.1162261962890625, -0.11181831359863281, -0.10741043090820312, -0.10300254821777344, -0.09859466552734375, -0.09418678283691406, -0.08977890014648438, -0.08537101745605469, -0.080963134765625, -0.07655525207519531, -0.07214736938476562, -0.06773948669433594, -0.06333160400390625, -0.05892372131347656, -0.054515838623046875, -0.05010795593261719, -0.0457000732421875, -0.04129219055175781, -0.036884307861328125, -0.03247642517089844, -0.02806854248046875, -0.023660659790039062, -0.019252777099609375, -0.014844894409179688, -0.01043701171875, -0.0060291290283203125, -0.001621246337890625, 0.0027866363525390625, 0.00719451904296875, 0.011602401733398438, 0.016010284423828125, 0.020418167114257812, 0.0248260498046875, 0.029233932495117188, 0.033641815185546875, 0.03804969787597656, 0.04245758056640625, 0.04686546325683594, 0.051273345947265625, 0.05568122863769531, 0.060089111328125, 0.06449699401855469, 0.06890487670898438, 0.07331275939941406, 0.07772064208984375, 0.08212852478027344, 0.08653640747070312, 0.09094429016113281, 0.0953521728515625, 0.09976005554199219, 0.10416793823242188, 0.10857582092285156, 0.11298370361328125, 0.11739158630371094, 0.12179946899414062, 0.1262073516845703, 0.130615234375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 7.0, 7.0, 17.0, 19.0, 29.0, 66.0, 149.0, 241.0, 208.0, 101.0, 42.0, 24.0, 16.0, 20.0, 7.0, 4.0, 4.0, 7.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1865234375, -0.18144798278808594, -0.17637252807617188, -0.1712970733642578, -0.16622161865234375, -0.1611461639404297, -0.15607070922851562, -0.15099525451660156, -0.1459197998046875, -0.14084434509277344, -0.13576889038085938, -0.1306934356689453, -0.12561798095703125, -0.12054252624511719, -0.11546707153320312, -0.11039161682128906, -0.105316162109375, -0.10024070739746094, -0.09516525268554688, -0.09008979797363281, -0.08501434326171875, -0.07993888854980469, -0.07486343383789062, -0.06978797912597656, -0.0647125244140625, -0.05963706970214844, -0.054561614990234375, -0.04948616027832031, -0.04441070556640625, -0.03933525085449219, -0.034259796142578125, -0.029184341430664062, -0.02410888671875, -0.019033432006835938, -0.013957977294921875, -0.008882522583007812, -0.00380706787109375, 0.0012683868408203125, 0.006343841552734375, 0.011419296264648438, 0.0164947509765625, 0.021570205688476562, 0.026645660400390625, 0.03172111511230469, 0.03679656982421875, 0.04187202453613281, 0.046947479248046875, 0.05202293395996094, 0.057098388671875, 0.06217384338378906, 0.06724929809570312, 0.07232475280761719, 0.07740020751953125, 0.08247566223144531, 0.08755111694335938, 0.09262657165527344, 0.0977020263671875, 0.10277748107910156, 0.10785293579101562, 0.11292839050292969, 0.11800384521484375, 0.12307929992675781, 0.12815475463867188, 0.13323020935058594, 0.1383056640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 9.0, 9.0, 34.0, 110.0, 210.0, 279.0, 166.0, 120.0, 44.0, 24.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7653948664665222, -0.6990396976470947, -0.6326845288276672, -0.5663293600082397, -0.49997416138648987, -0.4336189925670624, -0.3672637939453125, -0.300908625125885, -0.23455345630645752, -0.16819828748703003, -0.10184310376644135, -0.03548792004585266, 0.03086724877357483, 0.09722241759300232, 0.1635776162147522, 0.2299327850341797, 0.2962879538536072, 0.36264312267303467, 0.42899829149246216, 0.49535349011421204, 0.5617086887359619, 0.6280637979507446, 0.6944190263748169, 0.7607741951942444, 0.8271293640136719, 0.8934845328330994, 0.9598397016525269, 1.0261949300765991, 1.0925500392913818, 1.158905267715454, 1.2252604961395264, 1.291615605354309, 1.3579707145690918, 1.424325942993164, 1.4906810522079468, 1.557036280632019, 1.6233913898468018, 1.689746618270874, 1.7561018466949463, 1.822456955909729, 1.8888120651245117, 1.955167293548584, 2.0215225219726562, 2.0878775119781494, 2.1542327404022217, 2.220587968826294, 2.286943197250366, 2.3532981872558594, 2.4196534156799316, 2.486008644104004, 2.552363872528076, 2.6187188625335693, 2.6850740909576416, 2.751429319381714, 2.817784547805786, 2.8841395378112793, 2.9504950046539307, 3.016850233078003, 3.083205461502075, 3.1495604515075684, 3.2159156799316406, 3.282270908355713, 3.348626136779785, 3.4149813652038574, 3.4813363552093506]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 9.0, 7.0, 19.0, 16.0, 20.0, 34.0, 17.0, 26.0, 43.0, 29.0, 29.0, 43.0, 38.0, 52.0, 43.0, 42.0, 52.0, 47.0, 33.0, 40.0, 41.0, 57.0, 30.0, 40.0, 23.0, 24.0, 21.0, 20.0, 20.0, 11.0, 9.0, 14.0, 9.0, 0.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.651595950126648, -0.6304101943969727, -0.6092244386672974, -0.5880386829376221, -0.5668529272079468, -0.5456671714782715, -0.5244814157485962, -0.5032956600189209, -0.4821099042892456, -0.4609241485595703, -0.439738392829895, -0.4185526371002197, -0.39736688137054443, -0.37618112564086914, -0.35499536991119385, -0.33380961418151855, -0.31262385845184326, -0.29143810272216797, -0.2702523469924927, -0.24906659126281738, -0.2278808355331421, -0.2066950798034668, -0.1855093240737915, -0.1643235683441162, -0.14313781261444092, -0.12195205688476562, -0.10076630115509033, -0.07958054542541504, -0.058394789695739746, -0.03720903396606445, -0.01602327823638916, 0.005162477493286133, 0.0263482928276062, 0.047534048557281494, 0.06871980428695679, 0.08990556001663208, 0.11109131574630737, 0.13227707147598267, 0.15346282720565796, 0.17464858293533325, 0.19583433866500854, 0.21702009439468384, 0.23820585012435913, 0.2593916058540344, 0.2805773615837097, 0.301763117313385, 0.3229488730430603, 0.3441346287727356, 0.3653203845024109, 0.3865061402320862, 0.4076918959617615, 0.42887765169143677, 0.45006340742111206, 0.47124916315078735, 0.49243491888046265, 0.5136206746101379, 0.5348064303398132, 0.5559921860694885, 0.5771779417991638, 0.5983636975288391, 0.6195494532585144, 0.6407352089881897, 0.661920964717865, 0.6831067204475403, 0.7042924761772156]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 18.0, 23.0, 19.0, 26.0, 33.0, 51.0, 110.0, 102.0, 213.0, 325.0, 563.0, 1023.0, 1834.0, 3624.0, 7094.0, 15904.0, 39515.0, 119465.0, 489449.0, 2546712.0, 723668.0, 158927.0, 50165.0, 18970.0, 8148.0, 3959.0, 1943.0, 1013.0, 546.0, 318.0, 193.0, 91.0, 74.0, 49.0, 24.0, 28.0, 11.0, 14.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.14697265625, -0.14272594451904297, -0.13847923278808594, -0.1342325210571289, -0.12998580932617188, -0.12573909759521484, -0.12149238586425781, -0.11724567413330078, -0.11299896240234375, -0.10875225067138672, -0.10450553894042969, -0.10025882720947266, -0.09601211547851562, -0.0917654037475586, -0.08751869201660156, -0.08327198028564453, -0.0790252685546875, -0.07477855682373047, -0.07053184509277344, -0.0662851333618164, -0.062038421630859375, -0.057791709899902344, -0.05354499816894531, -0.04929828643798828, -0.04505157470703125, -0.04080486297607422, -0.03655815124511719, -0.032311439514160156, -0.028064727783203125, -0.023818016052246094, -0.019571304321289062, -0.015324592590332031, -0.011077880859375, -0.006831169128417969, -0.0025844573974609375, 0.0016622543334960938, 0.005908966064453125, 0.010155677795410156, 0.014402389526367188, 0.01864910125732422, 0.02289581298828125, 0.02714252471923828, 0.03138923645019531, 0.035635948181152344, 0.039882659912109375, 0.044129371643066406, 0.04837608337402344, 0.05262279510498047, 0.0568695068359375, 0.06111621856689453, 0.06536293029785156, 0.0696096420288086, 0.07385635375976562, 0.07810306549072266, 0.08234977722167969, 0.08659648895263672, 0.09084320068359375, 0.09508991241455078, 0.09933662414550781, 0.10358333587646484, 0.10783004760742188, 0.1120767593383789, 0.11632347106933594, 0.12057018280029297, 0.12481689453125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 7.0, 9.0, 7.0, 11.0, 10.0, 13.0, 15.0, 13.0, 18.0, 24.0, 29.0, 28.0, 33.0, 30.0, 29.0, 31.0, 37.0, 42.0, 30.0, 44.0, 39.0, 45.0, 41.0, 29.0, 46.0, 46.0, 40.0, 34.0, 31.0, 26.0, 21.0, 15.0, 21.0, 14.0, 20.0, 10.0, 15.0, 6.0, 5.0, 6.0, 5.0, 3.0, 4.0, 7.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.07684326171875, -0.0746612548828125, -0.072479248046875, -0.0702972412109375, -0.068115234375, -0.0659332275390625, -0.063751220703125, -0.0615692138671875, -0.05938720703125, -0.0572052001953125, -0.055023193359375, -0.0528411865234375, -0.0506591796875, -0.0484771728515625, -0.046295166015625, -0.0441131591796875, -0.04193115234375, -0.0397491455078125, -0.037567138671875, -0.0353851318359375, -0.033203125, -0.0310211181640625, -0.028839111328125, -0.0266571044921875, -0.02447509765625, -0.0222930908203125, -0.020111083984375, -0.0179290771484375, -0.0157470703125, -0.0135650634765625, -0.011383056640625, -0.0092010498046875, -0.00701904296875, -0.0048370361328125, -0.002655029296875, -0.0004730224609375, 0.001708984375, 0.0038909912109375, 0.006072998046875, 0.0082550048828125, 0.01043701171875, 0.0126190185546875, 0.014801025390625, 0.0169830322265625, 0.0191650390625, 0.0213470458984375, 0.023529052734375, 0.0257110595703125, 0.02789306640625, 0.0300750732421875, 0.032257080078125, 0.0344390869140625, 0.03662109375, 0.0388031005859375, 0.040985107421875, 0.0431671142578125, 0.04534912109375, 0.0475311279296875, 0.049713134765625, 0.0518951416015625, 0.0540771484375, 0.0562591552734375, 0.058441162109375, 0.0606231689453125, 0.06280517578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 1.0, 4.0, 3.0, 9.0, 7.0, 13.0, 14.0, 22.0, 29.0, 41.0, 69.0, 84.0, 103.0, 128.0, 237.0, 302.0, 494.0, 856.0, 1665.0, 3319.0, 8112.0, 21181.0, 68673.0, 299678.0, 2198609.0, 1310268.0, 201395.0, 50005.0, 16259.0, 6216.0, 2842.0, 1408.0, 796.0, 446.0, 272.0, 213.0, 119.0, 97.0, 84.0, 66.0, 35.0, 32.0, 21.0, 13.0, 11.0, 10.0, 6.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.2900390625, -0.2817230224609375, -0.273406982421875, -0.2650909423828125, -0.25677490234375, -0.2484588623046875, -0.240142822265625, -0.2318267822265625, -0.2235107421875, -0.2151947021484375, -0.206878662109375, -0.1985626220703125, -0.19024658203125, -0.1819305419921875, -0.173614501953125, -0.1652984619140625, -0.156982421875, -0.1486663818359375, -0.140350341796875, -0.1320343017578125, -0.12371826171875, -0.1154022216796875, -0.107086181640625, -0.0987701416015625, -0.0904541015625, -0.0821380615234375, -0.073822021484375, -0.0655059814453125, -0.05718994140625, -0.0488739013671875, -0.040557861328125, -0.0322418212890625, -0.02392578125, -0.0156097412109375, -0.007293701171875, 0.0010223388671875, 0.00933837890625, 0.0176544189453125, 0.025970458984375, 0.0342864990234375, 0.0426025390625, 0.0509185791015625, 0.059234619140625, 0.0675506591796875, 0.07586669921875, 0.0841827392578125, 0.092498779296875, 0.1008148193359375, 0.109130859375, 0.1174468994140625, 0.125762939453125, 0.1340789794921875, 0.14239501953125, 0.1507110595703125, 0.159027099609375, 0.1673431396484375, 0.1756591796875, 0.1839752197265625, 0.192291259765625, 0.2006072998046875, 0.20892333984375, 0.2172393798828125, 0.225555419921875, 0.2338714599609375, 0.2421875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 9.0, 12.0, 14.0, 29.0, 66.0, 86.0, 176.0, 339.0, 704.0, 1248.0, 685.0, 327.0, 156.0, 94.0, 50.0, 30.0, 13.0, 12.0, 10.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2081298828125, -0.19922828674316406, -0.19032669067382812, -0.1814250946044922, -0.17252349853515625, -0.1636219024658203, -0.15472030639648438, -0.14581871032714844, -0.1369171142578125, -0.12801551818847656, -0.11911392211914062, -0.11021232604980469, -0.10131072998046875, -0.09240913391113281, -0.08350753784179688, -0.07460594177246094, -0.065704345703125, -0.05680274963378906, -0.047901153564453125, -0.03899955749511719, -0.03009796142578125, -0.021196365356445312, -0.012294769287109375, -0.0033931732177734375, 0.0055084228515625, 0.014410018920898438, 0.023311614990234375, 0.03221321105957031, 0.04111480712890625, 0.05001640319824219, 0.058917999267578125, 0.06781959533691406, 0.07672119140625, 0.08562278747558594, 0.09452438354492188, 0.10342597961425781, 0.11232757568359375, 0.12122917175292969, 0.13013076782226562, 0.13903236389160156, 0.1479339599609375, 0.15683555603027344, 0.16573715209960938, 0.1746387481689453, 0.18354034423828125, 0.1924419403076172, 0.20134353637695312, 0.21024513244628906, 0.219146728515625, 0.22804832458496094, 0.23694992065429688, 0.2458515167236328, 0.25475311279296875, 0.2636547088623047, 0.2725563049316406, 0.28145790100097656, 0.2903594970703125, 0.29926109313964844, 0.3081626892089844, 0.3170642852783203, 0.32596588134765625, 0.3348674774169922, 0.3437690734863281, 0.35267066955566406, 0.361572265625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 3.0, 20.0, 16.0, 29.0, 32.0, 47.0, 66.0, 62.0, 82.0, 105.0, 107.0, 86.0, 88.0, 74.0, 52.0, 37.0, 38.0, 16.0, 17.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9097804427146912, -0.8842428922653198, -0.8587054014205933, -0.8331679105758667, -0.8076303601264954, -0.782092809677124, -0.7565553188323975, -0.7310178279876709, -0.7054802775382996, -0.6799427270889282, -0.6544052362442017, -0.6288677453994751, -0.6033301949501038, -0.5777926445007324, -0.5522551536560059, -0.5267176628112793, -0.501180112361908, -0.475642591714859, -0.45010507106781006, -0.4245675504207611, -0.39903002977371216, -0.3734925091266632, -0.34795498847961426, -0.3224174678325653, -0.29687994718551636, -0.2713424265384674, -0.24580490589141846, -0.2202673852443695, -0.19472986459732056, -0.1691923439502716, -0.14365482330322266, -0.1181173026561737, -0.09257972240447998, -0.06704220175743103, -0.04150468111038208, -0.01596716046333313, 0.00957036018371582, 0.03510788083076477, 0.06064540147781372, 0.08618292212486267, 0.11172044277191162, 0.13725796341896057, 0.16279548406600952, 0.18833300471305847, 0.21387052536010742, 0.23940804600715637, 0.2649455666542053, 0.2904830873012543, 0.3160206079483032, 0.3415581285953522, 0.3670956492424011, 0.3926331698894501, 0.418170690536499, 0.443708211183548, 0.4692457318305969, 0.4947832524776459, 0.5203207731246948, 0.5458582639694214, 0.5713958144187927, 0.5969333648681641, 0.6224708557128906, 0.6480083465576172, 0.6735458970069885, 0.6990834474563599, 0.7246209383010864]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 10.0, 9.0, 5.0, 9.0, 11.0, 11.0, 12.0, 21.0, 17.0, 31.0, 24.0, 32.0, 25.0, 36.0, 49.0, 43.0, 36.0, 34.0, 39.0, 55.0, 41.0, 52.0, 39.0, 30.0, 47.0, 43.0, 34.0, 25.0, 22.0, 31.0, 19.0, 20.0, 15.0, 15.0, 18.0, 10.0, 7.0, 6.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5010194182395935, -0.48457351326942444, -0.46812760829925537, -0.4516817033290863, -0.43523579835891724, -0.41878989338874817, -0.4023439884185791, -0.3858981132507324, -0.36945217847824097, -0.3530062735080719, -0.33656036853790283, -0.32011446356773376, -0.3036685585975647, -0.28722265362739563, -0.27077674865722656, -0.2543308734893799, -0.23788496851921082, -0.22143906354904175, -0.20499315857887268, -0.1885472536087036, -0.17210134863853455, -0.15565544366836548, -0.1392095535993576, -0.12276364862918854, -0.10631774365901947, -0.0898718386888504, -0.07342593371868134, -0.056980036199092865, -0.0405341312289238, -0.02408822625875473, -0.00764232873916626, 0.008803576231002808, 0.025249481201171875, 0.04169538617134094, 0.05814128741621971, 0.07458718866109848, 0.09103309363126755, 0.10747899860143661, 0.12392489612102509, 0.14037080109119415, 0.15681670606136322, 0.1732626110315323, 0.18970851600170135, 0.20615440607070923, 0.2226003110408783, 0.23904621601104736, 0.25549212098121643, 0.2719380259513855, 0.28838393092155457, 0.30482983589172363, 0.3212757408618927, 0.33772164583206177, 0.35416755080223083, 0.3706134557723999, 0.3870593309402466, 0.40350526571273804, 0.4199511408805847, 0.4363970458507538, 0.45284295082092285, 0.4692888557910919, 0.485734760761261, 0.5021806359291077, 0.5186265707015991, 0.5350724458694458, 0.5515183806419373]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 19.0, 28.0, 32.0, 66.0, 95.0, 163.0, 227.0, 377.0, 628.0, 967.0, 1521.0, 2501.0, 3980.0, 6238.0, 10748.0, 17928.0, 30591.0, 53213.0, 95177.0, 186100.0, 269349.0, 164743.0, 85864.0, 48248.0, 27996.0, 16326.0, 9818.0, 5924.0, 3693.0, 2240.0, 1335.0, 906.0, 552.0, 343.0, 230.0, 130.0, 78.0, 71.0, 32.0, 20.0, 18.0, 10.0, 9.0, 7.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.10833740234375, -0.10518932342529297, -0.10204124450683594, -0.0988931655883789, -0.09574508666992188, -0.09259700775146484, -0.08944892883300781, -0.08630084991455078, -0.08315277099609375, -0.08000469207763672, -0.07685661315917969, -0.07370853424072266, -0.07056045532226562, -0.0674123764038086, -0.06426429748535156, -0.06111621856689453, -0.0579681396484375, -0.05482006072998047, -0.05167198181152344, -0.048523902893066406, -0.045375823974609375, -0.042227745056152344, -0.03907966613769531, -0.03593158721923828, -0.03278350830078125, -0.02963542938232422, -0.026487350463867188, -0.023339271545410156, -0.020191192626953125, -0.017043113708496094, -0.013895034790039062, -0.010746955871582031, -0.007598876953125, -0.004450798034667969, -0.0013027191162109375, 0.0018453598022460938, 0.004993438720703125, 0.008141517639160156, 0.011289596557617188, 0.014437675476074219, 0.01758575439453125, 0.02073383331298828, 0.023881912231445312, 0.027029991149902344, 0.030178070068359375, 0.033326148986816406, 0.03647422790527344, 0.03962230682373047, 0.0427703857421875, 0.04591846466064453, 0.04906654357910156, 0.052214622497558594, 0.055362701416015625, 0.058510780334472656, 0.06165885925292969, 0.06480693817138672, 0.06795501708984375, 0.07110309600830078, 0.07425117492675781, 0.07739925384521484, 0.08054733276367188, 0.0836954116821289, 0.08684349060058594, 0.08999156951904297, 0.0931396484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 5.0, 3.0, 3.0, 8.0, 9.0, 8.0, 10.0, 17.0, 27.0, 17.0, 22.0, 30.0, 26.0, 37.0, 26.0, 39.0, 45.0, 43.0, 42.0, 60.0, 45.0, 50.0, 42.0, 36.0, 42.0, 35.0, 34.0, 39.0, 31.0, 17.0, 24.0, 24.0, 19.0, 14.0, 14.0, 9.0, 9.0, 9.0, 9.0, 5.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0858154296875, -0.0832672119140625, -0.080718994140625, -0.0781707763671875, -0.07562255859375, -0.0730743408203125, -0.070526123046875, -0.0679779052734375, -0.0654296875, -0.0628814697265625, -0.060333251953125, -0.0577850341796875, -0.05523681640625, -0.0526885986328125, -0.050140380859375, -0.0475921630859375, -0.0450439453125, -0.0424957275390625, -0.039947509765625, -0.0373992919921875, -0.03485107421875, -0.0323028564453125, -0.029754638671875, -0.0272064208984375, -0.024658203125, -0.0221099853515625, -0.019561767578125, -0.0170135498046875, -0.01446533203125, -0.0119171142578125, -0.009368896484375, -0.0068206787109375, -0.0042724609375, -0.0017242431640625, 0.000823974609375, 0.0033721923828125, 0.00592041015625, 0.0084686279296875, 0.011016845703125, 0.0135650634765625, 0.01611328125, 0.0186614990234375, 0.021209716796875, 0.0237579345703125, 0.02630615234375, 0.0288543701171875, 0.031402587890625, 0.0339508056640625, 0.0364990234375, 0.0390472412109375, 0.041595458984375, 0.0441436767578125, 0.04669189453125, 0.0492401123046875, 0.051788330078125, 0.0543365478515625, 0.056884765625, 0.0594329833984375, 0.061981201171875, 0.0645294189453125, 0.06707763671875, 0.0696258544921875, 0.072174072265625, 0.0747222900390625, 0.0772705078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 11.0, 9.0, 14.0, 17.0, 21.0, 26.0, 48.0, 72.0, 144.0, 373.0, 1423.0, 6707.0, 40979.0, 512635.0, 441867.0, 36132.0, 6072.0, 1299.0, 336.0, 124.0, 80.0, 54.0, 20.0, 25.0, 19.0, 11.0, 9.0, 6.0, 6.0, 4.0, 1.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31103515625, -0.29749298095703125, -0.2839508056640625, -0.27040863037109375, -0.256866455078125, -0.24332427978515625, -0.2297821044921875, -0.21623992919921875, -0.20269775390625, -0.18915557861328125, -0.1756134033203125, -0.16207122802734375, -0.148529052734375, -0.13498687744140625, -0.1214447021484375, -0.10790252685546875, -0.0943603515625, -0.08081817626953125, -0.0672760009765625, -0.05373382568359375, -0.040191650390625, -0.02664947509765625, -0.0131072998046875, 0.00043487548828125, 0.01397705078125, 0.02751922607421875, 0.0410614013671875, 0.05460357666015625, 0.068145751953125, 0.08168792724609375, 0.0952301025390625, 0.10877227783203125, 0.122314453125, 0.13585662841796875, 0.1493988037109375, 0.16294097900390625, 0.176483154296875, 0.19002532958984375, 0.2035675048828125, 0.21710968017578125, 0.23065185546875, 0.24419403076171875, 0.2577362060546875, 0.27127838134765625, 0.284820556640625, 0.29836273193359375, 0.3119049072265625, 0.32544708251953125, 0.3389892578125, 0.35253143310546875, 0.3660736083984375, 0.37961578369140625, 0.393157958984375, 0.40670013427734375, 0.4202423095703125, 0.43378448486328125, 0.44732666015625, 0.46086883544921875, 0.4744110107421875, 0.48795318603515625, 0.501495361328125, 0.5150375366210938, 0.5285797119140625, 0.5421218872070312, 0.5556640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 6.0, 3.0, 6.0, 10.0, 13.0, 10.0, 16.0, 21.0, 16.0, 26.0, 31.0, 35.0, 43.0, 53.0, 46.0, 47.0, 48.0, 59.0, 62.0, 63.0, 57.0, 48.0, 58.0, 40.0, 39.0, 30.0, 18.0, 17.0, 23.0, 16.0, 6.0, 12.0, 8.0, 9.0, 1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38818359375, -0.37804412841796875, -0.3679046630859375, -0.35776519775390625, -0.347625732421875, -0.33748626708984375, -0.3273468017578125, -0.31720733642578125, -0.30706787109375, -0.29692840576171875, -0.2867889404296875, -0.27664947509765625, -0.266510009765625, -0.25637054443359375, -0.2462310791015625, -0.23609161376953125, -0.2259521484375, -0.21581268310546875, -0.2056732177734375, -0.19553375244140625, -0.185394287109375, -0.17525482177734375, -0.1651153564453125, -0.15497589111328125, -0.14483642578125, -0.13469696044921875, -0.1245574951171875, -0.11441802978515625, -0.104278564453125, -0.09413909912109375, -0.0839996337890625, -0.07386016845703125, -0.063720703125, -0.05358123779296875, -0.0434417724609375, -0.03330230712890625, -0.023162841796875, -0.01302337646484375, -0.0028839111328125, 0.00725555419921875, 0.01739501953125, 0.02753448486328125, 0.0376739501953125, 0.04781341552734375, 0.057952880859375, 0.06809234619140625, 0.0782318115234375, 0.08837127685546875, 0.0985107421875, 0.10865020751953125, 0.1187896728515625, 0.12892913818359375, 0.139068603515625, 0.14920806884765625, 0.1593475341796875, 0.16948699951171875, 0.17962646484375, 0.18976593017578125, 0.1999053955078125, 0.21004486083984375, 0.220184326171875, 0.23032379150390625, 0.2404632568359375, 0.25060272216796875, 0.2607421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 9.0, 20.0, 26.0, 38.0, 58.0, 78.0, 150.0, 247.0, 329.0, 521.0, 818.0, 1411.0, 2263.0, 3786.0, 6605.0, 10928.0, 18431.0, 30251.0, 50395.0, 90707.0, 214321.0, 309923.0, 139188.0, 68053.0, 39716.0, 24255.0, 14456.0, 8544.0, 5197.0, 3037.0, 1809.0, 1078.0, 699.0, 449.0, 279.0, 161.0, 111.0, 61.0, 47.0, 26.0, 15.0, 9.0, 19.0, 10.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.06005859375, -0.05813789367675781, -0.056217193603515625, -0.05429649353027344, -0.05237579345703125, -0.05045509338378906, -0.048534393310546875, -0.04661369323730469, -0.0446929931640625, -0.04277229309082031, -0.040851593017578125, -0.03893089294433594, -0.03701019287109375, -0.03508949279785156, -0.033168792724609375, -0.031248092651367188, -0.029327392578125, -0.027406692504882812, -0.025485992431640625, -0.023565292358398438, -0.02164459228515625, -0.019723892211914062, -0.017803192138671875, -0.015882492065429688, -0.0139617919921875, -0.012041091918945312, -0.010120391845703125, -0.008199691772460938, -0.00627899169921875, -0.0043582916259765625, -0.002437591552734375, -0.0005168914794921875, 0.00140380859375, 0.0033245086669921875, 0.005245208740234375, 0.0071659088134765625, 0.00908660888671875, 0.011007308959960938, 0.012928009033203125, 0.014848709106445312, 0.0167694091796875, 0.018690109252929688, 0.020610809326171875, 0.022531509399414062, 0.02445220947265625, 0.026372909545898438, 0.028293609619140625, 0.030214309692382812, 0.032135009765625, 0.03405570983886719, 0.035976409912109375, 0.03789710998535156, 0.03981781005859375, 0.04173851013183594, 0.043659210205078125, 0.04557991027832031, 0.0475006103515625, 0.04942131042480469, 0.051342010498046875, 0.05326271057128906, 0.05518341064453125, 0.05710411071777344, 0.059024810791015625, 0.06094551086425781, 0.0628662109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 10.0, 9.0, 13.0, 10.0, 7.0, 19.0, 22.0, 19.0, 22.0, 33.0, 51.0, 62.0, 60.0, 57.0, 80.0, 75.0, 73.0, 69.0, 59.0, 58.0, 33.0, 33.0, 24.0, 18.0, 12.0, 14.0, 9.0, 8.0, 6.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.9490718841552734e-05, -1.887138932943344e-05, -1.8252059817314148e-05, -1.7632730305194855e-05, -1.701340079307556e-05, -1.639407128095627e-05, -1.5774741768836975e-05, -1.5155412256717682e-05, -1.4536082744598389e-05, -1.3916753232479095e-05, -1.3297423720359802e-05, -1.2678094208240509e-05, -1.2058764696121216e-05, -1.1439435184001923e-05, -1.082010567188263e-05, -1.0200776159763336e-05, -9.581446647644043e-06, -8.96211713552475e-06, -8.342787623405457e-06, -7.723458111286163e-06, -7.10412859916687e-06, -6.484799087047577e-06, -5.865469574928284e-06, -5.2461400628089905e-06, -4.626810550689697e-06, -4.007481038570404e-06, -3.388151526451111e-06, -2.7688220143318176e-06, -2.1494925022125244e-06, -1.5301629900932312e-06, -9.10833477973938e-07, -2.915039658546448e-07, 3.2782554626464844e-07, 9.471550583839417e-07, 1.5664845705032349e-06, 2.185814082622528e-06, 2.8051435947418213e-06, 3.4244731068611145e-06, 4.043802618980408e-06, 4.663132131099701e-06, 5.282461643218994e-06, 5.901791155338287e-06, 6.5211206674575806e-06, 7.140450179576874e-06, 7.759779691696167e-06, 8.37910920381546e-06, 8.998438715934753e-06, 9.617768228054047e-06, 1.023709774017334e-05, 1.0856427252292633e-05, 1.1475756764411926e-05, 1.209508627653122e-05, 1.2714415788650513e-05, 1.3333745300769806e-05, 1.3953074812889099e-05, 1.4572404325008392e-05, 1.5191733837127686e-05, 1.581106334924698e-05, 1.6430392861366272e-05, 1.7049722373485565e-05, 1.766905188560486e-05, 1.828838139772415e-05, 1.8907710909843445e-05, 1.9527040421962738e-05, 2.014636993408203e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 14.0, 18.0, 16.0, 45.0, 54.0, 76.0, 149.0, 212.0, 470.0, 1131.0, 3442.0, 12577.0, 49333.0, 200210.0, 593471.0, 138040.0, 35612.0, 9197.0, 2668.0, 879.0, 413.0, 213.0, 125.0, 64.0, 42.0, 23.0, 21.0, 11.0, 8.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13232421875, -0.12730789184570312, -0.12229156494140625, -0.11727523803710938, -0.1122589111328125, -0.10724258422851562, -0.10222625732421875, -0.09720993041992188, -0.092193603515625, -0.08717727661132812, -0.08216094970703125, -0.07714462280273438, -0.0721282958984375, -0.06711196899414062, -0.06209564208984375, -0.057079315185546875, -0.05206298828125, -0.047046661376953125, -0.04203033447265625, -0.037014007568359375, -0.0319976806640625, -0.026981353759765625, -0.02196502685546875, -0.016948699951171875, -0.011932373046875, -0.006916046142578125, -0.00189971923828125, 0.003116607666015625, 0.0081329345703125, 0.013149261474609375, 0.01816558837890625, 0.023181915283203125, 0.0281982421875, 0.033214569091796875, 0.03823089599609375, 0.043247222900390625, 0.0482635498046875, 0.053279876708984375, 0.05829620361328125, 0.06331253051757812, 0.068328857421875, 0.07334518432617188, 0.07836151123046875, 0.08337783813476562, 0.0883941650390625, 0.09341049194335938, 0.09842681884765625, 0.10344314575195312, 0.10845947265625, 0.11347579956054688, 0.11849212646484375, 0.12350845336914062, 0.1285247802734375, 0.13354110717773438, 0.13855743408203125, 0.14357376098632812, 0.148590087890625, 0.15360641479492188, 0.15862274169921875, 0.16363906860351562, 0.1686553955078125, 0.17367172241210938, 0.17868804931640625, 0.18370437622070312, 0.188720703125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 2.0, 7.0, 10.0, 11.0, 13.0, 19.0, 15.0, 26.0, 38.0, 49.0, 55.0, 76.0, 98.0, 129.0, 111.0, 75.0, 46.0, 54.0, 28.0, 28.0, 19.0, 19.0, 14.0, 13.0, 15.0, 3.0, 2.0, 6.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08697509765625, -0.08394336700439453, -0.08091163635253906, -0.0778799057006836, -0.07484817504882812, -0.07181644439697266, -0.06878471374511719, -0.06575298309326172, -0.06272125244140625, -0.05968952178955078, -0.05665779113769531, -0.053626060485839844, -0.050594329833984375, -0.047562599182128906, -0.04453086853027344, -0.04149913787841797, -0.0384674072265625, -0.03543567657470703, -0.03240394592285156, -0.029372215270996094, -0.026340484619140625, -0.023308753967285156, -0.020277023315429688, -0.01724529266357422, -0.01421356201171875, -0.011181831359863281, -0.008150100708007812, -0.005118370056152344, -0.002086639404296875, 0.0009450912475585938, 0.0039768218994140625, 0.007008552551269531, 0.010040283203125, 0.013072013854980469, 0.016103744506835938, 0.019135475158691406, 0.022167205810546875, 0.025198936462402344, 0.028230667114257812, 0.03126239776611328, 0.03429412841796875, 0.03732585906982422, 0.04035758972167969, 0.043389320373535156, 0.046421051025390625, 0.049452781677246094, 0.05248451232910156, 0.05551624298095703, 0.0585479736328125, 0.06157970428466797, 0.06461143493652344, 0.0676431655883789, 0.07067489624023438, 0.07370662689208984, 0.07673835754394531, 0.07977008819580078, 0.08280181884765625, 0.08583354949951172, 0.08886528015136719, 0.09189701080322266, 0.09492874145507812, 0.0979604721069336, 0.10099220275878906, 0.10402393341064453, 0.1070556640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 7.0, 17.0, 26.0, 61.0, 113.0, 169.0, 217.0, 182.0, 124.0, 63.0, 24.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6537616848945618, -0.5969516634941101, -0.5401415824890137, -0.483331561088562, -0.42652150988578796, -0.3697114586830139, -0.31290143728256226, -0.2560913860797882, -0.19928133487701416, -0.1424712836742401, -0.08566124737262726, -0.028851211071014404, 0.027958840131759644, 0.08476889133453369, 0.14157891273498535, 0.1983889639377594, 0.25519901514053345, 0.3120090663433075, 0.36881911754608154, 0.4256291389465332, 0.48243919014930725, 0.5392492413520813, 0.596059262752533, 0.6528693437576294, 0.709679365158081, 0.7664893865585327, 0.8232994675636292, 0.8801094889640808, 0.9369195699691772, 0.9937295913696289, 1.0505396127700806, 1.1073496341705322, 1.1641597747802734, 1.220969796180725, 1.2777798175811768, 1.334589958190918, 1.3913999795913696, 1.4482100009918213, 1.505020022392273, 1.5618300437927246, 1.6186401844024658, 1.6754502058029175, 1.7322602272033691, 1.7890703678131104, 1.845880389213562, 1.9026904106140137, 1.9595004320144653, 2.016310453414917, 2.073120594024658, 2.1299307346343994, 2.1867406368255615, 2.2435507774353027, 2.300360679626465, 2.357170820236206, 2.4139809608459473, 2.4707908630371094, 2.5276007652282715, 2.5844109058380127, 2.641220808029175, 2.698030948638916, 2.754840850830078, 2.8116509914398193, 2.8684611320495605, 2.9252710342407227, 2.982081174850464]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 9.0, 4.0, 5.0, 9.0, 12.0, 15.0, 14.0, 14.0, 22.0, 28.0, 18.0, 30.0, 33.0, 32.0, 22.0, 31.0, 32.0, 36.0, 42.0, 50.0, 40.0, 34.0, 34.0, 34.0, 33.0, 38.0, 37.0, 38.0, 25.0, 31.0, 32.0, 19.0, 16.0, 18.0, 10.0, 20.0, 15.0, 12.0, 7.0, 8.0, 10.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5651933550834656, -0.5453123450279236, -0.5254312753677368, -0.5055502653121948, -0.48566919565200806, -0.46578818559646606, -0.4459071457386017, -0.4260261058807373, -0.4061450660228729, -0.38626402616500854, -0.36638298630714417, -0.3465019464492798, -0.3266209363937378, -0.306739866733551, -0.28685885667800903, -0.26697781682014465, -0.24709677696228027, -0.2272157371044159, -0.2073346972465515, -0.18745367228984833, -0.16757263243198395, -0.14769159257411957, -0.12781056761741638, -0.107929527759552, -0.08804848790168762, -0.06816744804382324, -0.04828641563653946, -0.028405379503965378, -0.008524343371391296, 0.011356696486473083, 0.031237728893756866, 0.05111876130104065, 0.07099980115890503, 0.09088084101676941, 0.11076187342405319, 0.13064290583133698, 0.15052394568920135, 0.17040498554706573, 0.19028601050376892, 0.2101670503616333, 0.23004809021949768, 0.24992913007736206, 0.26981016993522644, 0.2896912097930908, 0.3095722198486328, 0.3294532895088196, 0.3493342995643616, 0.36921533942222595, 0.38909637928009033, 0.4089774191379547, 0.4288584589958191, 0.44873949885368347, 0.46862053871154785, 0.48850154876708984, 0.5083826184272766, 0.5282636284828186, 0.5481446981430054, 0.5680257081985474, 0.5879067778587341, 0.6077877879142761, 0.6276688575744629, 0.6475498676300049, 0.6674309372901917, 0.6873119473457336, 0.7071929574012756]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 18.0, 18.0, 29.0, 39.0, 35.0, 78.0, 88.0, 108.0, 202.0, 306.0, 473.0, 728.0, 1211.0, 2159.0, 3658.0, 6483.0, 12374.0, 25758.0, 57899.0, 150253.0, 495527.0, 2043889.0, 979325.0, 249045.0, 89441.0, 37592.0, 17332.0, 8777.0, 4716.0, 2696.0, 1543.0, 829.0, 578.0, 365.0, 206.0, 160.0, 91.0, 70.0, 42.0, 31.0, 28.0, 17.0, 19.0, 9.0, 6.0, 9.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.1179208755493164, -0.11395454406738281, -0.10998821258544922, -0.10602188110351562, -0.10205554962158203, -0.09808921813964844, -0.09412288665771484, -0.09015655517578125, -0.08619022369384766, -0.08222389221191406, -0.07825756072998047, -0.07429122924804688, -0.07032489776611328, -0.06635856628417969, -0.062392234802246094, -0.0584259033203125, -0.054459571838378906, -0.05049324035644531, -0.04652690887451172, -0.042560577392578125, -0.03859424591064453, -0.03462791442871094, -0.030661582946777344, -0.02669525146484375, -0.022728919982910156, -0.018762588500976562, -0.014796257019042969, -0.010829925537109375, -0.006863594055175781, -0.0028972625732421875, 0.0010690689086914062, 0.005035400390625, 0.009001731872558594, 0.012968063354492188, 0.01693439483642578, 0.020900726318359375, 0.02486705780029297, 0.028833389282226562, 0.032799720764160156, 0.03676605224609375, 0.040732383728027344, 0.04469871520996094, 0.04866504669189453, 0.052631378173828125, 0.05659770965576172, 0.06056404113769531, 0.0645303726196289, 0.0684967041015625, 0.0724630355834961, 0.07642936706542969, 0.08039569854736328, 0.08436203002929688, 0.08832836151123047, 0.09229469299316406, 0.09626102447509766, 0.10022735595703125, 0.10419368743896484, 0.10816001892089844, 0.11212635040283203, 0.11609268188476562, 0.12005901336669922, 0.12402534484863281, 0.1279916763305664, 0.1319580078125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 4.0, 2.0, 7.0, 10.0, 9.0, 9.0, 14.0, 17.0, 20.0, 10.0, 29.0, 31.0, 34.0, 30.0, 20.0, 36.0, 41.0, 33.0, 48.0, 50.0, 34.0, 49.0, 47.0, 42.0, 35.0, 46.0, 28.0, 26.0, 32.0, 28.0, 19.0, 21.0, 25.0, 18.0, 11.0, 13.0, 14.0, 7.0, 6.0, 7.0, 9.0, 3.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.08343505859375, -0.08101940155029297, -0.07860374450683594, -0.0761880874633789, -0.07377243041992188, -0.07135677337646484, -0.06894111633300781, -0.06652545928955078, -0.06410980224609375, -0.06169414520263672, -0.05927848815917969, -0.056862831115722656, -0.054447174072265625, -0.052031517028808594, -0.04961585998535156, -0.04720020294189453, -0.0447845458984375, -0.04236888885498047, -0.03995323181152344, -0.037537574768066406, -0.035121917724609375, -0.032706260681152344, -0.030290603637695312, -0.02787494659423828, -0.02545928955078125, -0.02304363250732422, -0.020627975463867188, -0.018212318420410156, -0.015796661376953125, -0.013381004333496094, -0.010965347290039062, -0.008549690246582031, -0.006134033203125, -0.0037183761596679688, -0.0013027191162109375, 0.0011129379272460938, 0.003528594970703125, 0.005944252014160156, 0.008359909057617188, 0.010775566101074219, 0.01319122314453125, 0.015606880187988281, 0.018022537231445312, 0.020438194274902344, 0.022853851318359375, 0.025269508361816406, 0.027685165405273438, 0.03010082244873047, 0.0325164794921875, 0.03493213653564453, 0.03734779357910156, 0.039763450622558594, 0.042179107666015625, 0.044594764709472656, 0.04701042175292969, 0.04942607879638672, 0.05184173583984375, 0.05425739288330078, 0.05667304992675781, 0.059088706970214844, 0.061504364013671875, 0.0639200210571289, 0.06633567810058594, 0.06875133514404297, 0.0711669921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 3.0, 5.0, 7.0, 13.0, 22.0, 35.0, 42.0, 70.0, 93.0, 125.0, 243.0, 397.0, 661.0, 1244.0, 2470.0, 5229.0, 12201.0, 31351.0, 96724.0, 364841.0, 2061741.0, 1262474.0, 243681.0, 69194.0, 23538.0, 9379.0, 3969.0, 1971.0, 1057.0, 544.0, 330.0, 212.0, 125.0, 90.0, 55.0, 37.0, 29.0, 24.0, 11.0, 14.0, 11.0, 8.0, 4.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.25830078125, -0.25089073181152344, -0.24348068237304688, -0.2360706329345703, -0.22866058349609375, -0.2212505340576172, -0.21384048461914062, -0.20643043518066406, -0.1990203857421875, -0.19161033630371094, -0.18420028686523438, -0.1767902374267578, -0.16938018798828125, -0.1619701385498047, -0.15456008911132812, -0.14715003967285156, -0.139739990234375, -0.13232994079589844, -0.12491989135742188, -0.11750984191894531, -0.11009979248046875, -0.10268974304199219, -0.09527969360351562, -0.08786964416503906, -0.0804595947265625, -0.07304954528808594, -0.06563949584960938, -0.05822944641113281, -0.05081939697265625, -0.04340934753417969, -0.035999298095703125, -0.028589248657226562, -0.02117919921875, -0.013769149780273438, -0.006359100341796875, 0.0010509490966796875, 0.00846099853515625, 0.015871047973632812, 0.023281097412109375, 0.030691146850585938, 0.0381011962890625, 0.04551124572753906, 0.052921295166015625, 0.06033134460449219, 0.06774139404296875, 0.07515144348144531, 0.08256149291992188, 0.08997154235839844, 0.097381591796875, 0.10479164123535156, 0.11220169067382812, 0.11961174011230469, 0.12702178955078125, 0.1344318389892578, 0.14184188842773438, 0.14925193786621094, 0.1566619873046875, 0.16407203674316406, 0.17148208618164062, 0.1788921356201172, 0.18630218505859375, 0.1937122344970703, 0.20112228393554688, 0.20853233337402344, 0.2159423828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 7.0, 14.0, 19.0, 21.0, 35.0, 46.0, 76.0, 116.0, 153.0, 285.0, 449.0, 808.0, 783.0, 398.0, 258.0, 184.0, 118.0, 100.0, 55.0, 33.0, 25.0, 20.0, 16.0, 14.0, 8.0, 8.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2064208984375, -0.1990489959716797, -0.19167709350585938, -0.18430519104003906, -0.17693328857421875, -0.16956138610839844, -0.16218948364257812, -0.1548175811767578, -0.1474456787109375, -0.1400737762451172, -0.13270187377929688, -0.12532997131347656, -0.11795806884765625, -0.11058616638183594, -0.10321426391601562, -0.09584236145019531, -0.088470458984375, -0.08109855651855469, -0.07372665405273438, -0.06635475158691406, -0.05898284912109375, -0.05161094665527344, -0.044239044189453125, -0.03686714172363281, -0.0294952392578125, -0.022123336791992188, -0.014751434326171875, -0.0073795318603515625, -7.62939453125e-06, 0.0073642730712890625, 0.014736175537109375, 0.022108078002929688, 0.02947998046875, 0.03685188293457031, 0.044223785400390625, 0.05159568786621094, 0.05896759033203125, 0.06633949279785156, 0.07371139526367188, 0.08108329772949219, 0.0884552001953125, 0.09582710266113281, 0.10319900512695312, 0.11057090759277344, 0.11794281005859375, 0.12531471252441406, 0.13268661499023438, 0.1400585174560547, 0.147430419921875, 0.1548023223876953, 0.16217422485351562, 0.16954612731933594, 0.17691802978515625, 0.18428993225097656, 0.19166183471679688, 0.1990337371826172, 0.2064056396484375, 0.2137775421142578, 0.22114944458007812, 0.22852134704589844, 0.23589324951171875, 0.24326515197753906, 0.2506370544433594, 0.2580089569091797, 0.265380859375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 4.0, 13.0, 20.0, 33.0, 45.0, 58.0, 75.0, 89.0, 103.0, 123.0, 95.0, 96.0, 87.0, 43.0, 47.0, 26.0, 19.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9431825876235962, -0.9066481590270996, -0.870113730430603, -0.8335792422294617, -0.7970448136329651, -0.7605103850364685, -0.7239758968353271, -0.6874414682388306, -0.650907039642334, -0.6143726110458374, -0.5778381824493408, -0.5413036942481995, -0.5047692656517029, -0.4682348370552063, -0.43170037865638733, -0.39516592025756836, -0.3586314916610718, -0.3220970630645752, -0.2855626046657562, -0.24902816116809845, -0.21249371767044067, -0.1759592741727829, -0.13942483067512512, -0.10289037227630615, -0.06635594367980957, -0.029821500182151794, 0.0067129433155059814, 0.04324738681316376, 0.07978183031082153, 0.11631627380847931, 0.15285071730613708, 0.18938517570495605, 0.22591948509216309, 0.26245391368865967, 0.29898837208747864, 0.3355228304862976, 0.3720572590827942, 0.40859168767929077, 0.44512614607810974, 0.4816606044769287, 0.5181950330734253, 0.5547294616699219, 0.5912638902664185, 0.6277983784675598, 0.6643328070640564, 0.700867235660553, 0.7374017238616943, 0.7739361524581909, 0.8104705810546875, 0.8470050096511841, 0.8835394382476807, 0.920073926448822, 0.9566083550453186, 0.9931427836418152, 1.0296772718429565, 1.0662117004394531, 1.1027461290359497, 1.1392805576324463, 1.1758149862289429, 1.2123494148254395, 1.2488839626312256, 1.2854183912277222, 1.3219528198242188, 1.3584872484207153, 1.395021677017212]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 8.0, 8.0, 14.0, 19.0, 18.0, 18.0, 20.0, 23.0, 31.0, 35.0, 30.0, 47.0, 41.0, 41.0, 47.0, 46.0, 37.0, 42.0, 45.0, 39.0, 45.0, 49.0, 40.0, 29.0, 30.0, 16.0, 26.0, 16.0, 19.0, 21.0, 19.0, 20.0, 9.0, 7.0, 8.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6378845572471619, -0.618523895740509, -0.5991631746292114, -0.5798025131225586, -0.560441792011261, -0.5410811305046082, -0.5217204093933105, -0.5023597478866577, -0.4829990565776825, -0.4636383652687073, -0.44427767395973206, -0.42491698265075684, -0.405556321144104, -0.3861956000328064, -0.36683493852615356, -0.34747424721717834, -0.3281135559082031, -0.3087528645992279, -0.2893921732902527, -0.27003148198127747, -0.25067079067230225, -0.23131011426448822, -0.2119494378566742, -0.19258874654769897, -0.17322805523872375, -0.15386736392974854, -0.13450667262077332, -0.11514599621295929, -0.09578530490398407, -0.07642461359500885, -0.05706392973661423, -0.037703245878219604, -0.01834261417388916, 0.001018073409795761, 0.020378760993480682, 0.039739448577165604, 0.059100136160850525, 0.07846082746982574, 0.09782151132822037, 0.11718219518661499, 0.1365428864955902, 0.15590357780456543, 0.17526426911354065, 0.19462494552135468, 0.2139856368303299, 0.23334632813930511, 0.25270700454711914, 0.27206769585609436, 0.2914283871650696, 0.3107890784740448, 0.33014976978302, 0.34951046109199524, 0.36887115240097046, 0.3882318139076233, 0.4075925052165985, 0.42695319652557373, 0.44631388783454895, 0.46567457914352417, 0.4850352704524994, 0.5043959617614746, 0.5237566232681274, 0.543117344379425, 0.5624780058860779, 0.5818387269973755, 0.6011993885040283]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 7.0, 8.0, 9.0, 21.0, 23.0, 39.0, 58.0, 106.0, 147.0, 168.0, 277.0, 470.0, 662.0, 998.0, 1579.0, 2520.0, 3773.0, 6056.0, 9515.0, 15038.0, 24688.0, 40292.0, 69438.0, 129520.0, 251934.0, 223280.0, 111440.0, 61096.0, 35969.0, 22040.0, 13527.0, 8613.0, 5521.0, 3354.0, 2184.0, 1468.0, 920.0, 619.0, 408.0, 246.0, 167.0, 116.0, 91.0, 48.0, 37.0, 17.0, 19.0, 15.0, 5.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1314697265625, -0.12691879272460938, -0.12236785888671875, -0.11781692504882812, -0.1132659912109375, -0.10871505737304688, -0.10416412353515625, -0.09961318969726562, -0.095062255859375, -0.09051132202148438, -0.08596038818359375, -0.08140945434570312, -0.0768585205078125, -0.07230758666992188, -0.06775665283203125, -0.06320571899414062, -0.05865478515625, -0.054103851318359375, -0.04955291748046875, -0.045001983642578125, -0.0404510498046875, -0.035900115966796875, -0.03134918212890625, -0.026798248291015625, -0.022247314453125, -0.017696380615234375, -0.01314544677734375, -0.008594512939453125, -0.0040435791015625, 0.000507354736328125, 0.00505828857421875, 0.009609222412109375, 0.01416015625, 0.018711090087890625, 0.02326202392578125, 0.027812957763671875, 0.0323638916015625, 0.036914825439453125, 0.04146575927734375, 0.046016693115234375, 0.050567626953125, 0.055118560791015625, 0.05966949462890625, 0.06422042846679688, 0.0687713623046875, 0.07332229614257812, 0.07787322998046875, 0.08242416381835938, 0.08697509765625, 0.09152603149414062, 0.09607696533203125, 0.10062789916992188, 0.1051788330078125, 0.10972976684570312, 0.11428070068359375, 0.11883163452148438, 0.123382568359375, 0.12793350219726562, 0.13248443603515625, 0.13703536987304688, 0.1415863037109375, 0.14613723754882812, 0.15068817138671875, 0.15523910522460938, 0.1597900390625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 6.0, 7.0, 8.0, 5.0, 4.0, 5.0, 11.0, 10.0, 13.0, 14.0, 17.0, 17.0, 29.0, 27.0, 39.0, 37.0, 35.0, 49.0, 36.0, 37.0, 51.0, 38.0, 43.0, 35.0, 46.0, 47.0, 37.0, 50.0, 28.0, 44.0, 35.0, 18.0, 23.0, 17.0, 10.0, 15.0, 11.0, 10.0, 8.0, 9.0, 4.0, 6.0, 3.0, 6.0, 2.0, 5.0, 1.0, 0.0, 4.0, 1.0], "bins": [-0.097900390625, -0.09518623352050781, -0.09247207641601562, -0.08975791931152344, -0.08704376220703125, -0.08432960510253906, -0.08161544799804688, -0.07890129089355469, -0.0761871337890625, -0.07347297668457031, -0.07075881958007812, -0.06804466247558594, -0.06533050537109375, -0.06261634826660156, -0.059902191162109375, -0.05718803405761719, -0.054473876953125, -0.05175971984863281, -0.049045562744140625, -0.04633140563964844, -0.04361724853515625, -0.04090309143066406, -0.038188934326171875, -0.03547477722167969, -0.0327606201171875, -0.030046463012695312, -0.027332305908203125, -0.024618148803710938, -0.02190399169921875, -0.019189834594726562, -0.016475677490234375, -0.013761520385742188, -0.01104736328125, -0.008333206176757812, -0.005619049072265625, -0.0029048919677734375, -0.00019073486328125, 0.0025234222412109375, 0.005237579345703125, 0.007951736450195312, 0.0106658935546875, 0.013380050659179688, 0.016094207763671875, 0.018808364868164062, 0.02152252197265625, 0.024236679077148438, 0.026950836181640625, 0.029664993286132812, 0.032379150390625, 0.03509330749511719, 0.037807464599609375, 0.04052162170410156, 0.04323577880859375, 0.04594993591308594, 0.048664093017578125, 0.05137825012207031, 0.0540924072265625, 0.05680656433105469, 0.059520721435546875, 0.06223487854003906, 0.06494903564453125, 0.06766319274902344, 0.07037734985351562, 0.07309150695800781, 0.0758056640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 10.0, 9.0, 7.0, 12.0, 15.0, 26.0, 27.0, 39.0, 39.0, 69.0, 84.0, 104.0, 157.0, 269.0, 517.0, 986.0, 2189.0, 5309.0, 13107.0, 33432.0, 89344.0, 284334.0, 407582.0, 132306.0, 46977.0, 18416.0, 7298.0, 2965.0, 1236.0, 634.0, 347.0, 169.0, 131.0, 97.0, 75.0, 62.0, 36.0, 29.0, 28.0, 13.0, 15.0, 11.0, 10.0, 6.0, 7.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0], "bins": [-0.29638671875, -0.2879619598388672, -0.2795372009277344, -0.27111244201660156, -0.26268768310546875, -0.25426292419433594, -0.24583816528320312, -0.2374134063720703, -0.2289886474609375, -0.2205638885498047, -0.21213912963867188, -0.20371437072753906, -0.19528961181640625, -0.18686485290527344, -0.17844009399414062, -0.1700153350830078, -0.161590576171875, -0.1531658172607422, -0.14474105834960938, -0.13631629943847656, -0.12789154052734375, -0.11946678161621094, -0.11104202270507812, -0.10261726379394531, -0.0941925048828125, -0.08576774597167969, -0.07734298706054688, -0.06891822814941406, -0.06049346923828125, -0.05206871032714844, -0.043643951416015625, -0.03521919250488281, -0.02679443359375, -0.018369674682617188, -0.009944915771484375, -0.0015201568603515625, 0.00690460205078125, 0.015329360961914062, 0.023754119873046875, 0.03217887878417969, 0.0406036376953125, 0.04902839660644531, 0.057453155517578125, 0.06587791442871094, 0.07430267333984375, 0.08272743225097656, 0.09115219116210938, 0.09957695007324219, 0.108001708984375, 0.11642646789550781, 0.12485122680664062, 0.13327598571777344, 0.14170074462890625, 0.15012550354003906, 0.15855026245117188, 0.1669750213623047, 0.1753997802734375, 0.1838245391845703, 0.19224929809570312, 0.20067405700683594, 0.20909881591796875, 0.21752357482910156, 0.22594833374023438, 0.2343730926513672, 0.2427978515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 3.0, 7.0, 6.0, 13.0, 7.0, 16.0, 16.0, 15.0, 20.0, 16.0, 24.0, 25.0, 23.0, 33.0, 32.0, 38.0, 52.0, 46.0, 35.0, 42.0, 34.0, 54.0, 38.0, 45.0, 26.0, 35.0, 34.0, 32.0, 29.0, 25.0, 29.0, 24.0, 21.0, 18.0, 10.0, 12.0, 9.0, 14.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.276611328125, -0.2676277160644531, -0.25864410400390625, -0.24966049194335938, -0.2406768798828125, -0.23169326782226562, -0.22270965576171875, -0.21372604370117188, -0.204742431640625, -0.19575881958007812, -0.18677520751953125, -0.17779159545898438, -0.1688079833984375, -0.15982437133789062, -0.15084075927734375, -0.14185714721679688, -0.13287353515625, -0.12388992309570312, -0.11490631103515625, -0.10592269897460938, -0.0969390869140625, -0.08795547485351562, -0.07897186279296875, -0.06998825073242188, -0.061004638671875, -0.052021026611328125, -0.04303741455078125, -0.034053802490234375, -0.0250701904296875, -0.016086578369140625, -0.00710296630859375, 0.001880645751953125, 0.0108642578125, 0.019847869873046875, 0.02883148193359375, 0.037815093994140625, 0.0467987060546875, 0.055782318115234375, 0.06476593017578125, 0.07374954223632812, 0.082733154296875, 0.09171676635742188, 0.10070037841796875, 0.10968399047851562, 0.1186676025390625, 0.12765121459960938, 0.13663482666015625, 0.14561843872070312, 0.15460205078125, 0.16358566284179688, 0.17256927490234375, 0.18155288696289062, 0.1905364990234375, 0.19952011108398438, 0.20850372314453125, 0.21748733520507812, 0.226470947265625, 0.23545455932617188, 0.24443817138671875, 0.2534217834472656, 0.2624053955078125, 0.2713890075683594, 0.28037261962890625, 0.2893562316894531, 0.29833984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 15.0, 14.0, 29.0, 41.0, 27.0, 72.0, 86.0, 150.0, 251.0, 468.0, 988.0, 2102.0, 5815.0, 17178.0, 57656.0, 238253.0, 539285.0, 132201.0, 35414.0, 11223.0, 4003.0, 1632.0, 704.0, 369.0, 175.0, 119.0, 76.0, 53.0, 41.0, 25.0, 18.0, 21.0, 14.0, 9.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.231689453125, -0.22564125061035156, -0.21959304809570312, -0.2135448455810547, -0.20749664306640625, -0.2014484405517578, -0.19540023803710938, -0.18935203552246094, -0.1833038330078125, -0.17725563049316406, -0.17120742797851562, -0.1651592254638672, -0.15911102294921875, -0.1530628204345703, -0.14701461791992188, -0.14096641540527344, -0.134918212890625, -0.12887001037597656, -0.12282180786132812, -0.11677360534667969, -0.11072540283203125, -0.10467720031738281, -0.09862899780273438, -0.09258079528808594, -0.0865325927734375, -0.08048439025878906, -0.07443618774414062, -0.06838798522949219, -0.06233978271484375, -0.05629158020019531, -0.050243377685546875, -0.04419517517089844, -0.03814697265625, -0.03209877014160156, -0.026050567626953125, -0.020002365112304688, -0.01395416259765625, -0.007905960083007812, -0.001857757568359375, 0.0041904449462890625, 0.0102386474609375, 0.016286849975585938, 0.022335052490234375, 0.028383255004882812, 0.03443145751953125, 0.04047966003417969, 0.046527862548828125, 0.05257606506347656, 0.058624267578125, 0.06467247009277344, 0.07072067260742188, 0.07676887512207031, 0.08281707763671875, 0.08886528015136719, 0.09491348266601562, 0.10096168518066406, 0.1070098876953125, 0.11305809020996094, 0.11910629272460938, 0.1251544952392578, 0.13120269775390625, 0.1372509002685547, 0.14329910278320312, 0.14934730529785156, 0.1553955078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 4.0, 6.0, 6.0, 8.0, 10.0, 16.0, 16.0, 17.0, 31.0, 38.0, 50.0, 65.0, 109.0, 116.0, 98.0, 87.0, 64.0, 48.0, 49.0, 21.0, 22.0, 25.0, 10.0, 18.0, 11.0, 9.0, 6.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.2961368560791016e-05, -3.192666918039322e-05, -3.089196979999542e-05, -2.9857270419597626e-05, -2.882257103919983e-05, -2.7787871658802032e-05, -2.6753172278404236e-05, -2.571847289800644e-05, -2.4683773517608643e-05, -2.3649074137210846e-05, -2.261437475681305e-05, -2.1579675376415253e-05, -2.0544975996017456e-05, -1.951027661561966e-05, -1.8475577235221863e-05, -1.7440877854824066e-05, -1.640617847442627e-05, -1.5371479094028473e-05, -1.4336779713630676e-05, -1.330208033323288e-05, -1.2267380952835083e-05, -1.1232681572437286e-05, -1.019798219203949e-05, -9.163282811641693e-06, -8.128583431243896e-06, -7.0938840508461e-06, -6.059184670448303e-06, -5.024485290050507e-06, -3.98978590965271e-06, -2.9550865292549133e-06, -1.9203871488571167e-06, -8.856877684593201e-07, 1.4901161193847656e-07, 1.1837109923362732e-06, 2.21841037273407e-06, 3.2531097531318665e-06, 4.287809133529663e-06, 5.32250851392746e-06, 6.357207894325256e-06, 7.391907274723053e-06, 8.42660665512085e-06, 9.461306035518646e-06, 1.0496005415916443e-05, 1.153070479631424e-05, 1.2565404176712036e-05, 1.3600103557109833e-05, 1.463480293750763e-05, 1.5669502317905426e-05, 1.6704201698303223e-05, 1.773890107870102e-05, 1.8773600459098816e-05, 1.9808299839496613e-05, 2.084299921989441e-05, 2.1877698600292206e-05, 2.2912397980690002e-05, 2.39470973610878e-05, 2.4981796741485596e-05, 2.6016496121883392e-05, 2.705119550228119e-05, 2.8085894882678986e-05, 2.9120594263076782e-05, 3.015529364347458e-05, 3.1189993023872375e-05, 3.222469240427017e-05, 3.325939178466797e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 18.0, 14.0, 24.0, 25.0, 47.0, 81.0, 149.0, 302.0, 759.0, 1772.0, 4772.0, 18098.0, 99817.0, 588102.0, 276911.0, 43277.0, 9391.0, 2882.0, 1108.0, 481.0, 212.0, 118.0, 68.0, 35.0, 15.0, 14.0, 11.0, 12.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.226806640625, -0.2194347381591797, -0.21206283569335938, -0.20469093322753906, -0.19731903076171875, -0.18994712829589844, -0.18257522583007812, -0.1752033233642578, -0.1678314208984375, -0.1604595184326172, -0.15308761596679688, -0.14571571350097656, -0.13834381103515625, -0.13097190856933594, -0.12360000610351562, -0.11622810363769531, -0.108856201171875, -0.10148429870605469, -0.09411239624023438, -0.08674049377441406, -0.07936859130859375, -0.07199668884277344, -0.06462478637695312, -0.05725288391113281, -0.0498809814453125, -0.04250907897949219, -0.035137176513671875, -0.027765274047851562, -0.02039337158203125, -0.013021469116210938, -0.005649566650390625, 0.0017223358154296875, 0.00909423828125, 0.016466140747070312, 0.023838043212890625, 0.031209945678710938, 0.03858184814453125, 0.04595375061035156, 0.053325653076171875, 0.06069755554199219, 0.0680694580078125, 0.07544136047363281, 0.08281326293945312, 0.09018516540527344, 0.09755706787109375, 0.10492897033691406, 0.11230087280273438, 0.11967277526855469, 0.127044677734375, 0.1344165802001953, 0.14178848266601562, 0.14916038513183594, 0.15653228759765625, 0.16390419006347656, 0.17127609252929688, 0.1786479949951172, 0.1860198974609375, 0.1933917999267578, 0.20076370239257812, 0.20813560485839844, 0.21550750732421875, 0.22287940979003906, 0.23025131225585938, 0.2376232147216797, 0.2449951171875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 9.0, 7.0, 4.0, 8.0, 13.0, 15.0, 24.0, 38.0, 56.0, 59.0, 94.0, 139.0, 110.0, 122.0, 84.0, 50.0, 38.0, 30.0, 27.0, 13.0, 17.0, 6.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165283203125, -0.1596393585205078, -0.15399551391601562, -0.14835166931152344, -0.14270782470703125, -0.13706398010253906, -0.13142013549804688, -0.1257762908935547, -0.1201324462890625, -0.11448860168457031, -0.10884475708007812, -0.10320091247558594, -0.09755706787109375, -0.09191322326660156, -0.08626937866210938, -0.08062553405761719, -0.074981689453125, -0.06933784484863281, -0.06369400024414062, -0.05805015563964844, -0.05240631103515625, -0.04676246643066406, -0.041118621826171875, -0.03547477722167969, -0.0298309326171875, -0.024187088012695312, -0.018543243408203125, -0.012899398803710938, -0.00725555419921875, -0.0016117095947265625, 0.004032135009765625, 0.009675979614257812, 0.01531982421875, 0.020963668823242188, 0.026607513427734375, 0.03225135803222656, 0.03789520263671875, 0.04353904724121094, 0.049182891845703125, 0.05482673645019531, 0.0604705810546875, 0.06611442565917969, 0.07175827026367188, 0.07740211486816406, 0.08304595947265625, 0.08868980407714844, 0.09433364868164062, 0.09997749328613281, 0.105621337890625, 0.11126518249511719, 0.11690902709960938, 0.12255287170410156, 0.12819671630859375, 0.13384056091308594, 0.13948440551757812, 0.1451282501220703, 0.1507720947265625, 0.1564159393310547, 0.16205978393554688, 0.16770362854003906, 0.17334747314453125, 0.17899131774902344, 0.18463516235351562, 0.1902790069580078, 0.1959228515625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 16.0, 19.0, 48.0, 86.0, 139.0, 181.0, 176.0, 156.0, 77.0, 55.0, 19.0, 14.0, 9.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4526896476745605, -2.3807754516601562, -2.308861255645752, -2.2369470596313477, -2.1650328636169434, -2.09311842918396, -2.0212042331695557, -1.9492900371551514, -1.877375841140747, -1.8054616451263428, -1.7335474491119385, -1.6616331338882446, -1.5897189378738403, -1.517804741859436, -1.4458904266357422, -1.373976230621338, -1.3020620346069336, -1.2301478385925293, -1.158233642578125, -1.0863193273544312, -1.0144051313400269, -0.9424909353256226, -0.8705766797065735, -0.7986624240875244, -0.7267482280731201, -0.6548340320587158, -0.5829197764396667, -0.5110055208206177, -0.4390913248062134, -0.3671770989894867, -0.29526287317276, -0.22334861755371094, -0.15143442153930664, -0.07952019572257996, -0.0076059699058532715, 0.06430825591087341, 0.1362224817276001, 0.20813670754432678, 0.28005093336105347, 0.35196518898010254, 0.42387938499450684, 0.4957936108112335, 0.5677078366279602, 0.6396220922470093, 0.7115362882614136, 0.7834504842758179, 0.8553647398948669, 0.927278995513916, 0.9991931915283203, 1.0711073875427246, 1.143021583557129, 1.2149358987808228, 1.286850094795227, 1.3587642908096313, 1.4306786060333252, 1.5025928020477295, 1.5745069980621338, 1.646421194076538, 1.7183353900909424, 1.7902497053146362, 1.8621639013290405, 1.9340780973434448, 2.0059924125671387, 2.077906608581543, 2.1498208045959473]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 2.0, 0.0, 4.0, 6.0, 6.0, 5.0, 5.0, 12.0, 6.0, 11.0, 20.0, 21.0, 22.0, 18.0, 20.0, 26.0, 34.0, 25.0, 33.0, 35.0, 35.0, 45.0, 46.0, 33.0, 39.0, 28.0, 40.0, 46.0, 34.0, 31.0, 34.0, 35.0, 31.0, 23.0, 30.0, 27.0, 20.0, 25.0, 10.0, 13.0, 9.0, 15.0, 4.0, 5.0, 5.0, 7.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.7390925884246826, -0.7134337425231934, -0.6877748966217041, -0.6621159911155701, -0.6364571452140808, -0.6107982993125916, -0.5851394534111023, -0.5594805479049683, -0.533821702003479, -0.5081628561019897, -0.4825039803981781, -0.45684513449668884, -0.4311862587928772, -0.40552741289138794, -0.3798685669898987, -0.35420969128608704, -0.3285508453845978, -0.3028919994831085, -0.2772331237792969, -0.2515742778778076, -0.22591540217399597, -0.2002565562725067, -0.17459769546985626, -0.1489388346672058, -0.12327997386455536, -0.09762111306190491, -0.07196225225925446, -0.0463033989071846, -0.02064453810453415, 0.005014315247535706, 0.030673176050186157, 0.05633203685283661, 0.08199089765548706, 0.10764975845813751, 0.13330861926078796, 0.15896746516227722, 0.18462634086608887, 0.21028518676757812, 0.23594404757022858, 0.26160290837287903, 0.2872617840766907, 0.31292062997817993, 0.3385795056819916, 0.36423835158348083, 0.3898972272872925, 0.41555607318878174, 0.441214919090271, 0.46687379479408264, 0.4925326406955719, 0.5181915163993835, 0.5438503623008728, 0.5695092082023621, 0.5951680541038513, 0.6208269596099854, 0.6464858055114746, 0.6721446514129639, 0.6978034973144531, 0.7234623432159424, 0.7491211891174316, 0.7747800946235657, 0.8004389405250549, 0.8260977864265442, 0.8517566323280334, 0.8774155378341675, 0.9030743837356567]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 5.0, 0.0, 9.0, 10.0, 15.0, 17.0, 14.0, 31.0, 40.0, 69.0, 108.0, 184.0, 321.0, 544.0, 913.0, 1890.0, 3890.0, 8443.0, 20483.0, 52011.0, 148432.0, 523441.0, 2222548.0, 875821.0, 216489.0, 71538.0, 26643.0, 10702.0, 4767.0, 2260.0, 1167.0, 628.0, 326.0, 181.0, 111.0, 80.0, 40.0, 38.0, 26.0, 21.0, 7.0, 5.0, 6.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.14944839477539062, -0.14423370361328125, -0.13901901245117188, -0.1338043212890625, -0.12858963012695312, -0.12337493896484375, -0.11816024780273438, -0.112945556640625, -0.10773086547851562, -0.10251617431640625, -0.09730148315429688, -0.0920867919921875, -0.08687210083007812, -0.08165740966796875, -0.07644271850585938, -0.07122802734375, -0.06601333618164062, -0.06079864501953125, -0.055583953857421875, -0.0503692626953125, -0.045154571533203125, -0.03993988037109375, -0.034725189208984375, -0.029510498046875, -0.024295806884765625, -0.01908111572265625, -0.013866424560546875, -0.0086517333984375, -0.003437042236328125, 0.00177764892578125, 0.006992340087890625, 0.01220703125, 0.017421722412109375, 0.02263641357421875, 0.027851104736328125, 0.0330657958984375, 0.038280487060546875, 0.04349517822265625, 0.048709869384765625, 0.053924560546875, 0.059139251708984375, 0.06435394287109375, 0.06956863403320312, 0.0747833251953125, 0.07999801635742188, 0.08521270751953125, 0.09042739868164062, 0.09564208984375, 0.10085678100585938, 0.10607147216796875, 0.11128616333007812, 0.1165008544921875, 0.12171554565429688, 0.12693023681640625, 0.13214492797851562, 0.137359619140625, 0.14257431030273438, 0.14778900146484375, 0.15300369262695312, 0.1582183837890625, 0.16343307495117188, 0.16864776611328125, 0.17386245727539062, 0.1790771484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 7.0, 8.0, 10.0, 5.0, 13.0, 15.0, 15.0, 18.0, 21.0, 23.0, 23.0, 26.0, 23.0, 43.0, 45.0, 32.0, 50.0, 39.0, 45.0, 48.0, 47.0, 52.0, 37.0, 42.0, 46.0, 39.0, 20.0, 35.0, 32.0, 18.0, 15.0, 27.0, 15.0, 8.0, 8.0, 11.0, 8.0, 7.0, 7.0, 5.0, 1.0, 1.0, 5.0, 4.0, 0.0, 1.0], "bins": [-0.10601806640625, -0.10318565368652344, -0.10035324096679688, -0.09752082824707031, -0.09468841552734375, -0.09185600280761719, -0.08902359008789062, -0.08619117736816406, -0.0833587646484375, -0.08052635192871094, -0.07769393920898438, -0.07486152648925781, -0.07202911376953125, -0.06919670104980469, -0.06636428833007812, -0.06353187561035156, -0.060699462890625, -0.05786705017089844, -0.055034637451171875, -0.05220222473144531, -0.04936981201171875, -0.04653739929199219, -0.043704986572265625, -0.04087257385253906, -0.0380401611328125, -0.03520774841308594, -0.032375335693359375, -0.029542922973632812, -0.02671051025390625, -0.023878097534179688, -0.021045684814453125, -0.018213272094726562, -0.015380859375, -0.012548446655273438, -0.009716033935546875, -0.0068836212158203125, -0.00405120849609375, -0.0012187957763671875, 0.001613616943359375, 0.0044460296630859375, 0.0072784423828125, 0.010110855102539062, 0.012943267822265625, 0.015775680541992188, 0.01860809326171875, 0.021440505981445312, 0.024272918701171875, 0.027105331420898438, 0.029937744140625, 0.03277015686035156, 0.035602569580078125, 0.03843498229980469, 0.04126739501953125, 0.04409980773925781, 0.046932220458984375, 0.04976463317871094, 0.0525970458984375, 0.05542945861816406, 0.058261871337890625, 0.06109428405761719, 0.06392669677734375, 0.06675910949707031, 0.06959152221679688, 0.07242393493652344, 0.07525634765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 8.0, 8.0, 8.0, 12.0, 10.0, 10.0, 32.0, 26.0, 51.0, 61.0, 70.0, 133.0, 183.0, 237.0, 377.0, 727.0, 1177.0, 2107.0, 4070.0, 8614.0, 18765.0, 44389.0, 109530.0, 295747.0, 979709.0, 1850652.0, 557396.0, 190476.0, 73274.0, 29933.0, 13147.0, 6214.0, 3055.0, 1667.0, 885.0, 526.0, 327.0, 201.0, 121.0, 114.0, 75.0, 55.0, 31.0, 17.0, 18.0, 15.0, 8.0, 7.0, 7.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.194580078125, -0.1885528564453125, -0.182525634765625, -0.1764984130859375, -0.17047119140625, -0.1644439697265625, -0.158416748046875, -0.1523895263671875, -0.1463623046875, -0.1403350830078125, -0.134307861328125, -0.1282806396484375, -0.12225341796875, -0.1162261962890625, -0.110198974609375, -0.1041717529296875, -0.09814453125, -0.0921173095703125, -0.086090087890625, -0.0800628662109375, -0.07403564453125, -0.0680084228515625, -0.061981201171875, -0.0559539794921875, -0.0499267578125, -0.0438995361328125, -0.037872314453125, -0.0318450927734375, -0.02581787109375, -0.0197906494140625, -0.013763427734375, -0.0077362060546875, -0.001708984375, 0.0043182373046875, 0.010345458984375, 0.0163726806640625, 0.02239990234375, 0.0284271240234375, 0.034454345703125, 0.0404815673828125, 0.0465087890625, 0.0525360107421875, 0.058563232421875, 0.0645904541015625, 0.07061767578125, 0.0766448974609375, 0.082672119140625, 0.0886993408203125, 0.0947265625, 0.1007537841796875, 0.106781005859375, 0.1128082275390625, 0.11883544921875, 0.1248626708984375, 0.130889892578125, 0.1369171142578125, 0.1429443359375, 0.1489715576171875, 0.154998779296875, 0.1610260009765625, 0.16705322265625, 0.1730804443359375, 0.179107666015625, 0.1851348876953125, 0.191162109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 7.0, 8.0, 17.0, 11.0, 25.0, 42.0, 44.0, 70.0, 95.0, 124.0, 153.0, 259.0, 388.0, 559.0, 749.0, 460.0, 310.0, 228.0, 149.0, 104.0, 78.0, 62.0, 33.0, 34.0, 17.0, 15.0, 8.0, 9.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24853515625, -0.24126052856445312, -0.23398590087890625, -0.22671127319335938, -0.2194366455078125, -0.21216201782226562, -0.20488739013671875, -0.19761276245117188, -0.190338134765625, -0.18306350708007812, -0.17578887939453125, -0.16851425170898438, -0.1612396240234375, -0.15396499633789062, -0.14669036865234375, -0.13941574096679688, -0.13214111328125, -0.12486648559570312, -0.11759185791015625, -0.11031723022460938, -0.1030426025390625, -0.09576797485351562, -0.08849334716796875, -0.08121871948242188, -0.073944091796875, -0.06666946411132812, -0.05939483642578125, -0.052120208740234375, -0.0448455810546875, -0.037570953369140625, -0.03029632568359375, -0.023021697998046875, -0.0157470703125, -0.008472442626953125, -0.00119781494140625, 0.006076812744140625, 0.0133514404296875, 0.020626068115234375, 0.02790069580078125, 0.035175323486328125, 0.042449951171875, 0.049724578857421875, 0.05699920654296875, 0.06427383422851562, 0.0715484619140625, 0.07882308959960938, 0.08609771728515625, 0.09337234497070312, 0.10064697265625, 0.10792160034179688, 0.11519622802734375, 0.12247085571289062, 0.1297454833984375, 0.13702011108398438, 0.14429473876953125, 0.15156936645507812, 0.158843994140625, 0.16611862182617188, 0.17339324951171875, 0.18066787719726562, 0.1879425048828125, 0.19521713256835938, 0.20249176025390625, 0.20976638793945312, 0.217041015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 9.0, 16.0, 22.0, 27.0, 49.0, 77.0, 110.0, 114.0, 93.0, 107.0, 121.0, 71.0, 60.0, 36.0, 31.0, 25.0, 10.0, 5.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9338374137878418, -0.892816960811615, -0.8517965078353882, -0.8107760548591614, -0.7697556018829346, -0.7287351489067078, -0.687714695930481, -0.6466941833496094, -0.6056737899780273, -0.5646533370018005, -0.5236328840255737, -0.4826124310493469, -0.4415919780731201, -0.4005715250968933, -0.3595510423183441, -0.3185305893421173, -0.2775101065635681, -0.2364896535873413, -0.1954692006111145, -0.1544487327337265, -0.1134282797574997, -0.07240782678127289, -0.03138735890388489, 0.009633094072341919, 0.050653547048568726, 0.09167400002479553, 0.13269445300102234, 0.17371492087841034, 0.21473537385463715, 0.25575584173202515, 0.29677629470825195, 0.33779674768447876, 0.37881720066070557, 0.4198376536369324, 0.4608581066131592, 0.501878559589386, 0.5428990125656128, 0.5839194655418396, 0.6249399185180664, 0.665960431098938, 0.70698082447052, 0.7480012774467468, 0.7890217304229736, 0.8300421833992004, 0.8710626363754272, 0.912083089351654, 0.9531035423278809, 0.9941240549087524, 1.035144567489624, 1.0761650800704956, 1.1171854734420776, 1.1582059860229492, 1.1992263793945312, 1.2402468919754028, 1.2812672853469849, 1.3222877979278564, 1.3633081912994385, 1.40432870388031, 1.445349097251892, 1.4863696098327637, 1.5273900032043457, 1.5684105157852173, 1.6094309091567993, 1.650451421737671, 1.691471815109253]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 4.0, 6.0, 5.0, 7.0, 11.0, 9.0, 18.0, 21.0, 22.0, 35.0, 38.0, 28.0, 34.0, 43.0, 37.0, 39.0, 47.0, 37.0, 46.0, 46.0, 33.0, 35.0, 33.0, 34.0, 38.0, 41.0, 36.0, 26.0, 30.0, 27.0, 23.0, 16.0, 23.0, 12.0, 12.0, 22.0, 9.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6693547964096069, -0.6482653021812439, -0.6271757483482361, -0.606086254119873, -0.5849967002868652, -0.5639072060585022, -0.5428177118301392, -0.5217281579971313, -0.5006386041641235, -0.4795490801334381, -0.4584595561027527, -0.43737006187438965, -0.41628050804138184, -0.3951910138130188, -0.3741014897823334, -0.35301196575164795, -0.3319224715232849, -0.3108329474925995, -0.28974342346191406, -0.268653929233551, -0.2475643903017044, -0.22647486627101898, -0.20538535714149475, -0.18429583311080933, -0.1632063090801239, -0.14211678504943848, -0.12102726846933365, -0.09993775188922882, -0.0788482278585434, -0.05775870382785797, -0.03666919469833374, -0.015579670667648315, 0.005509793758392334, 0.02659931406378746, 0.04768883436918259, 0.06877835094928741, 0.08986787497997284, 0.11095739901065826, 0.1320469081401825, 0.15313643217086792, 0.17422595620155334, 0.19531548023223877, 0.2164050042629242, 0.23749451339244843, 0.25858402252197266, 0.27967357635498047, 0.3007630705833435, 0.32185259461402893, 0.34294211864471436, 0.3640316426753998, 0.3851211667060852, 0.40621066093444824, 0.42730021476745605, 0.4483897089958191, 0.4694792330265045, 0.49056875705718994, 0.5116583108901978, 0.5327478051185608, 0.5538373589515686, 0.5749268531799316, 0.5960164070129395, 0.6171059012413025, 0.6381953954696655, 0.6592849493026733, 0.6803744435310364]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 15.0, 20.0, 47.0, 39.0, 73.0, 94.0, 131.0, 215.0, 309.0, 427.0, 604.0, 950.0, 1321.0, 1848.0, 2863.0, 4556.0, 6970.0, 11289.0, 18938.0, 32836.0, 62503.0, 147102.0, 353305.0, 217501.0, 82575.0, 41162.0, 23184.0, 13673.0, 8435.0, 5155.0, 3396.0, 2159.0, 1473.0, 1007.0, 737.0, 526.0, 339.0, 230.0, 164.0, 112.0, 87.0, 64.0, 38.0, 35.0, 17.0, 8.0, 4.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14596176147460938, -0.14104461669921875, -0.13612747192382812, -0.1312103271484375, -0.12629318237304688, -0.12137603759765625, -0.11645889282226562, -0.111541748046875, -0.10662460327148438, -0.10170745849609375, -0.09679031372070312, -0.0918731689453125, -0.08695602416992188, -0.08203887939453125, -0.07712173461914062, -0.07220458984375, -0.06728744506835938, -0.06237030029296875, -0.057453155517578125, -0.0525360107421875, -0.047618865966796875, -0.04270172119140625, -0.037784576416015625, -0.032867431640625, -0.027950286865234375, -0.02303314208984375, -0.018115997314453125, -0.0131988525390625, -0.008281707763671875, -0.00336456298828125, 0.001552581787109375, 0.0064697265625, 0.011386871337890625, 0.01630401611328125, 0.021221160888671875, 0.0261383056640625, 0.031055450439453125, 0.03597259521484375, 0.040889739990234375, 0.045806884765625, 0.050724029541015625, 0.05564117431640625, 0.060558319091796875, 0.0654754638671875, 0.07039260864257812, 0.07530975341796875, 0.08022689819335938, 0.08514404296875, 0.09006118774414062, 0.09497833251953125, 0.09989547729492188, 0.1048126220703125, 0.10972976684570312, 0.11464691162109375, 0.11956405639648438, 0.124481201171875, 0.12939834594726562, 0.13431549072265625, 0.13923263549804688, 0.1441497802734375, 0.14906692504882812, 0.15398406982421875, 0.15890121459960938, 0.163818359375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 8.0, 8.0, 8.0, 7.0, 13.0, 6.0, 12.0, 20.0, 25.0, 24.0, 28.0, 31.0, 42.0, 38.0, 43.0, 49.0, 46.0, 37.0, 44.0, 40.0, 44.0, 45.0, 47.0, 42.0, 47.0, 35.0, 27.0, 35.0, 24.0, 22.0, 20.0, 12.0, 16.0, 14.0, 8.0, 8.0, 4.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1011962890625, -0.09802627563476562, -0.09485626220703125, -0.09168624877929688, -0.0885162353515625, -0.08534622192382812, -0.08217620849609375, -0.07900619506835938, -0.075836181640625, -0.07266616821289062, -0.06949615478515625, -0.06632614135742188, -0.0631561279296875, -0.059986114501953125, -0.05681610107421875, -0.053646087646484375, -0.05047607421875, -0.047306060791015625, -0.04413604736328125, -0.040966033935546875, -0.0377960205078125, -0.034626007080078125, -0.03145599365234375, -0.028285980224609375, -0.025115966796875, -0.021945953369140625, -0.01877593994140625, -0.015605926513671875, -0.0124359130859375, -0.009265899658203125, -0.00609588623046875, -0.002925872802734375, 0.000244140625, 0.003414154052734375, 0.00658416748046875, 0.009754180908203125, 0.0129241943359375, 0.016094207763671875, 0.01926422119140625, 0.022434234619140625, 0.025604248046875, 0.028774261474609375, 0.03194427490234375, 0.035114288330078125, 0.0382843017578125, 0.041454315185546875, 0.04462432861328125, 0.047794342041015625, 0.05096435546875, 0.054134368896484375, 0.05730438232421875, 0.060474395751953125, 0.0636444091796875, 0.06681442260742188, 0.06998443603515625, 0.07315444946289062, 0.076324462890625, 0.07949447631835938, 0.08266448974609375, 0.08583450317382812, 0.0890045166015625, 0.09217453002929688, 0.09534454345703125, 0.09851455688476562, 0.1016845703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 9.0, 5.0, 4.0, 10.0, 19.0, 17.0, 15.0, 15.0, 25.0, 44.0, 71.0, 104.0, 149.0, 243.0, 440.0, 796.0, 1477.0, 2845.0, 5588.0, 10980.0, 22480.0, 50225.0, 141348.0, 465158.0, 222328.0, 67352.0, 28711.0, 13693.0, 6796.0, 3377.0, 1818.0, 1018.0, 516.0, 296.0, 200.0, 135.0, 80.0, 46.0, 34.0, 25.0, 16.0, 8.0, 13.0, 7.0, 8.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2216796875, -0.2146778106689453, -0.20767593383789062, -0.20067405700683594, -0.19367218017578125, -0.18667030334472656, -0.17966842651367188, -0.1726665496826172, -0.1656646728515625, -0.1586627960205078, -0.15166091918945312, -0.14465904235839844, -0.13765716552734375, -0.13065528869628906, -0.12365341186523438, -0.11665153503417969, -0.109649658203125, -0.10264778137207031, -0.09564590454101562, -0.08864402770996094, -0.08164215087890625, -0.07464027404785156, -0.06763839721679688, -0.06063652038574219, -0.0536346435546875, -0.04663276672363281, -0.039630889892578125, -0.03262901306152344, -0.02562713623046875, -0.018625259399414062, -0.011623382568359375, -0.0046215057373046875, 0.00238037109375, 0.009382247924804688, 0.016384124755859375, 0.023386001586914062, 0.03038787841796875, 0.03738975524902344, 0.044391632080078125, 0.05139350891113281, 0.0583953857421875, 0.06539726257324219, 0.07239913940429688, 0.07940101623535156, 0.08640289306640625, 0.09340476989746094, 0.10040664672851562, 0.10740852355957031, 0.114410400390625, 0.12141227722167969, 0.12841415405273438, 0.13541603088378906, 0.14241790771484375, 0.14941978454589844, 0.15642166137695312, 0.1634235382080078, 0.1704254150390625, 0.1774272918701172, 0.18442916870117188, 0.19143104553222656, 0.19843292236328125, 0.20543479919433594, 0.21243667602539062, 0.2194385528564453, 0.2264404296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 10.0, 8.0, 4.0, 14.0, 12.0, 11.0, 16.0, 17.0, 24.0, 31.0, 23.0, 26.0, 26.0, 38.0, 40.0, 29.0, 39.0, 42.0, 49.0, 35.0, 28.0, 49.0, 37.0, 35.0, 36.0, 36.0, 30.0, 30.0, 30.0, 27.0, 21.0, 20.0, 20.0, 15.0, 19.0, 13.0, 9.0, 11.0, 6.0, 5.0, 7.0, 1.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.278564453125, -0.2702751159667969, -0.26198577880859375, -0.2536964416503906, -0.2454071044921875, -0.23711776733398438, -0.22882843017578125, -0.22053909301757812, -0.212249755859375, -0.20396041870117188, -0.19567108154296875, -0.18738174438476562, -0.1790924072265625, -0.17080307006835938, -0.16251373291015625, -0.15422439575195312, -0.14593505859375, -0.13764572143554688, -0.12935638427734375, -0.12106704711914062, -0.1127777099609375, -0.10448837280273438, -0.09619903564453125, -0.08790969848632812, -0.079620361328125, -0.07133102416992188, -0.06304168701171875, -0.054752349853515625, -0.0464630126953125, -0.038173675537109375, -0.02988433837890625, -0.021595001220703125, -0.0133056640625, -0.005016326904296875, 0.00327301025390625, 0.011562347412109375, 0.0198516845703125, 0.028141021728515625, 0.03643035888671875, 0.044719696044921875, 0.053009033203125, 0.061298370361328125, 0.06958770751953125, 0.07787704467773438, 0.0861663818359375, 0.09445571899414062, 0.10274505615234375, 0.11103439331054688, 0.11932373046875, 0.12761306762695312, 0.13590240478515625, 0.14419174194335938, 0.1524810791015625, 0.16077041625976562, 0.16905975341796875, 0.17734909057617188, 0.185638427734375, 0.19392776489257812, 0.20221710205078125, 0.21050643920898438, 0.2187957763671875, 0.22708511352539062, 0.23537445068359375, 0.24366378784179688, 0.251953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 1.0, 10.0, 6.0, 11.0, 19.0, 26.0, 32.0, 45.0, 78.0, 139.0, 250.0, 479.0, 970.0, 2028.0, 4339.0, 9366.0, 21464.0, 50408.0, 112413.0, 380932.0, 293519.0, 95379.0, 42457.0, 18797.0, 8182.0, 3546.0, 1755.0, 898.0, 441.0, 224.0, 117.0, 76.0, 50.0, 26.0, 17.0, 13.0, 7.0, 8.0, 7.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.11590576171875, -0.11238288879394531, -0.10886001586914062, -0.10533714294433594, -0.10181427001953125, -0.09829139709472656, -0.09476852416992188, -0.09124565124511719, -0.0877227783203125, -0.08419990539550781, -0.08067703247070312, -0.07715415954589844, -0.07363128662109375, -0.07010841369628906, -0.06658554077148438, -0.06306266784667969, -0.059539794921875, -0.05601692199707031, -0.052494049072265625, -0.04897117614746094, -0.04544830322265625, -0.04192543029785156, -0.038402557373046875, -0.03487968444824219, -0.0313568115234375, -0.027833938598632812, -0.024311065673828125, -0.020788192749023438, -0.01726531982421875, -0.013742446899414062, -0.010219573974609375, -0.0066967010498046875, -0.003173828125, 0.0003490447998046875, 0.003871917724609375, 0.0073947906494140625, 0.01091766357421875, 0.014440536499023438, 0.017963409423828125, 0.021486282348632812, 0.0250091552734375, 0.028532028198242188, 0.032054901123046875, 0.03557777404785156, 0.03910064697265625, 0.04262351989746094, 0.046146392822265625, 0.04966926574707031, 0.053192138671875, 0.05671501159667969, 0.060237884521484375, 0.06376075744628906, 0.06728363037109375, 0.07080650329589844, 0.07432937622070312, 0.07785224914550781, 0.0813751220703125, 0.08489799499511719, 0.08842086791992188, 0.09194374084472656, 0.09546661376953125, 0.09898948669433594, 0.10251235961914062, 0.10603523254394531, 0.10955810546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 2.0, 7.0, 4.0, 8.0, 6.0, 6.0, 10.0, 6.0, 16.0, 20.0, 29.0, 34.0, 38.0, 52.0, 93.0, 113.0, 131.0, 126.0, 76.0, 65.0, 43.0, 17.0, 27.0, 17.0, 6.0, 17.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0338764190673828e-05, -2.931244671344757e-05, -2.8286129236221313e-05, -2.7259811758995056e-05, -2.62334942817688e-05, -2.520717680454254e-05, -2.4180859327316284e-05, -2.3154541850090027e-05, -2.212822437286377e-05, -2.1101906895637512e-05, -2.0075589418411255e-05, -1.9049271941184998e-05, -1.802295446395874e-05, -1.6996636986732483e-05, -1.5970319509506226e-05, -1.4944002032279968e-05, -1.3917684555053711e-05, -1.2891367077827454e-05, -1.1865049600601196e-05, -1.0838732123374939e-05, -9.812414646148682e-06, -8.786097168922424e-06, -7.759779691696167e-06, -6.73346221446991e-06, -5.707144737243652e-06, -4.680827260017395e-06, -3.6545097827911377e-06, -2.6281923055648804e-06, -1.601874828338623e-06, -5.755573511123657e-07, 4.507601261138916e-07, 1.477077603340149e-06, 2.5033950805664062e-06, 3.5297125577926636e-06, 4.556030035018921e-06, 5.582347512245178e-06, 6.6086649894714355e-06, 7.634982466697693e-06, 8.66129994392395e-06, 9.687617421150208e-06, 1.0713934898376465e-05, 1.1740252375602722e-05, 1.276656985282898e-05, 1.3792887330055237e-05, 1.4819204807281494e-05, 1.584552228450775e-05, 1.687183976173401e-05, 1.7898157238960266e-05, 1.8924474716186523e-05, 1.995079219341278e-05, 2.0977109670639038e-05, 2.2003427147865295e-05, 2.3029744625091553e-05, 2.405606210231781e-05, 2.5082379579544067e-05, 2.6108697056770325e-05, 2.7135014533996582e-05, 2.816133201122284e-05, 2.9187649488449097e-05, 3.0213966965675354e-05, 3.124028444290161e-05, 3.226660192012787e-05, 3.3292919397354126e-05, 3.431923687458038e-05, 3.534555435180664e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 8.0, 10.0, 23.0, 23.0, 42.0, 59.0, 100.0, 170.0, 334.0, 634.0, 1227.0, 3069.0, 9571.0, 32321.0, 117542.0, 523646.0, 267619.0, 64704.0, 18081.0, 5428.0, 2010.0, 883.0, 453.0, 239.0, 121.0, 84.0, 45.0, 33.0, 20.0, 18.0, 11.0, 8.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.141357421875, -0.13626670837402344, -0.13117599487304688, -0.1260852813720703, -0.12099456787109375, -0.11590385437011719, -0.11081314086914062, -0.10572242736816406, -0.1006317138671875, -0.09554100036621094, -0.09045028686523438, -0.08535957336425781, -0.08026885986328125, -0.07517814636230469, -0.07008743286132812, -0.06499671936035156, -0.059906005859375, -0.05481529235839844, -0.049724578857421875, -0.04463386535644531, -0.03954315185546875, -0.03445243835449219, -0.029361724853515625, -0.024271011352539062, -0.0191802978515625, -0.014089584350585938, -0.008998870849609375, -0.0039081573486328125, 0.00118255615234375, 0.0062732696533203125, 0.011363983154296875, 0.016454696655273438, 0.02154541015625, 0.026636123657226562, 0.031726837158203125, 0.03681755065917969, 0.04190826416015625, 0.04699897766113281, 0.052089691162109375, 0.05718040466308594, 0.0622711181640625, 0.06736183166503906, 0.07245254516601562, 0.07754325866699219, 0.08263397216796875, 0.08772468566894531, 0.09281539916992188, 0.09790611267089844, 0.102996826171875, 0.10808753967285156, 0.11317825317382812, 0.11826896667480469, 0.12335968017578125, 0.1284503936767578, 0.13354110717773438, 0.13863182067871094, 0.1437225341796875, 0.14881324768066406, 0.15390396118164062, 0.1589946746826172, 0.16408538818359375, 0.1691761016845703, 0.17426681518554688, 0.17935752868652344, 0.1844482421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 8.0, 9.0, 15.0, 7.0, 17.0, 14.0, 20.0, 31.0, 26.0, 30.0, 46.0, 61.0, 98.0, 118.0, 99.0, 83.0, 71.0, 35.0, 39.0, 27.0, 21.0, 17.0, 23.0, 19.0, 9.0, 8.0, 7.0, 7.0, 6.0, 4.0, 3.0, 7.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.128662109375, -0.1252899169921875, -0.121917724609375, -0.1185455322265625, -0.11517333984375, -0.1118011474609375, -0.108428955078125, -0.1050567626953125, -0.1016845703125, -0.0983123779296875, -0.094940185546875, -0.0915679931640625, -0.08819580078125, -0.0848236083984375, -0.081451416015625, -0.0780792236328125, -0.07470703125, -0.0713348388671875, -0.067962646484375, -0.0645904541015625, -0.06121826171875, -0.0578460693359375, -0.054473876953125, -0.0511016845703125, -0.0477294921875, -0.0443572998046875, -0.040985107421875, -0.0376129150390625, -0.03424072265625, -0.0308685302734375, -0.027496337890625, -0.0241241455078125, -0.020751953125, -0.0173797607421875, -0.014007568359375, -0.0106353759765625, -0.00726318359375, -0.0038909912109375, -0.000518798828125, 0.0028533935546875, 0.0062255859375, 0.0095977783203125, 0.012969970703125, 0.0163421630859375, 0.01971435546875, 0.0230865478515625, 0.026458740234375, 0.0298309326171875, 0.033203125, 0.0365753173828125, 0.039947509765625, 0.0433197021484375, 0.04669189453125, 0.0500640869140625, 0.053436279296875, 0.0568084716796875, 0.0601806640625, 0.0635528564453125, 0.066925048828125, 0.0702972412109375, 0.07366943359375, 0.0770416259765625, 0.080413818359375, 0.0837860107421875, 0.087158203125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 20.0, 24.0, 39.0, 59.0, 90.0, 105.0, 117.0, 118.0, 97.0, 90.0, 77.0, 48.0, 36.0, 22.0, 20.0, 5.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0324938297271729, -0.9934993982315063, -0.9545049667358398, -0.9155104756355286, -0.8765160441398621, -0.8375216126441956, -0.7985271215438843, -0.7595326900482178, -0.7205382585525513, -0.6815438270568848, -0.6425493955612183, -0.603554904460907, -0.5645604729652405, -0.525566041469574, -0.4865715801715851, -0.4475771188735962, -0.4085826873779297, -0.3695882558822632, -0.3305937945842743, -0.2915993332862854, -0.2526049017906189, -0.2136104553937912, -0.1746160089969635, -0.1356215476989746, -0.0966271162033081, -0.05763266980648041, -0.01863822340965271, 0.020356222987174988, 0.059350669384002686, 0.09834511578083038, 0.13733956217765808, 0.17633402347564697, 0.21532845497131348, 0.25432288646698, 0.29331734776496887, 0.33231180906295776, 0.37130624055862427, 0.41030067205429077, 0.44929513335227966, 0.48828959465026855, 0.5272840261459351, 0.5662784576416016, 0.6052728891372681, 0.6442673802375793, 0.6832618117332458, 0.7222562432289124, 0.7612507343292236, 0.8002451658248901, 0.8392395973205566, 0.8782340288162231, 0.9172284603118896, 0.9562229514122009, 0.9952173829078674, 1.0342118740081787, 1.0732063055038452, 1.1122007369995117, 1.1511951684951782, 1.1901895999908447, 1.2291840314865112, 1.2681784629821777, 1.3071730136871338, 1.3461674451828003, 1.3851618766784668, 1.4241563081741333, 1.4631507396697998]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 9.0, 10.0, 8.0, 10.0, 20.0, 17.0, 14.0, 14.0, 29.0, 31.0, 28.0, 27.0, 33.0, 39.0, 49.0, 40.0, 33.0, 43.0, 57.0, 31.0, 33.0, 43.0, 44.0, 36.0, 43.0, 28.0, 39.0, 21.0, 27.0, 22.0, 23.0, 19.0, 12.0, 8.0, 12.0, 7.0, 6.0, 10.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6206184029579163, -0.5980514287948608, -0.5754845142364502, -0.5529175400733948, -0.5303506255149841, -0.5077836513519287, -0.48521673679351807, -0.46264976263046265, -0.440082848072052, -0.41751590371131897, -0.39494895935058594, -0.3723820149898529, -0.3498150706291199, -0.32724812626838684, -0.3046811819076538, -0.2821142077445984, -0.25954726338386536, -0.23698031902313232, -0.2144133746623993, -0.19184643030166626, -0.16927948594093323, -0.1467125415802002, -0.12414558231830597, -0.10157863795757294, -0.0790116935968399, -0.05644474923610687, -0.03387780115008354, -0.011310853064060211, 0.011256091296672821, 0.03382303565740585, 0.05638998746871948, 0.07895693182945251, 0.10152387619018555, 0.12409082055091858, 0.1466577649116516, 0.16922470927238464, 0.19179165363311768, 0.2143585979938507, 0.23692555725574493, 0.25949251651763916, 0.2820594310760498, 0.30462637543678284, 0.32719331979751587, 0.3497602641582489, 0.37232720851898193, 0.39489415287971497, 0.417461097240448, 0.4400280714035034, 0.46259501576423645, 0.4851619601249695, 0.5077289342880249, 0.5302958488464355, 0.552862823009491, 0.5754297375679016, 0.597996711730957, 0.6205636262893677, 0.6431306004524231, 0.6656975746154785, 0.6882644891738892, 0.7108314633369446, 0.7333983778953552, 0.7559653520584106, 0.7785322666168213, 0.8010992407798767, 0.8236661553382874]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 10.0, 14.0, 16.0, 31.0, 49.0, 46.0, 89.0, 124.0, 194.0, 318.0, 521.0, 907.0, 1715.0, 3285.0, 6469.0, 14219.0, 32130.0, 78334.0, 210576.0, 766389.0, 2188768.0, 592161.0, 177030.0, 67089.0, 28143.0, 12650.0, 6069.0, 3075.0, 1616.0, 856.0, 547.0, 306.0, 179.0, 112.0, 86.0, 56.0, 23.0, 26.0, 21.0, 8.0, 6.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165283203125, -0.1601848602294922, -0.15508651733398438, -0.14998817443847656, -0.14488983154296875, -0.13979148864746094, -0.13469314575195312, -0.1295948028564453, -0.1244964599609375, -0.11939811706542969, -0.11429977416992188, -0.10920143127441406, -0.10410308837890625, -0.09900474548339844, -0.09390640258789062, -0.08880805969238281, -0.083709716796875, -0.07861137390136719, -0.07351303100585938, -0.06841468811035156, -0.06331634521484375, -0.05821800231933594, -0.053119659423828125, -0.04802131652832031, -0.0429229736328125, -0.03782463073730469, -0.032726287841796875, -0.027627944946289062, -0.02252960205078125, -0.017431259155273438, -0.012332916259765625, -0.0072345733642578125, -0.00213623046875, 0.0029621124267578125, 0.008060455322265625, 0.013158798217773438, 0.01825714111328125, 0.023355484008789062, 0.028453826904296875, 0.03355216979980469, 0.0386505126953125, 0.04374885559082031, 0.048847198486328125, 0.05394554138183594, 0.05904388427734375, 0.06414222717285156, 0.06924057006835938, 0.07433891296386719, 0.079437255859375, 0.08453559875488281, 0.08963394165039062, 0.09473228454589844, 0.09983062744140625, 0.10492897033691406, 0.11002731323242188, 0.11512565612792969, 0.1202239990234375, 0.1253223419189453, 0.13042068481445312, 0.13551902770996094, 0.14061737060546875, 0.14571571350097656, 0.15081405639648438, 0.1559123992919922, 0.1610107421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 9.0, 7.0, 7.0, 11.0, 9.0, 16.0, 23.0, 23.0, 23.0, 20.0, 26.0, 24.0, 41.0, 40.0, 41.0, 45.0, 57.0, 38.0, 43.0, 50.0, 52.0, 45.0, 44.0, 36.0, 31.0, 32.0, 29.0, 26.0, 27.0, 17.0, 14.0, 13.0, 18.0, 12.0, 5.0, 8.0, 5.0, 10.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0970458984375, -0.09416961669921875, -0.0912933349609375, -0.08841705322265625, -0.085540771484375, -0.08266448974609375, -0.0797882080078125, -0.07691192626953125, -0.07403564453125, -0.07115936279296875, -0.0682830810546875, -0.06540679931640625, -0.062530517578125, -0.05965423583984375, -0.0567779541015625, -0.05390167236328125, -0.051025390625, -0.04814910888671875, -0.0452728271484375, -0.04239654541015625, -0.039520263671875, -0.03664398193359375, -0.0337677001953125, -0.03089141845703125, -0.02801513671875, -0.02513885498046875, -0.0222625732421875, -0.01938629150390625, -0.016510009765625, -0.01363372802734375, -0.0107574462890625, -0.00788116455078125, -0.0050048828125, -0.00212860107421875, 0.0007476806640625, 0.00362396240234375, 0.006500244140625, 0.00937652587890625, 0.0122528076171875, 0.01512908935546875, 0.01800537109375, 0.02088165283203125, 0.0237579345703125, 0.02663421630859375, 0.029510498046875, 0.03238677978515625, 0.0352630615234375, 0.03813934326171875, 0.041015625, 0.04389190673828125, 0.0467681884765625, 0.04964447021484375, 0.052520751953125, 0.05539703369140625, 0.0582733154296875, 0.06114959716796875, 0.06402587890625, 0.06690216064453125, 0.0697784423828125, 0.07265472412109375, 0.075531005859375, 0.07840728759765625, 0.0812835693359375, 0.08415985107421875, 0.0870361328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 8.0, 7.0, 14.0, 21.0, 30.0, 52.0, 67.0, 111.0, 164.0, 246.0, 433.0, 695.0, 1126.0, 2007.0, 3650.0, 6980.0, 14193.0, 29585.0, 65569.0, 157180.0, 438693.0, 1714570.0, 1209527.0, 324516.0, 123328.0, 52809.0, 24255.0, 11378.0, 5810.0, 3016.0, 1658.0, 958.0, 565.0, 367.0, 245.0, 165.0, 106.0, 75.0, 38.0, 16.0, 13.0, 15.0, 7.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.217529296875, -0.2112903594970703, -0.20505142211914062, -0.19881248474121094, -0.19257354736328125, -0.18633460998535156, -0.18009567260742188, -0.1738567352294922, -0.1676177978515625, -0.1613788604736328, -0.15513992309570312, -0.14890098571777344, -0.14266204833984375, -0.13642311096191406, -0.13018417358398438, -0.12394523620605469, -0.117706298828125, -0.11146736145019531, -0.10522842407226562, -0.09898948669433594, -0.09275054931640625, -0.08651161193847656, -0.08027267456054688, -0.07403373718261719, -0.0677947998046875, -0.06155586242675781, -0.055316925048828125, -0.04907798767089844, -0.04283905029296875, -0.03660011291503906, -0.030361175537109375, -0.024122238159179688, -0.01788330078125, -0.011644363403320312, -0.005405426025390625, 0.0008335113525390625, 0.00707244873046875, 0.013311386108398438, 0.019550323486328125, 0.025789260864257812, 0.0320281982421875, 0.03826713562011719, 0.044506072998046875, 0.05074501037597656, 0.05698394775390625, 0.06322288513183594, 0.06946182250976562, 0.07570075988769531, 0.081939697265625, 0.08817863464355469, 0.09441757202148438, 0.10065650939941406, 0.10689544677734375, 0.11313438415527344, 0.11937332153320312, 0.1256122589111328, 0.1318511962890625, 0.1380901336669922, 0.14432907104492188, 0.15056800842285156, 0.15680694580078125, 0.16304588317871094, 0.16928482055664062, 0.1755237579345703, 0.1817626953125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 14.0, 3.0, 5.0, 10.0, 9.0, 18.0, 20.0, 21.0, 30.0, 41.0, 45.0, 54.0, 83.0, 110.0, 135.0, 192.0, 279.0, 475.0, 646.0, 574.0, 356.0, 262.0, 171.0, 123.0, 94.0, 68.0, 64.0, 40.0, 17.0, 19.0, 26.0, 14.0, 20.0, 11.0, 4.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1895751953125, -0.1827411651611328, -0.17590713500976562, -0.16907310485839844, -0.16223907470703125, -0.15540504455566406, -0.14857101440429688, -0.1417369842529297, -0.1349029541015625, -0.1280689239501953, -0.12123489379882812, -0.11440086364746094, -0.10756683349609375, -0.10073280334472656, -0.09389877319335938, -0.08706474304199219, -0.080230712890625, -0.07339668273925781, -0.06656265258789062, -0.05972862243652344, -0.05289459228515625, -0.04606056213378906, -0.039226531982421875, -0.03239250183105469, -0.0255584716796875, -0.018724441528320312, -0.011890411376953125, -0.0050563812255859375, 0.00177764892578125, 0.008611679077148438, 0.015445709228515625, 0.022279739379882812, 0.02911376953125, 0.03594779968261719, 0.042781829833984375, 0.04961585998535156, 0.05644989013671875, 0.06328392028808594, 0.07011795043945312, 0.07695198059082031, 0.0837860107421875, 0.09062004089355469, 0.09745407104492188, 0.10428810119628906, 0.11112213134765625, 0.11795616149902344, 0.12479019165039062, 0.1316242218017578, 0.138458251953125, 0.1452922821044922, 0.15212631225585938, 0.15896034240722656, 0.16579437255859375, 0.17262840270996094, 0.17946243286132812, 0.1862964630126953, 0.1931304931640625, 0.1999645233154297, 0.20679855346679688, 0.21363258361816406, 0.22046661376953125, 0.22730064392089844, 0.23413467407226562, 0.2409687042236328, 0.247802734375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 15.0, 16.0, 47.0, 57.0, 115.0, 150.0, 199.0, 164.0, 123.0, 59.0, 22.0, 20.0, 7.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3207229375839233, -1.2530392408370972, -1.185355544090271, -1.1176718473434448, -1.0499881505966187, -0.9823044538497925, -0.9146208167076111, -0.8469371199607849, -0.7792534232139587, -0.7115697264671326, -0.6438860297203064, -0.576202392578125, -0.5085186958312988, -0.44083496928215027, -0.3731513023376465, -0.3054676055908203, -0.23778390884399414, -0.17010021209716797, -0.10241653025150299, -0.03473284840583801, 0.03295084834098816, 0.10063454508781433, 0.16831821203231812, 0.2360019087791443, 0.30368560552597046, 0.37136930227279663, 0.4390529990196228, 0.5067366361618042, 0.5744203329086304, 0.6421040296554565, 0.7097877264022827, 0.7774714231491089, 0.8451550006866455, 0.9128386974334717, 0.9805223941802979, 1.048206090927124, 1.1158897876739502, 1.1835734844207764, 1.2512571811676025, 1.3189408779144287, 1.3866245746612549, 1.454308271408081, 1.5219919681549072, 1.5896756649017334, 1.6573593616485596, 1.7250430583953857, 1.792726755142212, 1.860410451889038, 1.9280940294265747, 1.9957777261734009, 2.0634613037109375, 2.1311450004577637, 2.19882869720459, 2.266512393951416, 2.334196090698242, 2.4018797874450684, 2.4695634841918945, 2.5372471809387207, 2.604930877685547, 2.672614574432373, 2.740298271179199, 2.8079819679260254, 2.8756656646728516, 2.9433493614196777, 3.011033058166504]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 8.0, 3.0, 6.0, 4.0, 7.0, 14.0, 11.0, 10.0, 15.0, 22.0, 25.0, 27.0, 24.0, 44.0, 34.0, 29.0, 31.0, 51.0, 32.0, 41.0, 47.0, 42.0, 36.0, 32.0, 33.0, 38.0, 37.0, 44.0, 34.0, 33.0, 30.0, 24.0, 26.0, 10.0, 15.0, 17.0, 16.0, 12.0, 5.0, 2.0, 10.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8308234810829163, -0.8071470856666565, -0.7834707498550415, -0.7597943544387817, -0.736117959022522, -0.7124415636062622, -0.6887651681900024, -0.6650888323783875, -0.6414124369621277, -0.6177360415458679, -0.5940597057342529, -0.5703833103179932, -0.5467069149017334, -0.5230305194854736, -0.49935415387153625, -0.4756777882575989, -0.4520013928413391, -0.42832499742507935, -0.40464863181114197, -0.3809722661972046, -0.3572958707809448, -0.33361947536468506, -0.3099431097507477, -0.2862667441368103, -0.26259034872055054, -0.23891396820545197, -0.2152375876903534, -0.19156120717525482, -0.16788482666015625, -0.14420844614505768, -0.1205320656299591, -0.09685568511486053, -0.07317930459976196, -0.04950292408466339, -0.02582654356956482, -0.0021501630544662476, 0.021526217460632324, 0.045202597975730896, 0.06887897849082947, 0.09255535900592804, 0.11623173952102661, 0.13990812003612518, 0.16358450055122375, 0.18726088106632233, 0.2109372615814209, 0.23461364209651947, 0.25829002261161804, 0.2819663882255554, 0.3056427836418152, 0.32931917905807495, 0.35299554467201233, 0.3766719102859497, 0.4003483057022095, 0.42402470111846924, 0.4477010667324066, 0.471377432346344, 0.49505382776260376, 0.5187302231788635, 0.5424065589904785, 0.5660829544067383, 0.589759349822998, 0.6134357452392578, 0.6371121406555176, 0.6607884764671326, 0.6844648718833923]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 14.0, 13.0, 18.0, 24.0, 42.0, 56.0, 102.0, 175.0, 285.0, 443.0, 772.0, 1327.0, 2260.0, 3751.0, 6499.0, 11469.0, 21748.0, 47085.0, 135068.0, 375443.0, 279923.0, 88540.0, 34521.0, 16809.0, 9390.0, 5231.0, 3094.0, 1791.0, 1046.0, 648.0, 394.0, 204.0, 134.0, 82.0, 57.0, 38.0, 26.0, 11.0, 14.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1781005859375, -0.17169761657714844, -0.16529464721679688, -0.1588916778564453, -0.15248870849609375, -0.1460857391357422, -0.13968276977539062, -0.13327980041503906, -0.1268768310546875, -0.12047386169433594, -0.11407089233398438, -0.10766792297363281, -0.10126495361328125, -0.09486198425292969, -0.08845901489257812, -0.08205604553222656, -0.075653076171875, -0.06925010681152344, -0.06284713745117188, -0.05644416809082031, -0.05004119873046875, -0.04363822937011719, -0.037235260009765625, -0.030832290649414062, -0.0244293212890625, -0.018026351928710938, -0.011623382568359375, -0.0052204132080078125, 0.00118255615234375, 0.0075855255126953125, 0.013988494873046875, 0.020391464233398438, 0.02679443359375, 0.03319740295410156, 0.039600372314453125, 0.04600334167480469, 0.05240631103515625, 0.05880928039550781, 0.06521224975585938, 0.07161521911621094, 0.0780181884765625, 0.08442115783691406, 0.09082412719726562, 0.09722709655761719, 0.10363006591796875, 0.11003303527832031, 0.11643600463867188, 0.12283897399902344, 0.129241943359375, 0.13564491271972656, 0.14204788208007812, 0.1484508514404297, 0.15485382080078125, 0.1612567901611328, 0.16765975952148438, 0.17406272888183594, 0.1804656982421875, 0.18686866760253906, 0.19327163696289062, 0.1996746063232422, 0.20607757568359375, 0.2124805450439453, 0.21888351440429688, 0.22528648376464844, 0.231689453125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 7.0, 8.0, 12.0, 9.0, 12.0, 18.0, 21.0, 22.0, 34.0, 20.0, 16.0, 29.0, 44.0, 34.0, 37.0, 24.0, 40.0, 47.0, 31.0, 39.0, 38.0, 45.0, 37.0, 36.0, 39.0, 30.0, 35.0, 25.0, 20.0, 30.0, 27.0, 14.0, 18.0, 13.0, 16.0, 13.0, 11.0, 10.0, 9.0, 2.0, 5.0, 5.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.08966350555419922, -0.08661460876464844, -0.08356571197509766, -0.08051681518554688, -0.0774679183959961, -0.07441902160644531, -0.07137012481689453, -0.06832122802734375, -0.06527233123779297, -0.06222343444824219, -0.059174537658691406, -0.056125640869140625, -0.053076744079589844, -0.05002784729003906, -0.04697895050048828, -0.0439300537109375, -0.04088115692138672, -0.03783226013183594, -0.034783363342285156, -0.031734466552734375, -0.028685569763183594, -0.025636672973632812, -0.02258777618408203, -0.01953887939453125, -0.01648998260498047, -0.013441085815429688, -0.010392189025878906, -0.007343292236328125, -0.004294395446777344, -0.0012454986572265625, 0.0018033981323242188, 0.004852294921875, 0.007901191711425781, 0.010950088500976562, 0.013998985290527344, 0.017047882080078125, 0.020096778869628906, 0.023145675659179688, 0.02619457244873047, 0.02924346923828125, 0.03229236602783203, 0.03534126281738281, 0.038390159606933594, 0.041439056396484375, 0.044487953186035156, 0.04753684997558594, 0.05058574676513672, 0.0536346435546875, 0.05668354034423828, 0.05973243713378906, 0.06278133392333984, 0.06583023071289062, 0.0688791275024414, 0.07192802429199219, 0.07497692108154297, 0.07802581787109375, 0.08107471466064453, 0.08412361145019531, 0.0871725082397461, 0.09022140502929688, 0.09327030181884766, 0.09631919860839844, 0.09936809539794922, 0.1024169921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 6.0, 2.0, 11.0, 15.0, 18.0, 25.0, 51.0, 73.0, 149.0, 230.0, 418.0, 905.0, 1862.0, 4147.0, 10081.0, 29545.0, 140246.0, 608755.0, 194588.0, 36554.0, 11904.0, 4734.0, 2126.0, 964.0, 517.0, 235.0, 147.0, 89.0, 49.0, 26.0, 27.0, 16.0, 11.0, 4.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.38427734375, -0.3734779357910156, -0.36267852783203125, -0.3518791198730469, -0.3410797119140625, -0.3302803039550781, -0.31948089599609375, -0.3086814880371094, -0.297882080078125, -0.2870826721191406, -0.27628326416015625, -0.2654838562011719, -0.2546844482421875, -0.24388504028320312, -0.23308563232421875, -0.22228622436523438, -0.21148681640625, -0.20068740844726562, -0.18988800048828125, -0.17908859252929688, -0.1682891845703125, -0.15748977661132812, -0.14669036865234375, -0.13589096069335938, -0.125091552734375, -0.11429214477539062, -0.10349273681640625, -0.09269332885742188, -0.0818939208984375, -0.07109451293945312, -0.06029510498046875, -0.049495697021484375, -0.0386962890625, -0.027896881103515625, -0.01709747314453125, -0.006298065185546875, 0.0045013427734375, 0.015300750732421875, 0.02610015869140625, 0.036899566650390625, 0.047698974609375, 0.058498382568359375, 0.06929779052734375, 0.08009719848632812, 0.0908966064453125, 0.10169601440429688, 0.11249542236328125, 0.12329483032226562, 0.13409423828125, 0.14489364624023438, 0.15569305419921875, 0.16649246215820312, 0.1772918701171875, 0.18809127807617188, 0.19889068603515625, 0.20969009399414062, 0.220489501953125, 0.23128890991210938, 0.24208831787109375, 0.2528877258300781, 0.2636871337890625, 0.2744865417480469, 0.28528594970703125, 0.2960853576660156, 0.306884765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 6.0, 5.0, 16.0, 8.0, 8.0, 13.0, 23.0, 15.0, 19.0, 30.0, 24.0, 25.0, 21.0, 35.0, 36.0, 44.0, 37.0, 33.0, 61.0, 40.0, 49.0, 39.0, 41.0, 39.0, 36.0, 30.0, 36.0, 20.0, 27.0, 20.0, 19.0, 28.0, 20.0, 20.0, 13.0, 10.0, 6.0, 9.0, 8.0, 5.0, 8.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.280517578125, -0.27118682861328125, -0.2618560791015625, -0.25252532958984375, -0.243194580078125, -0.23386383056640625, -0.2245330810546875, -0.21520233154296875, -0.20587158203125, -0.19654083251953125, -0.1872100830078125, -0.17787933349609375, -0.168548583984375, -0.15921783447265625, -0.1498870849609375, -0.14055633544921875, -0.1312255859375, -0.12189483642578125, -0.1125640869140625, -0.10323333740234375, -0.093902587890625, -0.08457183837890625, -0.0752410888671875, -0.06591033935546875, -0.05657958984375, -0.04724884033203125, -0.0379180908203125, -0.02858734130859375, -0.019256591796875, -0.00992584228515625, -0.0005950927734375, 0.00873565673828125, 0.01806640625, 0.02739715576171875, 0.0367279052734375, 0.04605865478515625, 0.055389404296875, 0.06472015380859375, 0.0740509033203125, 0.08338165283203125, 0.09271240234375, 0.10204315185546875, 0.1113739013671875, 0.12070465087890625, 0.130035400390625, 0.13936614990234375, 0.1486968994140625, 0.15802764892578125, 0.1673583984375, 0.17668914794921875, 0.1860198974609375, 0.19535064697265625, 0.204681396484375, 0.21401214599609375, 0.2233428955078125, 0.23267364501953125, 0.24200439453125, 0.25133514404296875, 0.2606658935546875, 0.26999664306640625, 0.279327392578125, 0.28865814208984375, 0.2979888916015625, 0.30731964111328125, 0.316650390625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 15.0, 13.0, 23.0, 30.0, 43.0, 82.0, 136.0, 221.0, 476.0, 924.0, 1824.0, 3901.0, 8697.0, 20349.0, 53922.0, 179532.0, 486835.0, 195224.0, 57679.0, 21448.0, 9070.0, 4096.0, 1987.0, 907.0, 498.0, 276.0, 139.0, 75.0, 48.0, 32.0, 17.0, 14.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11871337890625, -0.11494827270507812, -0.11118316650390625, -0.10741806030273438, -0.1036529541015625, -0.09988784790039062, -0.09612274169921875, -0.09235763549804688, -0.088592529296875, -0.08482742309570312, -0.08106231689453125, -0.07729721069335938, -0.0735321044921875, -0.06976699829101562, -0.06600189208984375, -0.062236785888671875, -0.0584716796875, -0.054706573486328125, -0.05094146728515625, -0.047176361083984375, -0.0434112548828125, -0.039646148681640625, -0.03588104248046875, -0.032115936279296875, -0.028350830078125, -0.024585723876953125, -0.02082061767578125, -0.017055511474609375, -0.0132904052734375, -0.009525299072265625, -0.00576019287109375, -0.001995086669921875, 0.00177001953125, 0.005535125732421875, 0.00930023193359375, 0.013065338134765625, 0.0168304443359375, 0.020595550537109375, 0.02436065673828125, 0.028125762939453125, 0.031890869140625, 0.035655975341796875, 0.03942108154296875, 0.043186187744140625, 0.0469512939453125, 0.050716400146484375, 0.05448150634765625, 0.058246612548828125, 0.06201171875, 0.06577682495117188, 0.06954193115234375, 0.07330703735351562, 0.0770721435546875, 0.08083724975585938, 0.08460235595703125, 0.08836746215820312, 0.092132568359375, 0.09589767456054688, 0.09966278076171875, 0.10342788696289062, 0.1071929931640625, 0.11095809936523438, 0.11472320556640625, 0.11848831176757812, 0.12225341796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 9.0, 8.0, 15.0, 26.0, 33.0, 77.0, 161.0, 234.0, 193.0, 104.0, 71.0, 13.0, 12.0, 11.0, 10.0, 11.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.655122756958008e-05, -4.480872303247452e-05, -4.306621849536896e-05, -4.13237139582634e-05, -3.958120942115784e-05, -3.7838704884052277e-05, -3.6096200346946716e-05, -3.4353695809841156e-05, -3.2611191272735596e-05, -3.0868686735630035e-05, -2.9126182198524475e-05, -2.7383677661418915e-05, -2.5641173124313354e-05, -2.3898668587207794e-05, -2.2156164050102234e-05, -2.0413659512996674e-05, -1.8671154975891113e-05, -1.6928650438785553e-05, -1.5186145901679993e-05, -1.3443641364574432e-05, -1.1701136827468872e-05, -9.958632290363312e-06, -8.216127753257751e-06, -6.473623216152191e-06, -4.731118679046631e-06, -2.9886141419410706e-06, -1.2461096048355103e-06, 4.9639493227005e-07, 2.2388994693756104e-06, 3.981404006481171e-06, 5.723908543586731e-06, 7.466413080692291e-06, 9.208917617797852e-06, 1.0951422154903412e-05, 1.2693926692008972e-05, 1.4436431229114532e-05, 1.6178935766220093e-05, 1.7921440303325653e-05, 1.9663944840431213e-05, 2.1406449377536774e-05, 2.3148953914642334e-05, 2.4891458451747894e-05, 2.6633962988853455e-05, 2.8376467525959015e-05, 3.0118972063064575e-05, 3.1861476600170135e-05, 3.3603981137275696e-05, 3.5346485674381256e-05, 3.7088990211486816e-05, 3.883149474859238e-05, 4.057399928569794e-05, 4.23165038228035e-05, 4.405900835990906e-05, 4.580151289701462e-05, 4.754401743412018e-05, 4.928652197122574e-05, 5.10290265083313e-05, 5.277153104543686e-05, 5.451403558254242e-05, 5.625654011964798e-05, 5.799904465675354e-05, 5.97415491938591e-05, 6.148405373096466e-05, 6.322655826807022e-05, 6.496906280517578e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 4.0, 8.0, 13.0, 13.0, 18.0, 18.0, 39.0, 56.0, 96.0, 124.0, 176.0, 264.0, 372.0, 630.0, 1014.0, 1852.0, 3645.0, 7375.0, 17374.0, 45431.0, 139766.0, 387898.0, 292887.0, 92529.0, 31961.0, 12584.0, 5744.0, 2823.0, 1454.0, 871.0, 470.0, 354.0, 206.0, 137.0, 99.0, 77.0, 57.0, 38.0, 23.0, 20.0, 10.0, 9.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1021728515625, -0.09885787963867188, -0.09554290771484375, -0.09222793579101562, -0.0889129638671875, -0.08559799194335938, -0.08228302001953125, -0.07896804809570312, -0.075653076171875, -0.07233810424804688, -0.06902313232421875, -0.06570816040039062, -0.0623931884765625, -0.059078216552734375, -0.05576324462890625, -0.052448272705078125, -0.04913330078125, -0.045818328857421875, -0.04250335693359375, -0.039188385009765625, -0.0358734130859375, -0.032558441162109375, -0.02924346923828125, -0.025928497314453125, -0.022613525390625, -0.019298553466796875, -0.01598358154296875, -0.012668609619140625, -0.0093536376953125, -0.006038665771484375, -0.00272369384765625, 0.000591278076171875, 0.00390625, 0.007221221923828125, 0.01053619384765625, 0.013851165771484375, 0.0171661376953125, 0.020481109619140625, 0.02379608154296875, 0.027111053466796875, 0.030426025390625, 0.033740997314453125, 0.03705596923828125, 0.040370941162109375, 0.0436859130859375, 0.047000885009765625, 0.05031585693359375, 0.053630828857421875, 0.05694580078125, 0.060260772705078125, 0.06357574462890625, 0.06689071655273438, 0.0702056884765625, 0.07352066040039062, 0.07683563232421875, 0.08015060424804688, 0.083465576171875, 0.08678054809570312, 0.09009552001953125, 0.09341049194335938, 0.0967254638671875, 0.10004043579101562, 0.10335540771484375, 0.10667037963867188, 0.1099853515625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 6.0, 12.0, 12.0, 11.0, 11.0, 29.0, 40.0, 49.0, 76.0, 73.0, 107.0, 106.0, 95.0, 92.0, 83.0, 58.0, 44.0, 31.0, 16.0, 12.0, 10.0, 6.0, 7.0, 5.0, 5.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1246337890625, -0.12082958221435547, -0.11702537536621094, -0.1132211685180664, -0.10941696166992188, -0.10561275482177734, -0.10180854797363281, -0.09800434112548828, -0.09420013427734375, -0.09039592742919922, -0.08659172058105469, -0.08278751373291016, -0.07898330688476562, -0.0751791000366211, -0.07137489318847656, -0.06757068634033203, -0.0637664794921875, -0.05996227264404297, -0.05615806579589844, -0.052353858947753906, -0.048549652099609375, -0.044745445251464844, -0.04094123840332031, -0.03713703155517578, -0.03333282470703125, -0.02952861785888672, -0.025724411010742188, -0.021920204162597656, -0.018115997314453125, -0.014311790466308594, -0.010507583618164062, -0.006703376770019531, -0.002899169921875, 0.0009050369262695312, 0.0047092437744140625, 0.008513450622558594, 0.012317657470703125, 0.016121864318847656, 0.019926071166992188, 0.02373027801513672, 0.02753448486328125, 0.03133869171142578, 0.03514289855957031, 0.038947105407714844, 0.042751312255859375, 0.046555519104003906, 0.05035972595214844, 0.05416393280029297, 0.0579681396484375, 0.06177234649658203, 0.06557655334472656, 0.0693807601928711, 0.07318496704101562, 0.07698917388916016, 0.08079338073730469, 0.08459758758544922, 0.08840179443359375, 0.09220600128173828, 0.09601020812988281, 0.09981441497802734, 0.10361862182617188, 0.1074228286743164, 0.11122703552246094, 0.11503124237060547, 0.11883544921875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 9.0, 15.0, 19.0, 40.0, 52.0, 70.0, 88.0, 95.0, 104.0, 110.0, 105.0, 82.0, 81.0, 43.0, 22.0, 13.0, 18.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.081995964050293, -1.046774983406067, -1.0115540027618408, -0.9763329029083252, -0.9411119222640991, -0.905890941619873, -0.8706699013710022, -0.8354488611221313, -0.8002278804779053, -0.7650068998336792, -0.7297858595848083, -0.6945648193359375, -0.6593438386917114, -0.6241228580474854, -0.5889018177986145, -0.5536807775497437, -0.5184597969055176, -0.4832387864589691, -0.44801777601242065, -0.4127967655658722, -0.37757575511932373, -0.34235474467277527, -0.3071337342262268, -0.27191272377967834, -0.23669171333312988, -0.20147070288658142, -0.16624969244003296, -0.1310286819934845, -0.09580767154693604, -0.06058666110038757, -0.02536565065383911, 0.00985535979270935, 0.04507637023925781, 0.08029738068580627, 0.11551839113235474, 0.1507394015789032, 0.18596041202545166, 0.22118142247200012, 0.2564024329185486, 0.29162344336509705, 0.3268444538116455, 0.36206546425819397, 0.39728647470474243, 0.4325074851512909, 0.46772849559783936, 0.5029494762420654, 0.5381705164909363, 0.5733915567398071, 0.6086125373840332, 0.6438335180282593, 0.6790545582771301, 0.714275598526001, 0.749496579170227, 0.7847175598144531, 0.819938600063324, 0.8551596403121948, 0.8903806209564209, 0.925601601600647, 0.9608226418495178, 0.9960436820983887, 1.0312646627426147, 1.0664856433868408, 1.1017067432403564, 1.1369277238845825, 1.1721487045288086]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 6.0, 10.0, 16.0, 10.0, 9.0, 15.0, 23.0, 31.0, 26.0, 27.0, 29.0, 29.0, 35.0, 33.0, 36.0, 49.0, 31.0, 29.0, 41.0, 28.0, 39.0, 40.0, 44.0, 40.0, 33.0, 29.0, 29.0, 37.0, 29.0, 20.0, 26.0, 21.0, 18.0, 15.0, 6.0, 6.0, 15.0, 7.0, 7.0, 4.0, 3.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7232616543769836, -0.6990386247634888, -0.6748155951499939, -0.650592565536499, -0.6263695359230042, -0.6021465063095093, -0.5779235363006592, -0.5537004470825195, -0.5294774770736694, -0.5052544474601746, -0.4810314178466797, -0.4568083882331848, -0.43258535861968994, -0.40836232900619507, -0.3841393291950226, -0.3599162995815277, -0.33569324016571045, -0.3114702105522156, -0.2872471809387207, -0.26302415132522583, -0.23880113661289215, -0.21457810699939728, -0.1903550922870636, -0.16613206267356873, -0.14190903306007385, -0.11768600344657898, -0.0934629812836647, -0.06923995912075043, -0.045016929507255554, -0.02079389989376068, 0.003429114818572998, 0.02765214443206787, 0.051875174045562744, 0.07609820365905762, 0.1003212258219719, 0.12454424798488617, 0.14876727759838104, 0.17299030721187592, 0.1972133219242096, 0.22143635153770447, 0.24565938115119934, 0.2698824107646942, 0.2941054403781891, 0.3183284401893616, 0.34255146980285645, 0.3667744994163513, 0.3909975290298462, 0.41522055864334106, 0.43944358825683594, 0.4636666178703308, 0.4878896474838257, 0.5121126770973206, 0.5363357067108154, 0.5605587363243103, 0.5847817659378052, 0.6090047359466553, 0.6332278251647949, 0.6574508547782898, 0.6816738843917847, 0.7058969140052795, 0.7301199436187744, 0.7543429732322693, 0.7785660028457642, 0.8027889728546143, 0.8270120024681091]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 7.0, 6.0, 14.0, 20.0, 26.0, 53.0, 56.0, 72.0, 148.0, 207.0, 317.0, 549.0, 920.0, 1724.0, 3318.0, 6907.0, 14464.0, 35035.0, 87020.0, 247254.0, 878120.0, 1955461.0, 646171.0, 192525.0, 69884.0, 28841.0, 12506.0, 5884.0, 2959.0, 1586.0, 880.0, 477.0, 297.0, 192.0, 128.0, 74.0, 66.0, 43.0, 27.0, 28.0, 7.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.153564453125, -0.14815521240234375, -0.1427459716796875, -0.13733673095703125, -0.131927490234375, -0.12651824951171875, -0.1211090087890625, -0.11569976806640625, -0.11029052734375, -0.10488128662109375, -0.0994720458984375, -0.09406280517578125, -0.088653564453125, -0.08324432373046875, -0.0778350830078125, -0.07242584228515625, -0.0670166015625, -0.06160736083984375, -0.0561981201171875, -0.05078887939453125, -0.045379638671875, -0.03997039794921875, -0.0345611572265625, -0.02915191650390625, -0.02374267578125, -0.01833343505859375, -0.0129241943359375, -0.00751495361328125, -0.002105712890625, 0.00330352783203125, 0.0087127685546875, 0.01412200927734375, 0.01953125, 0.02494049072265625, 0.0303497314453125, 0.03575897216796875, 0.041168212890625, 0.04657745361328125, 0.0519866943359375, 0.05739593505859375, 0.06280517578125, 0.06821441650390625, 0.0736236572265625, 0.07903289794921875, 0.084442138671875, 0.08985137939453125, 0.0952606201171875, 0.10066986083984375, 0.1060791015625, 0.11148834228515625, 0.1168975830078125, 0.12230682373046875, 0.127716064453125, 0.13312530517578125, 0.1385345458984375, 0.14394378662109375, 0.14935302734375, 0.15476226806640625, 0.1601715087890625, 0.16558074951171875, 0.170989990234375, 0.17639923095703125, 0.1818084716796875, 0.18721771240234375, 0.192626953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 7.0, 11.0, 9.0, 7.0, 16.0, 17.0, 19.0, 33.0, 22.0, 35.0, 40.0, 34.0, 31.0, 46.0, 29.0, 44.0, 37.0, 43.0, 48.0, 37.0, 49.0, 41.0, 46.0, 43.0, 47.0, 20.0, 26.0, 16.0, 17.0, 24.0, 18.0, 10.0, 12.0, 15.0, 5.0, 5.0, 3.0, 8.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.11199951171875, -0.10868549346923828, -0.10537147521972656, -0.10205745697021484, -0.09874343872070312, -0.0954294204711914, -0.09211540222167969, -0.08880138397216797, -0.08548736572265625, -0.08217334747314453, -0.07885932922363281, -0.0755453109741211, -0.07223129272460938, -0.06891727447509766, -0.06560325622558594, -0.06228923797607422, -0.0589752197265625, -0.05566120147705078, -0.05234718322753906, -0.049033164978027344, -0.045719146728515625, -0.042405128479003906, -0.03909111022949219, -0.03577709197998047, -0.03246307373046875, -0.02914905548095703, -0.025835037231445312, -0.022521018981933594, -0.019207000732421875, -0.015892982482910156, -0.012578964233398438, -0.009264945983886719, -0.005950927734375, -0.0026369094848632812, 0.0006771087646484375, 0.003991127014160156, 0.007305145263671875, 0.010619163513183594, 0.013933181762695312, 0.01724720001220703, 0.02056121826171875, 0.02387523651123047, 0.027189254760742188, 0.030503273010253906, 0.033817291259765625, 0.037131309509277344, 0.04044532775878906, 0.04375934600830078, 0.0470733642578125, 0.05038738250732422, 0.05370140075683594, 0.057015419006347656, 0.060329437255859375, 0.0636434555053711, 0.06695747375488281, 0.07027149200439453, 0.07358551025390625, 0.07689952850341797, 0.08021354675292969, 0.0835275650024414, 0.08684158325195312, 0.09015560150146484, 0.09346961975097656, 0.09678363800048828, 0.10009765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 4.0, 6.0, 7.0, 9.0, 14.0, 16.0, 23.0, 22.0, 21.0, 27.0, 45.0, 66.0, 106.0, 148.0, 242.0, 420.0, 774.0, 1754.0, 4185.0, 12381.0, 40927.0, 166525.0, 960806.0, 2495399.0, 391180.0, 84165.0, 22562.0, 7071.0, 2748.0, 1173.0, 591.0, 321.0, 179.0, 97.0, 79.0, 45.0, 37.0, 13.0, 23.0, 19.0, 12.0, 7.0, 5.0, 6.0, 6.0, 8.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.275146484375, -0.26467132568359375, -0.2541961669921875, -0.24372100830078125, -0.233245849609375, -0.22277069091796875, -0.2122955322265625, -0.20182037353515625, -0.19134521484375, -0.18087005615234375, -0.1703948974609375, -0.15991973876953125, -0.149444580078125, -0.13896942138671875, -0.1284942626953125, -0.11801910400390625, -0.1075439453125, -0.09706878662109375, -0.0865936279296875, -0.07611846923828125, -0.065643310546875, -0.05516815185546875, -0.0446929931640625, -0.03421783447265625, -0.02374267578125, -0.01326751708984375, -0.0027923583984375, 0.00768280029296875, 0.018157958984375, 0.02863311767578125, 0.0391082763671875, 0.04958343505859375, 0.06005859375, 0.07053375244140625, 0.0810089111328125, 0.09148406982421875, 0.101959228515625, 0.11243438720703125, 0.1229095458984375, 0.13338470458984375, 0.14385986328125, 0.15433502197265625, 0.1648101806640625, 0.17528533935546875, 0.185760498046875, 0.19623565673828125, 0.2067108154296875, 0.21718597412109375, 0.2276611328125, 0.23813629150390625, 0.2486114501953125, 0.25908660888671875, 0.269561767578125, 0.28003692626953125, 0.2905120849609375, 0.30098724365234375, 0.31146240234375, 0.32193756103515625, 0.3324127197265625, 0.34288787841796875, 0.353363037109375, 0.36383819580078125, 0.3743133544921875, 0.38478851318359375, 0.395263671875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 8.0, 7.0, 18.0, 24.0, 39.0, 49.0, 77.0, 95.0, 154.0, 209.0, 364.0, 630.0, 882.0, 618.0, 304.0, 220.0, 139.0, 80.0, 57.0, 37.0, 33.0, 13.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.460693359375, -0.44899749755859375, -0.4373016357421875, -0.42560577392578125, -0.413909912109375, -0.40221405029296875, -0.3905181884765625, -0.37882232666015625, -0.36712646484375, -0.35543060302734375, -0.3437347412109375, -0.33203887939453125, -0.320343017578125, -0.30864715576171875, -0.2969512939453125, -0.28525543212890625, -0.2735595703125, -0.26186370849609375, -0.2501678466796875, -0.23847198486328125, -0.226776123046875, -0.21508026123046875, -0.2033843994140625, -0.19168853759765625, -0.17999267578125, -0.16829681396484375, -0.1566009521484375, -0.14490509033203125, -0.133209228515625, -0.12151336669921875, -0.1098175048828125, -0.09812164306640625, -0.08642578125, -0.07472991943359375, -0.0630340576171875, -0.05133819580078125, -0.039642333984375, -0.02794647216796875, -0.0162506103515625, -0.00455474853515625, 0.00714111328125, 0.01883697509765625, 0.0305328369140625, 0.04222869873046875, 0.053924560546875, 0.06562042236328125, 0.0773162841796875, 0.08901214599609375, 0.1007080078125, 0.11240386962890625, 0.1240997314453125, 0.13579559326171875, 0.147491455078125, 0.15918731689453125, 0.1708831787109375, 0.18257904052734375, 0.19427490234375, 0.20597076416015625, 0.2176666259765625, 0.22936248779296875, 0.241058349609375, 0.25275421142578125, 0.2644500732421875, 0.27614593505859375, 0.287841796875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 17.0, 46.0, 92.0, 166.0, 208.0, 193.0, 130.0, 77.0, 37.0, 10.0, 3.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6999917030334473, -2.607011318206787, -2.514031171798706, -2.421050786972046, -2.328070640563965, -2.2350902557373047, -2.1421101093292236, -2.0491297245025635, -1.9561495780944824, -1.8631693124771118, -1.7701890468597412, -1.6772087812423706, -1.584228515625, -1.4912482500076294, -1.3982679843902588, -1.3052875995635986, -1.212307333946228, -1.1193270683288574, -1.0263468027114868, -0.9333665370941162, -0.8403862714767456, -0.747406005859375, -0.6544256806373596, -0.561445415019989, -0.4684651494026184, -0.3754848837852478, -0.2825046181678772, -0.1895243227481842, -0.0965440571308136, -0.003563791513442993, 0.08941650390625, 0.1823967695236206, 0.2753770351409912, 0.3683573007583618, 0.4613375663757324, 0.554317831993103, 0.6472980976104736, 0.7402783632278442, 0.8332586884498596, 0.9262389540672302, 1.019219160079956, 1.1121994256973267, 1.2051796913146973, 1.2981599569320679, 1.3911402225494385, 1.484120488166809, 1.5771007537841797, 1.6700811386108398, 1.7630614042282104, 1.856041669845581, 1.9490219354629517, 2.0420022010803223, 2.1349825859069824, 2.2279627323150635, 2.3209431171417236, 2.4139232635498047, 2.506903648376465, 2.599884033203125, 2.692864179611206, 2.785844564437866, 2.8788247108459473, 2.9718050956726074, 3.0647852420806885, 3.1577656269073486, 3.2507457733154297]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 9.0, 9.0, 12.0, 13.0, 9.0, 24.0, 15.0, 14.0, 19.0, 23.0, 28.0, 29.0, 37.0, 34.0, 28.0, 46.0, 37.0, 47.0, 34.0, 42.0, 35.0, 42.0, 39.0, 38.0, 37.0, 28.0, 21.0, 23.0, 23.0, 27.0, 21.0, 22.0, 16.0, 16.0, 15.0, 16.0, 13.0, 13.0, 5.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.8448373079299927, -0.8209336400032043, -0.7970299124717712, -0.7731262445449829, -0.7492225170135498, -0.7253188490867615, -0.7014151811599731, -0.67751145362854, -0.6536077857017517, -0.6297041177749634, -0.6058003902435303, -0.5818967223167419, -0.5579930543899536, -0.5340893268585205, -0.5101856589317322, -0.48628196120262146, -0.46237826347351074, -0.4384745657444, -0.4145708680152893, -0.390667200088501, -0.36676350235939026, -0.34285980463027954, -0.3189561367034912, -0.2950524389743805, -0.2711487412452698, -0.24724504351615906, -0.22334136068820953, -0.19943767786026, -0.1755339801311493, -0.15163028240203857, -0.12772659957408905, -0.10382291674613953, -0.07991921901702881, -0.05601552873849869, -0.03211183845996857, -0.008208148181438446, 0.015695542097091675, 0.039599232375621796, 0.06350292265415192, 0.08740660548210144, 0.11131030321121216, 0.13521400094032288, 0.1591176837682724, 0.18302136659622192, 0.20692506432533264, 0.23082876205444336, 0.2547324299812317, 0.2786361277103424, 0.3025398254394531, 0.32644352316856384, 0.35034722089767456, 0.3742508888244629, 0.3981545865535736, 0.4220582842826843, 0.44596195220947266, 0.4698656499385834, 0.4937693476676941, 0.5176730155944824, 0.5415767431259155, 0.5654804110527039, 0.5893840789794922, 0.6132878065109253, 0.6371914744377136, 0.661095142364502, 0.6849988698959351]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 7.0, 17.0, 17.0, 27.0, 50.0, 88.0, 112.0, 186.0, 275.0, 448.0, 672.0, 1062.0, 1529.0, 2373.0, 3487.0, 4953.0, 7666.0, 11923.0, 22117.0, 52456.0, 180364.0, 445955.0, 197235.0, 56366.0, 23275.0, 12414.0, 7759.0, 5157.0, 3534.0, 2436.0, 1574.0, 1052.0, 731.0, 465.0, 276.0, 207.0, 108.0, 54.0, 43.0, 32.0, 24.0, 8.0, 12.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.298095703125, -0.2899360656738281, -0.28177642822265625, -0.2736167907714844, -0.2654571533203125, -0.2572975158691406, -0.24913787841796875, -0.24097824096679688, -0.232818603515625, -0.22465896606445312, -0.21649932861328125, -0.20833969116210938, -0.2001800537109375, -0.19202041625976562, -0.18386077880859375, -0.17570114135742188, -0.16754150390625, -0.15938186645507812, -0.15122222900390625, -0.14306259155273438, -0.1349029541015625, -0.12674331665039062, -0.11858367919921875, -0.11042404174804688, -0.102264404296875, -0.09410476684570312, -0.08594512939453125, -0.07778549194335938, -0.0696258544921875, -0.061466217041015625, -0.05330657958984375, -0.045146942138671875, -0.0369873046875, -0.028827667236328125, -0.02066802978515625, -0.012508392333984375, -0.0043487548828125, 0.003810882568359375, 0.01197052001953125, 0.020130157470703125, 0.028289794921875, 0.036449432373046875, 0.04460906982421875, 0.052768707275390625, 0.0609283447265625, 0.06908798217773438, 0.07724761962890625, 0.08540725708007812, 0.09356689453125, 0.10172653198242188, 0.10988616943359375, 0.11804580688476562, 0.1262054443359375, 0.13436508178710938, 0.14252471923828125, 0.15068435668945312, 0.158843994140625, 0.16700363159179688, 0.17516326904296875, 0.18332290649414062, 0.1914825439453125, 0.19964218139648438, 0.20780181884765625, 0.21596145629882812, 0.22412109375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 8.0, 7.0, 9.0, 5.0, 8.0, 19.0, 14.0, 21.0, 19.0, 15.0, 27.0, 28.0, 31.0, 23.0, 31.0, 39.0, 36.0, 49.0, 40.0, 37.0, 43.0, 39.0, 49.0, 35.0, 34.0, 36.0, 36.0, 38.0, 35.0, 27.0, 16.0, 15.0, 20.0, 19.0, 12.0, 9.0, 12.0, 6.0, 11.0, 8.0, 6.0, 9.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0], "bins": [-0.1163330078125, -0.11287498474121094, -0.10941696166992188, -0.10595893859863281, -0.10250091552734375, -0.09904289245605469, -0.09558486938476562, -0.09212684631347656, -0.0886688232421875, -0.08521080017089844, -0.08175277709960938, -0.07829475402832031, -0.07483673095703125, -0.07137870788574219, -0.06792068481445312, -0.06446266174316406, -0.061004638671875, -0.05754661560058594, -0.054088592529296875, -0.05063056945800781, -0.04717254638671875, -0.04371452331542969, -0.040256500244140625, -0.03679847717285156, -0.0333404541015625, -0.029882431030273438, -0.026424407958984375, -0.022966384887695312, -0.01950836181640625, -0.016050338745117188, -0.012592315673828125, -0.009134292602539062, -0.00567626953125, -0.0022182464599609375, 0.001239776611328125, 0.0046977996826171875, 0.00815582275390625, 0.011613845825195312, 0.015071868896484375, 0.018529891967773438, 0.0219879150390625, 0.025445938110351562, 0.028903961181640625, 0.03236198425292969, 0.03582000732421875, 0.03927803039550781, 0.042736053466796875, 0.04619407653808594, 0.049652099609375, 0.05311012268066406, 0.056568145751953125, 0.06002616882324219, 0.06348419189453125, 0.06694221496582031, 0.07040023803710938, 0.07385826110839844, 0.0773162841796875, 0.08077430725097656, 0.08423233032226562, 0.08769035339355469, 0.09114837646484375, 0.09460639953613281, 0.09806442260742188, 0.10152244567871094, 0.10498046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 12.0, 16.0, 16.0, 21.0, 27.0, 46.0, 62.0, 81.0, 164.0, 285.0, 513.0, 994.0, 2072.0, 4699.0, 10768.0, 25704.0, 77331.0, 493232.0, 337383.0, 57585.0, 20928.0, 8975.0, 3896.0, 1769.0, 863.0, 399.0, 243.0, 148.0, 100.0, 58.0, 42.0, 25.0, 21.0, 20.0, 13.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.368408203125, -0.3556556701660156, -0.34290313720703125, -0.3301506042480469, -0.3173980712890625, -0.3046455383300781, -0.29189300537109375, -0.2791404724121094, -0.266387939453125, -0.2536354064941406, -0.24088287353515625, -0.22813034057617188, -0.2153778076171875, -0.20262527465820312, -0.18987274169921875, -0.17712020874023438, -0.16436767578125, -0.15161514282226562, -0.13886260986328125, -0.12611007690429688, -0.1133575439453125, -0.10060501098632812, -0.08785247802734375, -0.07509994506835938, -0.062347412109375, -0.049594879150390625, -0.03684234619140625, -0.024089813232421875, -0.0113372802734375, 0.001415252685546875, 0.01416778564453125, 0.026920318603515625, 0.0396728515625, 0.052425384521484375, 0.06517791748046875, 0.07793045043945312, 0.0906829833984375, 0.10343551635742188, 0.11618804931640625, 0.12894058227539062, 0.141693115234375, 0.15444564819335938, 0.16719818115234375, 0.17995071411132812, 0.1927032470703125, 0.20545578002929688, 0.21820831298828125, 0.23096084594726562, 0.24371337890625, 0.2564659118652344, 0.26921844482421875, 0.2819709777832031, 0.2947235107421875, 0.3074760437011719, 0.32022857666015625, 0.3329811096191406, 0.345733642578125, 0.3584861755371094, 0.37123870849609375, 0.3839912414550781, 0.3967437744140625, 0.4094963073730469, 0.42224884033203125, 0.4350013732910156, 0.44775390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 6.0, 5.0, 8.0, 12.0, 13.0, 10.0, 23.0, 18.0, 15.0, 27.0, 22.0, 32.0, 22.0, 44.0, 42.0, 43.0, 38.0, 47.0, 44.0, 57.0, 49.0, 51.0, 47.0, 44.0, 41.0, 36.0, 33.0, 31.0, 18.0, 15.0, 19.0, 20.0, 10.0, 10.0, 8.0, 10.0, 7.0, 5.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3037109375, -0.29177093505859375, -0.2798309326171875, -0.26789093017578125, -0.255950927734375, -0.24401092529296875, -0.2320709228515625, -0.22013092041015625, -0.20819091796875, -0.19625091552734375, -0.1843109130859375, -0.17237091064453125, -0.160430908203125, -0.14849090576171875, -0.1365509033203125, -0.12461090087890625, -0.1126708984375, -0.10073089599609375, -0.0887908935546875, -0.07685089111328125, -0.064910888671875, -0.05297088623046875, -0.0410308837890625, -0.02909088134765625, -0.01715087890625, -0.00521087646484375, 0.0067291259765625, 0.01866912841796875, 0.030609130859375, 0.04254913330078125, 0.0544891357421875, 0.06642913818359375, 0.078369140625, 0.09030914306640625, 0.1022491455078125, 0.11418914794921875, 0.126129150390625, 0.13806915283203125, 0.1500091552734375, 0.16194915771484375, 0.17388916015625, 0.18582916259765625, 0.1977691650390625, 0.20970916748046875, 0.221649169921875, 0.23358917236328125, 0.2455291748046875, 0.25746917724609375, 0.2694091796875, 0.28134918212890625, 0.2932891845703125, 0.30522918701171875, 0.317169189453125, 0.32910919189453125, 0.3410491943359375, 0.35298919677734375, 0.36492919921875, 0.37686920166015625, 0.3888092041015625, 0.40074920654296875, 0.412689208984375, 0.42462921142578125, 0.4365692138671875, 0.44850921630859375, 0.46044921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 14.0, 11.0, 17.0, 17.0, 47.0, 82.0, 122.0, 174.0, 267.0, 505.0, 921.0, 1517.0, 2891.0, 4959.0, 9342.0, 18558.0, 41000.0, 119825.0, 476711.0, 250341.0, 66053.0, 26951.0, 12733.0, 6798.0, 3757.0, 2136.0, 1141.0, 673.0, 397.0, 228.0, 133.0, 80.0, 56.0, 32.0, 16.0, 15.0, 8.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.14501953125, -0.14072227478027344, -0.13642501831054688, -0.1321277618408203, -0.12783050537109375, -0.12353324890136719, -0.11923599243164062, -0.11493873596191406, -0.1106414794921875, -0.10634422302246094, -0.10204696655273438, -0.09774971008300781, -0.09345245361328125, -0.08915519714355469, -0.08485794067382812, -0.08056068420410156, -0.076263427734375, -0.07196617126464844, -0.06766891479492188, -0.06337165832519531, -0.05907440185546875, -0.05477714538574219, -0.050479888916015625, -0.04618263244628906, -0.0418853759765625, -0.03758811950683594, -0.033290863037109375, -0.028993606567382812, -0.02469635009765625, -0.020399093627929688, -0.016101837158203125, -0.011804580688476562, -0.00750732421875, -0.0032100677490234375, 0.001087188720703125, 0.0053844451904296875, 0.00968170166015625, 0.013978958129882812, 0.018276214599609375, 0.022573471069335938, 0.0268707275390625, 0.031167984008789062, 0.035465240478515625, 0.03976249694824219, 0.04405975341796875, 0.04835700988769531, 0.052654266357421875, 0.05695152282714844, 0.061248779296875, 0.06554603576660156, 0.06984329223632812, 0.07414054870605469, 0.07843780517578125, 0.08273506164550781, 0.08703231811523438, 0.09132957458496094, 0.0956268310546875, 0.09992408752441406, 0.10422134399414062, 0.10851860046386719, 0.11281585693359375, 0.11711311340332031, 0.12141036987304688, 0.12570762634277344, 0.1300048828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 4.0, 12.0, 12.0, 12.0, 28.0, 30.0, 82.0, 148.0, 196.0, 200.0, 97.0, 49.0, 37.0, 19.0, 9.0, 11.0, 9.0, 10.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5180320739746094e-05, -4.349276423454285e-05, -4.18052077293396e-05, -4.011765122413635e-05, -3.8430094718933105e-05, -3.674253821372986e-05, -3.505498170852661e-05, -3.3367425203323364e-05, -3.167986869812012e-05, -2.999231219291687e-05, -2.8304755687713623e-05, -2.6617199182510376e-05, -2.492964267730713e-05, -2.3242086172103882e-05, -2.1554529666900635e-05, -1.9866973161697388e-05, -1.817941665649414e-05, -1.6491860151290894e-05, -1.4804303646087646e-05, -1.31167471408844e-05, -1.1429190635681152e-05, -9.741634130477905e-06, -8.054077625274658e-06, -6.366521120071411e-06, -4.678964614868164e-06, -2.991408109664917e-06, -1.30385160446167e-06, 3.8370490074157715e-07, 2.0712614059448242e-06, 3.7588179111480713e-06, 5.446374416351318e-06, 7.1339309215545654e-06, 8.821487426757812e-06, 1.050904393196106e-05, 1.2196600437164307e-05, 1.3884156942367554e-05, 1.55717134475708e-05, 1.7259269952774048e-05, 1.8946826457977295e-05, 2.0634382963180542e-05, 2.232193946838379e-05, 2.4009495973587036e-05, 2.5697052478790283e-05, 2.738460898399353e-05, 2.9072165489196777e-05, 3.0759721994400024e-05, 3.244727849960327e-05, 3.413483500480652e-05, 3.5822391510009766e-05, 3.750994801521301e-05, 3.919750452041626e-05, 4.088506102561951e-05, 4.2572617530822754e-05, 4.4260174036026e-05, 4.594773054122925e-05, 4.7635287046432495e-05, 4.932284355163574e-05, 5.101040005683899e-05, 5.2697956562042236e-05, 5.4385513067245483e-05, 5.607306957244873e-05, 5.776062607765198e-05, 5.9448182582855225e-05, 6.113573908805847e-05, 6.282329559326172e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 8.0, 13.0, 14.0, 21.0, 31.0, 49.0, 81.0, 113.0, 229.0, 400.0, 771.0, 1914.0, 4116.0, 10364.0, 27621.0, 90741.0, 367763.0, 395977.0, 99386.0, 29568.0, 11015.0, 4477.0, 1939.0, 914.0, 434.0, 229.0, 128.0, 64.0, 47.0, 36.0, 21.0, 10.0, 17.0, 11.0, 7.0, 9.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.165771484375, -0.16117095947265625, -0.1565704345703125, -0.15196990966796875, -0.147369384765625, -0.14276885986328125, -0.1381683349609375, -0.13356781005859375, -0.12896728515625, -0.12436676025390625, -0.1197662353515625, -0.11516571044921875, -0.110565185546875, -0.10596466064453125, -0.1013641357421875, -0.09676361083984375, -0.0921630859375, -0.08756256103515625, -0.0829620361328125, -0.07836151123046875, -0.073760986328125, -0.06916046142578125, -0.0645599365234375, -0.05995941162109375, -0.05535888671875, -0.05075836181640625, -0.0461578369140625, -0.04155731201171875, -0.036956787109375, -0.03235626220703125, -0.0277557373046875, -0.02315521240234375, -0.0185546875, -0.01395416259765625, -0.0093536376953125, -0.00475311279296875, -0.000152587890625, 0.00444793701171875, 0.0090484619140625, 0.01364898681640625, 0.01824951171875, 0.02285003662109375, 0.0274505615234375, 0.03205108642578125, 0.036651611328125, 0.04125213623046875, 0.0458526611328125, 0.05045318603515625, 0.0550537109375, 0.05965423583984375, 0.0642547607421875, 0.06885528564453125, 0.073455810546875, 0.07805633544921875, 0.0826568603515625, 0.08725738525390625, 0.09185791015625, 0.09645843505859375, 0.1010589599609375, 0.10565948486328125, 0.110260009765625, 0.11486053466796875, 0.1194610595703125, 0.12406158447265625, 0.128662109375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 2.0, 5.0, 7.0, 6.0, 15.0, 15.0, 10.0, 23.0, 31.0, 38.0, 49.0, 59.0, 76.0, 109.0, 89.0, 104.0, 84.0, 58.0, 46.0, 33.0, 27.0, 29.0, 18.0, 9.0, 12.0, 9.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1148681640625, -0.11110687255859375, -0.1073455810546875, -0.10358428955078125, -0.099822998046875, -0.09606170654296875, -0.0923004150390625, -0.08853912353515625, -0.08477783203125, -0.08101654052734375, -0.0772552490234375, -0.07349395751953125, -0.069732666015625, -0.06597137451171875, -0.0622100830078125, -0.05844879150390625, -0.0546875, -0.05092620849609375, -0.0471649169921875, -0.04340362548828125, -0.039642333984375, -0.03588104248046875, -0.0321197509765625, -0.02835845947265625, -0.02459716796875, -0.02083587646484375, -0.0170745849609375, -0.01331329345703125, -0.009552001953125, -0.00579071044921875, -0.0020294189453125, 0.00173187255859375, 0.0054931640625, 0.00925445556640625, 0.0130157470703125, 0.01677703857421875, 0.020538330078125, 0.02429962158203125, 0.0280609130859375, 0.03182220458984375, 0.03558349609375, 0.03934478759765625, 0.0431060791015625, 0.04686737060546875, 0.050628662109375, 0.05438995361328125, 0.0581512451171875, 0.06191253662109375, 0.065673828125, 0.06943511962890625, 0.0731964111328125, 0.07695770263671875, 0.080718994140625, 0.08448028564453125, 0.0882415771484375, 0.09200286865234375, 0.09576416015625, 0.09952545166015625, 0.1032867431640625, 0.10704803466796875, 0.110809326171875, 0.11457061767578125, 0.1183319091796875, 0.12209320068359375, 0.1258544921875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 16.0, 39.0, 53.0, 104.0, 125.0, 139.0, 158.0, 135.0, 87.0, 53.0, 39.0, 24.0, 11.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.616220474243164, -1.545584797859192, -1.4749491214752197, -1.404313325881958, -1.3336776494979858, -1.2630419731140137, -1.192406177520752, -1.1217705011367798, -1.0511348247528076, -0.9804991483688354, -0.9098634123802185, -0.8392276763916016, -0.7685920000076294, -0.6979563236236572, -0.6273205876350403, -0.5566848516464233, -0.48604917526245117, -0.4154134690761566, -0.34477776288986206, -0.2741420567035675, -0.20350635051727295, -0.1328706443309784, -0.06223493814468384, 0.008400768041610718, 0.07903647422790527, 0.14967218041419983, 0.22030788660049438, 0.29094359278678894, 0.3615792989730835, 0.43221500515937805, 0.5028507113456726, 0.5734864473342896, 0.6441221237182617, 0.7147578001022339, 0.7853935360908508, 0.8560292720794678, 0.9266649484634399, 0.9973006248474121, 1.0679364204406738, 1.138572096824646, 1.2092077732086182, 1.2798434495925903, 1.3504791259765625, 1.4211149215698242, 1.4917505979537964, 1.5623862743377686, 1.6330220699310303, 1.7036577463150024, 1.7742934226989746, 1.8449290990829468, 1.915564775466919, 1.9862005710601807, 2.0568361282348633, 2.127471923828125, 2.1981077194213867, 2.2687432765960693, 2.339379072189331, 2.4100148677825928, 2.4806504249572754, 2.551286220550537, 2.621922016143799, 2.6925575733184814, 2.763193368911743, 2.833828926086426, 2.9044647216796875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 8.0, 6.0, 10.0, 6.0, 9.0, 12.0, 7.0, 13.0, 14.0, 23.0, 13.0, 18.0, 22.0, 19.0, 35.0, 19.0, 32.0, 32.0, 39.0, 30.0, 30.0, 44.0, 39.0, 32.0, 37.0, 40.0, 29.0, 34.0, 31.0, 35.0, 32.0, 31.0, 25.0, 25.0, 21.0, 24.0, 16.0, 20.0, 11.0, 7.0, 17.0, 8.0, 9.0, 5.0, 12.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.7879053950309753, -0.7606739401817322, -0.7334424257278442, -0.7062109708786011, -0.6789795160293579, -0.6517480611801147, -0.6245166063308716, -0.5972850918769836, -0.5700536370277405, -0.5428221821784973, -0.5155906677246094, -0.4883592128753662, -0.46112775802612305, -0.4338963031768799, -0.40666481852531433, -0.3794333338737488, -0.3522018790245056, -0.32497042417526245, -0.2977389395236969, -0.27050745487213135, -0.24327600002288818, -0.21604453027248383, -0.18881306052207947, -0.1615815907716751, -0.13435012102127075, -0.1071186512708664, -0.07988718152046204, -0.05265571177005768, -0.02542424201965332, 0.0018072277307510376, 0.029038697481155396, 0.05627016723155975, 0.08350157737731934, 0.1107330471277237, 0.13796451687812805, 0.1651959866285324, 0.19242745637893677, 0.21965892612934113, 0.24689039587974548, 0.27412188053131104, 0.3013533353805542, 0.32858479022979736, 0.3558162748813629, 0.38304775953292847, 0.41027921438217163, 0.4375106692314148, 0.46474215388298035, 0.4919736385345459, 0.5192050933837891, 0.5464365482330322, 0.5736680030822754, 0.6008995175361633, 0.6281309723854065, 0.6553624272346497, 0.6825939416885376, 0.7098253965377808, 0.7370568513870239, 0.7642883062362671, 0.7915197610855103, 0.8187512755393982, 0.8459827303886414, 0.8732141852378845, 0.9004456996917725, 0.9276771545410156, 0.9549086093902588]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 9.0, 11.0, 19.0, 23.0, 44.0, 72.0, 123.0, 199.0, 332.0, 619.0, 1021.0, 2119.0, 4141.0, 8772.0, 20423.0, 51008.0, 146379.0, 533199.0, 1943044.0, 1086319.0, 259442.0, 81545.0, 30572.0, 13008.0, 5880.0, 2827.0, 1374.0, 733.0, 407.0, 229.0, 149.0, 95.0, 55.0, 43.0, 18.0, 14.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.179931640625, -0.17366981506347656, -0.16740798950195312, -0.1611461639404297, -0.15488433837890625, -0.1486225128173828, -0.14236068725585938, -0.13609886169433594, -0.1298370361328125, -0.12357521057128906, -0.11731338500976562, -0.11105155944824219, -0.10478973388671875, -0.09852790832519531, -0.09226608276367188, -0.08600425720214844, -0.079742431640625, -0.07348060607910156, -0.06721878051757812, -0.06095695495605469, -0.05469512939453125, -0.04843330383300781, -0.042171478271484375, -0.03590965270996094, -0.0296478271484375, -0.023386001586914062, -0.017124176025390625, -0.010862350463867188, -0.00460052490234375, 0.0016613006591796875, 0.007923126220703125, 0.014184951782226562, 0.02044677734375, 0.026708602905273438, 0.032970428466796875, 0.03923225402832031, 0.04549407958984375, 0.05175590515136719, 0.058017730712890625, 0.06427955627441406, 0.0705413818359375, 0.07680320739746094, 0.08306503295898438, 0.08932685852050781, 0.09558868408203125, 0.10185050964355469, 0.10811233520507812, 0.11437416076660156, 0.120635986328125, 0.12689781188964844, 0.13315963745117188, 0.1394214630126953, 0.14568328857421875, 0.1519451141357422, 0.15820693969726562, 0.16446876525878906, 0.1707305908203125, 0.17699241638183594, 0.18325424194335938, 0.1895160675048828, 0.19577789306640625, 0.2020397186279297, 0.20830154418945312, 0.21456336975097656, 0.2208251953125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 5.0, 7.0, 11.0, 9.0, 14.0, 19.0, 22.0, 26.0, 26.0, 24.0, 29.0, 26.0, 32.0, 28.0, 34.0, 44.0, 46.0, 34.0, 39.0, 47.0, 36.0, 40.0, 34.0, 32.0, 36.0, 30.0, 38.0, 28.0, 21.0, 22.0, 20.0, 19.0, 17.0, 11.0, 12.0, 10.0, 9.0, 6.0, 8.0, 4.0, 6.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.11962890625, -0.1160116195678711, -0.11239433288574219, -0.10877704620361328, -0.10515975952148438, -0.10154247283935547, -0.09792518615722656, -0.09430789947509766, -0.09069061279296875, -0.08707332611083984, -0.08345603942871094, -0.07983875274658203, -0.07622146606445312, -0.07260417938232422, -0.06898689270019531, -0.0653696060180664, -0.0617523193359375, -0.058135032653808594, -0.05451774597167969, -0.05090045928955078, -0.047283172607421875, -0.04366588592529297, -0.04004859924316406, -0.036431312561035156, -0.03281402587890625, -0.029196739196777344, -0.025579452514648438, -0.02196216583251953, -0.018344879150390625, -0.014727592468261719, -0.011110305786132812, -0.007493019104003906, -0.003875732421875, -0.00025844573974609375, 0.0033588409423828125, 0.006976127624511719, 0.010593414306640625, 0.014210700988769531, 0.017827987670898438, 0.021445274353027344, 0.02506256103515625, 0.028679847717285156, 0.03229713439941406, 0.03591442108154297, 0.039531707763671875, 0.04314899444580078, 0.04676628112792969, 0.050383567810058594, 0.0540008544921875, 0.057618141174316406, 0.06123542785644531, 0.06485271453857422, 0.06847000122070312, 0.07208728790283203, 0.07570457458496094, 0.07932186126708984, 0.08293914794921875, 0.08655643463134766, 0.09017372131347656, 0.09379100799560547, 0.09740829467773438, 0.10102558135986328, 0.10464286804199219, 0.1082601547241211, 0.11187744140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 8.0, 9.0, 13.0, 21.0, 19.0, 33.0, 54.0, 97.0, 142.0, 224.0, 477.0, 1100.0, 3086.0, 9672.0, 40883.0, 239506.0, 2486836.0, 1238590.0, 137007.0, 25841.0, 6670.0, 2239.0, 872.0, 414.0, 181.0, 86.0, 53.0, 31.0, 28.0, 22.0, 18.0, 12.0, 8.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.427734375, -0.4134063720703125, -0.399078369140625, -0.3847503662109375, -0.37042236328125, -0.3560943603515625, -0.341766357421875, -0.3274383544921875, -0.3131103515625, -0.2987823486328125, -0.284454345703125, -0.2701263427734375, -0.25579833984375, -0.2414703369140625, -0.227142333984375, -0.2128143310546875, -0.198486328125, -0.1841583251953125, -0.169830322265625, -0.1555023193359375, -0.14117431640625, -0.1268463134765625, -0.112518310546875, -0.0981903076171875, -0.0838623046875, -0.0695343017578125, -0.055206298828125, -0.0408782958984375, -0.02655029296875, -0.0122222900390625, 0.002105712890625, 0.0164337158203125, 0.03076171875, 0.0450897216796875, 0.059417724609375, 0.0737457275390625, 0.08807373046875, 0.1024017333984375, 0.116729736328125, 0.1310577392578125, 0.1453857421875, 0.1597137451171875, 0.174041748046875, 0.1883697509765625, 0.20269775390625, 0.2170257568359375, 0.231353759765625, 0.2456817626953125, 0.260009765625, 0.2743377685546875, 0.288665771484375, 0.3029937744140625, 0.31732177734375, 0.3316497802734375, 0.345977783203125, 0.3603057861328125, 0.3746337890625, 0.3889617919921875, 0.403289794921875, 0.4176177978515625, 0.43194580078125, 0.4462738037109375, 0.460601806640625, 0.4749298095703125, 0.4892578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 13.0, 14.0, 13.0, 21.0, 29.0, 44.0, 95.0, 143.0, 216.0, 303.0, 633.0, 940.0, 698.0, 346.0, 185.0, 122.0, 97.0, 57.0, 44.0, 21.0, 8.0, 9.0, 10.0, 10.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.595703125, -0.5816993713378906, -0.5676956176757812, -0.5536918640136719, -0.5396881103515625, -0.5256843566894531, -0.5116806030273438, -0.4976768493652344, -0.483673095703125, -0.4696693420410156, -0.45566558837890625, -0.4416618347167969, -0.4276580810546875, -0.4136543273925781, -0.39965057373046875, -0.3856468200683594, -0.37164306640625, -0.3576393127441406, -0.34363555908203125, -0.3296318054199219, -0.3156280517578125, -0.3016242980957031, -0.28762054443359375, -0.2736167907714844, -0.259613037109375, -0.24560928344726562, -0.23160552978515625, -0.21760177612304688, -0.2035980224609375, -0.18959426879882812, -0.17559051513671875, -0.16158676147460938, -0.1475830078125, -0.13357925415039062, -0.11957550048828125, -0.10557174682617188, -0.0915679931640625, -0.07756423950195312, -0.06356048583984375, -0.049556732177734375, -0.035552978515625, -0.021549224853515625, -0.00754547119140625, 0.006458282470703125, 0.0204620361328125, 0.034465789794921875, 0.04846954345703125, 0.062473297119140625, 0.07647705078125, 0.09048080444335938, 0.10448455810546875, 0.11848831176757812, 0.1324920654296875, 0.14649581909179688, 0.16049957275390625, 0.17450332641601562, 0.188507080078125, 0.20251083374023438, 0.21651458740234375, 0.23051834106445312, 0.2445220947265625, 0.2585258483886719, 0.27252960205078125, 0.2865333557128906, 0.300537109375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 12.0, 32.0, 44.0, 48.0, 87.0, 129.0, 125.0, 153.0, 134.0, 94.0, 63.0, 36.0, 17.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5302045345306396, -2.459735631942749, -2.3892664909362793, -2.3187975883483887, -2.248328685760498, -2.1778595447540283, -2.1073906421661377, -2.036921739578247, -1.9664525985717773, -1.8959835767745972, -1.8255146741867065, -1.7550456523895264, -1.6845766305923462, -1.614107608795166, -1.5436387062072754, -1.4731696844100952, -1.4027007818222046, -1.3322317600250244, -1.2617628574371338, -1.1912938356399536, -1.1208248138427734, -1.0503559112548828, -0.9798868894577026, -0.9094178676605225, -0.8389489054679871, -0.7684799432754517, -0.6980109214782715, -0.6275419592857361, -0.5570729970932007, -0.4866039752960205, -0.4161350131034851, -0.3456660211086273, -0.27519702911376953, -0.20472803711891174, -0.13425906002521515, -0.06379008293151855, 0.006678909063339233, 0.07714790105819702, 0.14761686325073242, 0.2180858552455902, 0.288554847240448, 0.3590238392353058, 0.4294928312301636, 0.499961793422699, 0.5704307556152344, 0.6408997774124146, 0.71136873960495, 0.7818377017974854, 0.8523067235946655, 0.9227756857872009, 0.9932447075843811, 1.0637136697769165, 1.1341826915740967, 1.2046515941619873, 1.2751206159591675, 1.3455896377563477, 1.4160585403442383, 1.4865275621414185, 1.556996464729309, 1.6274654865264893, 1.6979345083236694, 1.7684035301208496, 1.8388724327087402, 1.9093414545059204, 1.9798104763031006]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 4.0, 6.0, 9.0, 11.0, 8.0, 16.0, 22.0, 15.0, 21.0, 18.0, 14.0, 28.0, 26.0, 22.0, 32.0, 27.0, 36.0, 44.0, 43.0, 39.0, 40.0, 37.0, 46.0, 37.0, 43.0, 41.0, 30.0, 37.0, 25.0, 27.0, 28.0, 21.0, 18.0, 17.0, 15.0, 15.0, 11.0, 14.0, 15.0, 1.0, 9.0, 3.0, 8.0, 5.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.9195284247398376, -0.8909602761268616, -0.8623921275138855, -0.8338240385055542, -0.8052558898925781, -0.776687741279602, -0.748119592666626, -0.7195514440536499, -0.6909832954406738, -0.6624151468276978, -0.6338469982147217, -0.6052788496017456, -0.5767107605934143, -0.5481426119804382, -0.5195744633674622, -0.4910063147544861, -0.4624382257461548, -0.4338700771331787, -0.405301958322525, -0.37673380970954895, -0.34816569089889526, -0.3195975422859192, -0.2910293936729431, -0.26246124505996704, -0.23389312624931335, -0.20532499253749847, -0.1767568588256836, -0.14818871021270752, -0.11962057650089264, -0.09105244278907776, -0.062484294176101685, -0.033916160464286804, -0.0053479671478271484, 0.02322017028927803, 0.05178830772638321, 0.08035644888877869, 0.10892458260059357, 0.13749271631240845, 0.16606086492538452, 0.1946289986371994, 0.22319713234901428, 0.25176528096199036, 0.28033339977264404, 0.3089015483856201, 0.3374696969985962, 0.3660378158092499, 0.39460596442222595, 0.42317408323287964, 0.4517422318458557, 0.4803103804588318, 0.5088785290718079, 0.5374466180801392, 0.5660147666931152, 0.5945829153060913, 0.6231510639190674, 0.6517192125320435, 0.6802873611450195, 0.7088555097579956, 0.7374236583709717, 0.7659918069839478, 0.794559895992279, 0.8231280446052551, 0.8516961932182312, 0.8802643418312073, 0.9088324308395386]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 7.0, 3.0, 8.0, 15.0, 12.0, 19.0, 35.0, 53.0, 78.0, 117.0, 185.0, 338.0, 584.0, 1055.0, 1844.0, 3171.0, 5722.0, 9951.0, 17516.0, 32010.0, 77926.0, 313031.0, 397359.0, 103721.0, 37453.0, 19871.0, 11340.0, 6431.0, 3643.0, 2135.0, 1232.0, 674.0, 393.0, 216.0, 146.0, 82.0, 45.0, 49.0, 18.0, 19.0, 10.0, 7.0, 8.0, 9.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.2958984375, -0.2863883972167969, -0.27687835693359375, -0.2673683166503906, -0.2578582763671875, -0.24834823608398438, -0.23883819580078125, -0.22932815551757812, -0.219818115234375, -0.21030807495117188, -0.20079803466796875, -0.19128799438476562, -0.1817779541015625, -0.17226791381835938, -0.16275787353515625, -0.15324783325195312, -0.14373779296875, -0.13422775268554688, -0.12471771240234375, -0.11520767211914062, -0.1056976318359375, -0.09618759155273438, -0.08667755126953125, -0.07716751098632812, -0.067657470703125, -0.058147430419921875, -0.04863739013671875, -0.039127349853515625, -0.0296173095703125, -0.020107269287109375, -0.01059722900390625, -0.001087188720703125, 0.0084228515625, 0.017932891845703125, 0.02744293212890625, 0.036952972412109375, 0.0464630126953125, 0.055973052978515625, 0.06548309326171875, 0.07499313354492188, 0.084503173828125, 0.09401321411132812, 0.10352325439453125, 0.11303329467773438, 0.1225433349609375, 0.13205337524414062, 0.14156341552734375, 0.15107345581054688, 0.16058349609375, 0.17009353637695312, 0.17960357666015625, 0.18911361694335938, 0.1986236572265625, 0.20813369750976562, 0.21764373779296875, 0.22715377807617188, 0.236663818359375, 0.24617385864257812, 0.25568389892578125, 0.2651939392089844, 0.2747039794921875, 0.2842140197753906, 0.29372406005859375, 0.3032341003417969, 0.312744140625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 4.0, 7.0, 8.0, 11.0, 13.0, 12.0, 16.0, 14.0, 29.0, 19.0, 33.0, 34.0, 44.0, 46.0, 39.0, 53.0, 46.0, 52.0, 54.0, 48.0, 47.0, 37.0, 55.0, 39.0, 41.0, 23.0, 28.0, 23.0, 24.0, 29.0, 17.0, 9.0, 8.0, 9.0, 6.0, 5.0, 5.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1380615234375, -0.1335010528564453, -0.12894058227539062, -0.12438011169433594, -0.11981964111328125, -0.11525917053222656, -0.11069869995117188, -0.10613822937011719, -0.1015777587890625, -0.09701728820800781, -0.09245681762695312, -0.08789634704589844, -0.08333587646484375, -0.07877540588378906, -0.07421493530273438, -0.06965446472167969, -0.065093994140625, -0.06053352355957031, -0.055973052978515625, -0.05141258239746094, -0.04685211181640625, -0.04229164123535156, -0.037731170654296875, -0.03317070007324219, -0.0286102294921875, -0.024049758911132812, -0.019489288330078125, -0.014928817749023438, -0.01036834716796875, -0.0058078765869140625, -0.001247406005859375, 0.0033130645751953125, 0.00787353515625, 0.012434005737304688, 0.016994476318359375, 0.021554946899414062, 0.02611541748046875, 0.030675888061523438, 0.035236358642578125, 0.03979682922363281, 0.0443572998046875, 0.04891777038574219, 0.053478240966796875, 0.05803871154785156, 0.06259918212890625, 0.06715965270996094, 0.07172012329101562, 0.07628059387207031, 0.080841064453125, 0.08540153503417969, 0.08996200561523438, 0.09452247619628906, 0.09908294677734375, 0.10364341735839844, 0.10820388793945312, 0.11276435852050781, 0.1173248291015625, 0.12188529968261719, 0.12644577026367188, 0.13100624084472656, 0.13556671142578125, 0.14012718200683594, 0.14468765258789062, 0.1492481231689453, 0.15380859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 8.0, 5.0, 9.0, 15.0, 32.0, 38.0, 61.0, 84.0, 117.0, 209.0, 383.0, 714.0, 1450.0, 3300.0, 7921.0, 19961.0, 67136.0, 581249.0, 298226.0, 41920.0, 14600.0, 6029.0, 2578.0, 1153.0, 550.0, 318.0, 148.0, 104.0, 60.0, 41.0, 34.0, 25.0, 10.0, 11.0, 18.0, 11.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4619140625, -0.4447021484375, -0.427490234375, -0.4102783203125, -0.39306640625, -0.3758544921875, -0.358642578125, -0.3414306640625, -0.32421875, -0.3070068359375, -0.289794921875, -0.2725830078125, -0.25537109375, -0.2381591796875, -0.220947265625, -0.2037353515625, -0.1865234375, -0.1693115234375, -0.152099609375, -0.1348876953125, -0.11767578125, -0.1004638671875, -0.083251953125, -0.0660400390625, -0.048828125, -0.0316162109375, -0.014404296875, 0.0028076171875, 0.02001953125, 0.0372314453125, 0.054443359375, 0.0716552734375, 0.0888671875, 0.1060791015625, 0.123291015625, 0.1405029296875, 0.15771484375, 0.1749267578125, 0.192138671875, 0.2093505859375, 0.2265625, 0.2437744140625, 0.260986328125, 0.2781982421875, 0.29541015625, 0.3126220703125, 0.329833984375, 0.3470458984375, 0.3642578125, 0.3814697265625, 0.398681640625, 0.4158935546875, 0.43310546875, 0.4503173828125, 0.467529296875, 0.4847412109375, 0.501953125, 0.5191650390625, 0.536376953125, 0.5535888671875, 0.57080078125, 0.5880126953125, 0.605224609375, 0.6224365234375, 0.6396484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 8.0, 3.0, 6.0, 15.0, 11.0, 16.0, 15.0, 26.0, 21.0, 28.0, 35.0, 37.0, 46.0, 52.0, 58.0, 62.0, 61.0, 49.0, 58.0, 48.0, 45.0, 44.0, 39.0, 45.0, 28.0, 37.0, 25.0, 21.0, 12.0, 10.0, 6.0, 10.0, 6.0, 4.0, 11.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.556640625, -0.539947509765625, -0.52325439453125, -0.506561279296875, -0.4898681640625, -0.473175048828125, -0.45648193359375, -0.439788818359375, -0.423095703125, -0.406402587890625, -0.38970947265625, -0.373016357421875, -0.3563232421875, -0.339630126953125, -0.32293701171875, -0.306243896484375, -0.28955078125, -0.272857666015625, -0.25616455078125, -0.239471435546875, -0.2227783203125, -0.206085205078125, -0.18939208984375, -0.172698974609375, -0.156005859375, -0.139312744140625, -0.12261962890625, -0.105926513671875, -0.0892333984375, -0.072540283203125, -0.05584716796875, -0.039154052734375, -0.0224609375, -0.005767822265625, 0.01092529296875, 0.027618408203125, 0.0443115234375, 0.061004638671875, 0.07769775390625, 0.094390869140625, 0.111083984375, 0.127777099609375, 0.14447021484375, 0.161163330078125, 0.1778564453125, 0.194549560546875, 0.21124267578125, 0.227935791015625, 0.24462890625, 0.261322021484375, 0.27801513671875, 0.294708251953125, 0.3114013671875, 0.328094482421875, 0.34478759765625, 0.361480712890625, 0.378173828125, 0.394866943359375, 0.41156005859375, 0.428253173828125, 0.4449462890625, 0.461639404296875, 0.47833251953125, 0.495025634765625, 0.51171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 13.0, 7.0, 13.0, 20.0, 27.0, 42.0, 65.0, 95.0, 136.0, 253.0, 353.0, 537.0, 812.0, 1264.0, 2082.0, 3584.0, 5706.0, 9358.0, 16596.0, 29515.0, 58130.0, 148712.0, 409029.0, 208166.0, 72191.0, 35058.0, 18821.0, 10947.0, 6548.0, 3848.0, 2458.0, 1530.0, 906.0, 591.0, 403.0, 247.0, 154.0, 113.0, 59.0, 53.0, 17.0, 24.0, 21.0, 15.0, 12.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.11041259765625, -0.10702896118164062, -0.10364532470703125, -0.10026168823242188, -0.0968780517578125, -0.09349441528320312, -0.09011077880859375, -0.08672714233398438, -0.083343505859375, -0.07995986938476562, -0.07657623291015625, -0.07319259643554688, -0.0698089599609375, -0.06642532348632812, -0.06304168701171875, -0.059658050537109375, -0.0562744140625, -0.052890777587890625, -0.04950714111328125, -0.046123504638671875, -0.0427398681640625, -0.039356231689453125, -0.03597259521484375, -0.032588958740234375, -0.029205322265625, -0.025821685791015625, -0.02243804931640625, -0.019054412841796875, -0.0156707763671875, -0.012287139892578125, -0.00890350341796875, -0.005519866943359375, -0.00213623046875, 0.001247406005859375, 0.00463104248046875, 0.008014678955078125, 0.0113983154296875, 0.014781951904296875, 0.01816558837890625, 0.021549224853515625, 0.024932861328125, 0.028316497802734375, 0.03170013427734375, 0.035083770751953125, 0.0384674072265625, 0.041851043701171875, 0.04523468017578125, 0.048618316650390625, 0.052001953125, 0.055385589599609375, 0.05876922607421875, 0.062152862548828125, 0.0655364990234375, 0.06892013549804688, 0.07230377197265625, 0.07568740844726562, 0.079071044921875, 0.08245468139648438, 0.08583831787109375, 0.08922195434570312, 0.0926055908203125, 0.09598922729492188, 0.09937286376953125, 0.10275650024414062, 0.10614013671875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 7.0, 12.0, 8.0, 8.0, 16.0, 11.0, 11.0, 31.0, 23.0, 69.0, 102.0, 142.0, 205.0, 143.0, 60.0, 38.0, 27.0, 11.0, 16.0, 7.0, 8.0, 10.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.3392181396484375e-05, -4.17931005358696e-05, -4.019401967525482e-05, -3.8594938814640045e-05, -3.699585795402527e-05, -3.539677709341049e-05, -3.3797696232795715e-05, -3.219861537218094e-05, -3.059953451156616e-05, -2.9000453650951385e-05, -2.740137279033661e-05, -2.5802291929721832e-05, -2.4203211069107056e-05, -2.260413020849228e-05, -2.1005049347877502e-05, -1.9405968487262726e-05, -1.780688762664795e-05, -1.6207806766033173e-05, -1.4608725905418396e-05, -1.300964504480362e-05, -1.1410564184188843e-05, -9.811483323574066e-06, -8.21240246295929e-06, -6.613321602344513e-06, -5.014240741729736e-06, -3.4151598811149597e-06, -1.816079020500183e-06, -2.169981598854065e-07, 1.3820827007293701e-06, 2.9811635613441467e-06, 4.580244421958923e-06, 6.1793252825737e-06, 7.778406143188477e-06, 9.377487003803253e-06, 1.097656786441803e-05, 1.2575648725032806e-05, 1.4174729585647583e-05, 1.577381044626236e-05, 1.7372891306877136e-05, 1.8971972167491913e-05, 2.057105302810669e-05, 2.2170133888721466e-05, 2.3769214749336243e-05, 2.536829560995102e-05, 2.6967376470565796e-05, 2.8566457331180573e-05, 3.016553819179535e-05, 3.1764619052410126e-05, 3.33636999130249e-05, 3.496278077363968e-05, 3.6561861634254456e-05, 3.816094249486923e-05, 3.976002335548401e-05, 4.1359104216098785e-05, 4.295818507671356e-05, 4.455726593732834e-05, 4.6156346797943115e-05, 4.775542765855789e-05, 4.935450851917267e-05, 5.0953589379787445e-05, 5.255267024040222e-05, 5.4151751101017e-05, 5.5750831961631775e-05, 5.734991282224655e-05, 5.894899368286133e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 7.0, 16.0, 19.0, 22.0, 43.0, 41.0, 84.0, 77.0, 150.0, 241.0, 360.0, 603.0, 1047.0, 1993.0, 4175.0, 8686.0, 18173.0, 38937.0, 92833.0, 271978.0, 368347.0, 139012.0, 53526.0, 24582.0, 11739.0, 5661.0, 2839.0, 1442.0, 702.0, 451.0, 237.0, 163.0, 121.0, 69.0, 47.0, 39.0, 16.0, 22.0, 15.0, 11.0, 7.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.11474609375, -0.11118221282958984, -0.10761833190917969, -0.10405445098876953, -0.10049057006835938, -0.09692668914794922, -0.09336280822753906, -0.0897989273071289, -0.08623504638671875, -0.0826711654663086, -0.07910728454589844, -0.07554340362548828, -0.07197952270507812, -0.06841564178466797, -0.06485176086425781, -0.061287879943847656, -0.0577239990234375, -0.054160118103027344, -0.05059623718261719, -0.04703235626220703, -0.043468475341796875, -0.03990459442138672, -0.03634071350097656, -0.032776832580566406, -0.02921295166015625, -0.025649070739746094, -0.022085189819335938, -0.01852130889892578, -0.014957427978515625, -0.011393547058105469, -0.007829666137695312, -0.004265785217285156, -0.000701904296875, 0.0028619766235351562, 0.0064258575439453125, 0.009989738464355469, 0.013553619384765625, 0.01711750030517578, 0.020681381225585938, 0.024245262145996094, 0.02780914306640625, 0.031373023986816406, 0.03493690490722656, 0.03850078582763672, 0.042064666748046875, 0.04562854766845703, 0.04919242858886719, 0.052756309509277344, 0.0563201904296875, 0.059884071350097656, 0.06344795227050781, 0.06701183319091797, 0.07057571411132812, 0.07413959503173828, 0.07770347595214844, 0.0812673568725586, 0.08483123779296875, 0.0883951187133789, 0.09195899963378906, 0.09552288055419922, 0.09908676147460938, 0.10265064239501953, 0.10621452331542969, 0.10977840423583984, 0.11334228515625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 10.0, 5.0, 3.0, 3.0, 6.0, 16.0, 10.0, 16.0, 28.0, 32.0, 34.0, 54.0, 65.0, 82.0, 82.0, 96.0, 110.0, 78.0, 61.0, 44.0, 34.0, 22.0, 22.0, 14.0, 9.0, 8.0, 8.0, 14.0, 4.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.168701171875, -0.1643085479736328, -0.15991592407226562, -0.15552330017089844, -0.15113067626953125, -0.14673805236816406, -0.14234542846679688, -0.1379528045654297, -0.1335601806640625, -0.1291675567626953, -0.12477493286132812, -0.12038230895996094, -0.11598968505859375, -0.11159706115722656, -0.10720443725585938, -0.10281181335449219, -0.098419189453125, -0.09402656555175781, -0.08963394165039062, -0.08524131774902344, -0.08084869384765625, -0.07645606994628906, -0.07206344604492188, -0.06767082214355469, -0.0632781982421875, -0.05888557434082031, -0.054492950439453125, -0.05010032653808594, -0.04570770263671875, -0.04131507873535156, -0.036922454833984375, -0.03252983093261719, -0.02813720703125, -0.023744583129882812, -0.019351959228515625, -0.014959335327148438, -0.01056671142578125, -0.0061740875244140625, -0.001781463623046875, 0.0026111602783203125, 0.0070037841796875, 0.011396408081054688, 0.015789031982421875, 0.020181655883789062, 0.02457427978515625, 0.028966903686523438, 0.033359527587890625, 0.03775215148925781, 0.042144775390625, 0.04653739929199219, 0.050930023193359375, 0.05532264709472656, 0.05971527099609375, 0.06410789489746094, 0.06850051879882812, 0.07289314270019531, 0.0772857666015625, 0.08167839050292969, 0.08607101440429688, 0.09046363830566406, 0.09485626220703125, 0.09924888610839844, 0.10364151000976562, 0.10803413391113281, 0.1124267578125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 13.0, 37.0, 64.0, 119.0, 149.0, 190.0, 173.0, 113.0, 57.0, 38.0, 16.0, 11.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.663025140762329, -2.5725982189178467, -2.4821712970733643, -2.391744375228882, -2.3013172149658203, -2.210890293121338, -2.1204633712768555, -2.030036449432373, -1.9396095275878906, -1.8491826057434082, -1.7587556838989258, -1.6683286428451538, -1.5779017210006714, -1.487474799156189, -1.397047758102417, -1.3066208362579346, -1.2161939144134521, -1.1257669925689697, -1.0353400707244873, -0.9449130296707153, -0.8544861078262329, -0.7640591859817505, -0.6736322045326233, -0.5832052230834961, -0.49277830123901367, -0.40235134959220886, -0.31192439794540405, -0.22149744629859924, -0.13107049465179443, -0.040643543004989624, 0.049783408641815186, 0.14021039009094238, 0.2306370735168457, 0.3210640251636505, 0.4114909768104553, 0.5019179582595825, 0.5923448801040649, 0.6827718019485474, 0.7731987833976746, 0.8636257648468018, 0.9540526866912842, 1.0444796085357666, 1.134906530380249, 1.225333571434021, 1.3157604932785034, 1.4061874151229858, 1.4966144561767578, 1.5870413780212402, 1.6774682998657227, 1.767895221710205, 1.8583221435546875, 1.9487491846084595, 2.0391759872436523, 2.129603147506714, 2.2200300693511963, 2.3104569911956787, 2.400883913040161, 2.4913108348846436, 2.581737756729126, 2.6721646785736084, 2.76259183883667, 2.8530187606811523, 2.9434456825256348, 3.033872604370117, 3.1242995262145996]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 6.0, 1.0, 8.0, 10.0, 11.0, 11.0, 13.0, 13.0, 16.0, 13.0, 19.0, 18.0, 32.0, 37.0, 38.0, 25.0, 37.0, 43.0, 43.0, 38.0, 47.0, 29.0, 38.0, 44.0, 42.0, 40.0, 38.0, 26.0, 33.0, 38.0, 25.0, 27.0, 28.0, 20.0, 15.0, 17.0, 13.0, 11.0, 10.0, 16.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.254845142364502, -1.2192962169647217, -1.1837472915649414, -1.1481983661651611, -1.1126494407653809, -1.0771005153656006, -1.0415515899658203, -1.0060027837753296, -0.9704538583755493, -0.934904932975769, -0.8993560075759888, -0.8638070821762085, -0.828258216381073, -0.7927092909812927, -0.7571603655815125, -0.7216114401817322, -0.6860625147819519, -0.6505135893821716, -0.6149646639823914, -0.5794157981872559, -0.5438668727874756, -0.5083179473876953, -0.47276902198791504, -0.43722009658813477, -0.4016712009906769, -0.3661222755908966, -0.3305733799934387, -0.29502445459365845, -0.2594755291938782, -0.2239266335964203, -0.18837770819664001, -0.15282879769802094, -0.11727988719940186, -0.08173097670078278, -0.0461820587515831, -0.010633140802383423, 0.024915769696235657, 0.060464680194854736, 0.09601360559463501, 0.1315625160932541, 0.16711142659187317, 0.20266033709049225, 0.23820924758911133, 0.2737581729888916, 0.3093070983886719, 0.34485599398612976, 0.38040491938591003, 0.4159538149833679, 0.4515027403831482, 0.48705166578292847, 0.5226005911827087, 0.5581494569778442, 0.5936983823776245, 0.6292473077774048, 0.6647962331771851, 0.7003451585769653, 0.7358940839767456, 0.7714430093765259, 0.8069919347763062, 0.8425408601760864, 0.8780897259712219, 0.9136386513710022, 0.9491875767707825, 0.9847365021705627, 1.0202853679656982]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 11.0, 19.0, 33.0, 55.0, 74.0, 116.0, 224.0, 372.0, 782.0, 1335.0, 2810.0, 5942.0, 13682.0, 31872.0, 79055.0, 221849.0, 760038.0, 1766394.0, 889425.0, 262015.0, 92797.0, 36555.0, 15643.0, 6887.0, 3196.0, 1463.0, 748.0, 418.0, 188.0, 122.0, 63.0, 30.0, 23.0, 19.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2301025390625, -0.22397804260253906, -0.21785354614257812, -0.2117290496826172, -0.20560455322265625, -0.1994800567626953, -0.19335556030273438, -0.18723106384277344, -0.1811065673828125, -0.17498207092285156, -0.16885757446289062, -0.1627330780029297, -0.15660858154296875, -0.1504840850830078, -0.14435958862304688, -0.13823509216308594, -0.132110595703125, -0.12598609924316406, -0.11986160278320312, -0.11373710632324219, -0.10761260986328125, -0.10148811340332031, -0.09536361694335938, -0.08923912048339844, -0.0831146240234375, -0.07699012756347656, -0.07086563110351562, -0.06474113464355469, -0.05861663818359375, -0.05249214172363281, -0.046367645263671875, -0.04024314880371094, -0.03411865234375, -0.027994155883789062, -0.021869659423828125, -0.015745162963867188, -0.00962066650390625, -0.0034961700439453125, 0.002628326416015625, 0.008752822875976562, 0.0148773193359375, 0.021001815795898438, 0.027126312255859375, 0.03325080871582031, 0.03937530517578125, 0.04549980163574219, 0.051624298095703125, 0.05774879455566406, 0.063873291015625, 0.06999778747558594, 0.07612228393554688, 0.08224678039550781, 0.08837127685546875, 0.09449577331542969, 0.10062026977539062, 0.10674476623535156, 0.1128692626953125, 0.11899375915527344, 0.12511825561523438, 0.1312427520751953, 0.13736724853515625, 0.1434917449951172, 0.14961624145507812, 0.15574073791503906, 0.161865234375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 11.0, 6.0, 10.0, 9.0, 10.0, 16.0, 21.0, 19.0, 23.0, 35.0, 25.0, 34.0, 29.0, 35.0, 45.0, 42.0, 56.0, 56.0, 51.0, 40.0, 41.0, 46.0, 42.0, 40.0, 36.0, 37.0, 37.0, 17.0, 16.0, 14.0, 21.0, 18.0, 15.0, 10.0, 13.0, 9.0, 4.0, 4.0, 4.0, 2.0, 3.0], "bins": [-0.1878662109375, -0.18329715728759766, -0.1787281036376953, -0.17415904998779297, -0.16958999633789062, -0.16502094268798828, -0.16045188903808594, -0.1558828353881836, -0.15131378173828125, -0.1467447280883789, -0.14217567443847656, -0.13760662078857422, -0.13303756713867188, -0.12846851348876953, -0.12389945983886719, -0.11933040618896484, -0.1147613525390625, -0.11019229888916016, -0.10562324523925781, -0.10105419158935547, -0.09648513793945312, -0.09191608428955078, -0.08734703063964844, -0.0827779769897461, -0.07820892333984375, -0.0736398696899414, -0.06907081604003906, -0.06450176239013672, -0.059932708740234375, -0.05536365509033203, -0.05079460144042969, -0.046225547790527344, -0.041656494140625, -0.037087440490722656, -0.03251838684082031, -0.02794933319091797, -0.023380279541015625, -0.01881122589111328, -0.014242172241210938, -0.009673118591308594, -0.00510406494140625, -0.0005350112915039062, 0.0040340423583984375, 0.008603096008300781, 0.013172149658203125, 0.01774120330810547, 0.022310256958007812, 0.026879310607910156, 0.0314483642578125, 0.036017417907714844, 0.04058647155761719, 0.04515552520751953, 0.049724578857421875, 0.05429363250732422, 0.05886268615722656, 0.0634317398071289, 0.06800079345703125, 0.0725698471069336, 0.07713890075683594, 0.08170795440673828, 0.08627700805664062, 0.09084606170654297, 0.09541511535644531, 0.09998416900634766, 0.10455322265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 8.0, 1.0, 6.0, 15.0, 25.0, 33.0, 40.0, 65.0, 97.0, 160.0, 271.0, 493.0, 889.0, 1914.0, 4890.0, 15944.0, 68064.0, 384735.0, 2620131.0, 918965.0, 136174.0, 28182.0, 7682.0, 2805.0, 1178.0, 618.0, 350.0, 203.0, 99.0, 71.0, 59.0, 36.0, 30.0, 18.0, 12.0, 3.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.413818359375, -0.3988838195800781, -0.38394927978515625, -0.3690147399902344, -0.3540802001953125, -0.3391456604003906, -0.32421112060546875, -0.3092765808105469, -0.294342041015625, -0.2794075012207031, -0.26447296142578125, -0.24953842163085938, -0.2346038818359375, -0.21966934204101562, -0.20473480224609375, -0.18980026245117188, -0.17486572265625, -0.15993118286132812, -0.14499664306640625, -0.13006210327148438, -0.1151275634765625, -0.10019302368164062, -0.08525848388671875, -0.07032394409179688, -0.055389404296875, -0.040454864501953125, -0.02552032470703125, -0.010585784912109375, 0.0043487548828125, 0.019283294677734375, 0.03421783447265625, 0.049152374267578125, 0.0640869140625, 0.07902145385742188, 0.09395599365234375, 0.10889053344726562, 0.1238250732421875, 0.13875961303710938, 0.15369415283203125, 0.16862869262695312, 0.183563232421875, 0.19849777221679688, 0.21343231201171875, 0.22836685180664062, 0.2433013916015625, 0.2582359313964844, 0.27317047119140625, 0.2881050109863281, 0.30303955078125, 0.3179740905761719, 0.33290863037109375, 0.3478431701660156, 0.3627777099609375, 0.3777122497558594, 0.39264678955078125, 0.4075813293457031, 0.422515869140625, 0.4374504089355469, 0.45238494873046875, 0.4673194885253906, 0.4822540283203125, 0.4971885681152344, 0.5121231079101562, 0.5270576477050781, 0.5419921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 11.0, 15.0, 17.0, 23.0, 29.0, 50.0, 66.0, 104.0, 137.0, 223.0, 354.0, 616.0, 800.0, 600.0, 330.0, 225.0, 155.0, 114.0, 73.0, 54.0, 31.0, 14.0, 13.0, 13.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55126953125, -0.5361518859863281, -0.5210342407226562, -0.5059165954589844, -0.4907989501953125, -0.4756813049316406, -0.46056365966796875, -0.4454460144042969, -0.430328369140625, -0.4152107238769531, -0.40009307861328125, -0.3849754333496094, -0.3698577880859375, -0.3547401428222656, -0.33962249755859375, -0.3245048522949219, -0.30938720703125, -0.2942695617675781, -0.27915191650390625, -0.2640342712402344, -0.2489166259765625, -0.23379898071289062, -0.21868133544921875, -0.20356369018554688, -0.188446044921875, -0.17332839965820312, -0.15821075439453125, -0.14309310913085938, -0.1279754638671875, -0.11285781860351562, -0.09774017333984375, -0.08262252807617188, -0.0675048828125, -0.052387237548828125, -0.03726959228515625, -0.022151947021484375, -0.0070343017578125, 0.008083343505859375, 0.02320098876953125, 0.038318634033203125, 0.053436279296875, 0.06855392456054688, 0.08367156982421875, 0.09878921508789062, 0.1139068603515625, 0.12902450561523438, 0.14414215087890625, 0.15925979614257812, 0.17437744140625, 0.18949508666992188, 0.20461273193359375, 0.21973037719726562, 0.2348480224609375, 0.24996566772460938, 0.26508331298828125, 0.2802009582519531, 0.295318603515625, 0.3104362487792969, 0.32555389404296875, 0.3406715393066406, 0.3557891845703125, 0.3709068298339844, 0.38602447509765625, 0.4011421203613281, 0.416259765625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 12.0, 23.0, 56.0, 101.0, 149.0, 196.0, 180.0, 124.0, 73.0, 37.0, 25.0, 8.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9030795097351074, -2.798339605331421, -2.6935997009277344, -2.588859796524048, -2.4841198921203613, -2.3793797492980957, -2.2746400833129883, -2.1698999404907227, -2.065160036087036, -1.9604201316833496, -1.855680227279663, -1.7509403228759766, -1.6462002992630005, -1.541460394859314, -1.4367204904556274, -1.3319804668426514, -1.2272406816482544, -1.1225007772445679, -1.0177608728408813, -0.91302090883255, -0.8082809448242188, -0.7035410404205322, -0.5988011360168457, -0.4940611720085144, -0.3893212676048279, -0.28458133339881897, -0.17984141409397125, -0.07510149478912354, 0.029638439416885376, 0.1343783736228943, 0.2391182780265808, 0.3438582420349121, 0.44859814643859863, 0.5533380508422852, 0.6580780148506165, 0.762817919254303, 0.8675578832626343, 0.9722977876663208, 1.0770376920700073, 1.1817777156829834, 1.28651762008667, 1.3912575244903564, 1.495997428894043, 1.6007373332977295, 1.7054773569107056, 1.810217261314392, 1.9149571657180786, 2.0196971893310547, 2.124436855316162, 2.2291767597198486, 2.333916664123535, 2.4386565685272217, 2.543396472930908, 2.648136615753174, 2.7528762817382812, 2.857616424560547, 2.9623563289642334, 3.06709623336792, 3.1718361377716064, 3.276576042175293, 3.3813159465789795, 3.486055850982666, 3.5907959938049316, 3.695535898208618, 3.8002758026123047]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 6.0, 11.0, 11.0, 9.0, 13.0, 12.0, 19.0, 16.0, 18.0, 17.0, 22.0, 20.0, 30.0, 28.0, 34.0, 39.0, 36.0, 49.0, 47.0, 45.0, 39.0, 35.0, 30.0, 36.0, 32.0, 40.0, 38.0, 27.0, 28.0, 18.0, 27.0, 28.0, 21.0, 18.0, 14.0, 10.0, 15.0, 7.0, 8.0, 5.0, 7.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9802557826042175, -0.9464905261993408, -0.9127253293991089, -0.8789600729942322, -0.8451948761940002, -0.8114296197891235, -0.7776644229888916, -0.7438991665840149, -0.7101339101791382, -0.6763686537742615, -0.6426034569740295, -0.6088382005691528, -0.5750730037689209, -0.5413077473640442, -0.5075424909591675, -0.47377729415893555, -0.4400120973587036, -0.4062468707561493, -0.37248164415359497, -0.33871638774871826, -0.30495119094848633, -0.2711859345436096, -0.2374207079410553, -0.20365548133850098, -0.16989025473594666, -0.13612502813339233, -0.10235979408025742, -0.0685945600271225, -0.034829333424568176, -0.001064106822013855, 0.03270113468170166, 0.06646636128425598, 0.10023164749145508, 0.1339968740940094, 0.16776210069656372, 0.20152734220027924, 0.23529256880283356, 0.2690578103065491, 0.3028230369091034, 0.3365882635116577, 0.37035349011421204, 0.40411871671676636, 0.4378839433193207, 0.471649169921875, 0.5054144263267517, 0.5391796231269836, 0.5729448795318604, 0.6067100763320923, 0.640475332736969, 0.6742405891418457, 0.7080057859420776, 0.7417710423469543, 0.7755362391471863, 0.809301495552063, 0.8430666923522949, 0.8768319487571716, 0.9105972051620483, 0.944362461566925, 0.978127658367157, 1.0118929147720337, 1.0456581115722656, 1.0794233083724976, 1.113188624382019, 1.146953821182251, 1.180719017982483]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 8.0, 15.0, 23.0, 20.0, 40.0, 61.0, 79.0, 141.0, 212.0, 330.0, 571.0, 847.0, 1520.0, 2559.0, 4409.0, 7874.0, 14485.0, 26984.0, 56398.0, 141540.0, 342971.0, 261100.0, 96722.0, 41947.0, 21306.0, 11212.0, 6446.0, 3545.0, 2028.0, 1167.0, 708.0, 473.0, 294.0, 165.0, 111.0, 95.0, 54.0, 36.0, 22.0, 17.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.30322265625, -0.2936897277832031, -0.28415679931640625, -0.2746238708496094, -0.2650909423828125, -0.2555580139160156, -0.24602508544921875, -0.23649215698242188, -0.226959228515625, -0.21742630004882812, -0.20789337158203125, -0.19836044311523438, -0.1888275146484375, -0.17929458618164062, -0.16976165771484375, -0.16022872924804688, -0.15069580078125, -0.14116287231445312, -0.13162994384765625, -0.12209701538085938, -0.1125640869140625, -0.10303115844726562, -0.09349822998046875, -0.08396530151367188, -0.074432373046875, -0.06489944458007812, -0.05536651611328125, -0.045833587646484375, -0.0363006591796875, -0.026767730712890625, -0.01723480224609375, -0.007701873779296875, 0.0018310546875, 0.011363983154296875, 0.02089691162109375, 0.030429840087890625, 0.0399627685546875, 0.049495697021484375, 0.05902862548828125, 0.06856155395507812, 0.078094482421875, 0.08762741088867188, 0.09716033935546875, 0.10669326782226562, 0.1162261962890625, 0.12575912475585938, 0.13529205322265625, 0.14482498168945312, 0.15435791015625, 0.16389083862304688, 0.17342376708984375, 0.18295669555664062, 0.1924896240234375, 0.20202255249023438, 0.21155548095703125, 0.22108840942382812, 0.230621337890625, 0.24015426635742188, 0.24968719482421875, 0.2592201232910156, 0.2687530517578125, 0.2782859802246094, 0.28781890869140625, 0.2973518371582031, 0.306884765625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 6.0, 4.0, 9.0, 8.0, 7.0, 13.0, 12.0, 9.0, 19.0, 18.0, 25.0, 33.0, 28.0, 33.0, 43.0, 36.0, 33.0, 53.0, 49.0, 39.0, 44.0, 42.0, 49.0, 50.0, 48.0, 46.0, 31.0, 37.0, 23.0, 26.0, 23.0, 18.0, 13.0, 9.0, 10.0, 12.0, 8.0, 9.0, 4.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.1815185546875, -0.1764965057373047, -0.17147445678710938, -0.16645240783691406, -0.16143035888671875, -0.15640830993652344, -0.15138626098632812, -0.1463642120361328, -0.1413421630859375, -0.1363201141357422, -0.13129806518554688, -0.12627601623535156, -0.12125396728515625, -0.11623191833496094, -0.11120986938476562, -0.10618782043457031, -0.101165771484375, -0.09614372253417969, -0.09112167358398438, -0.08609962463378906, -0.08107757568359375, -0.07605552673339844, -0.07103347778320312, -0.06601142883300781, -0.0609893798828125, -0.05596733093261719, -0.050945281982421875, -0.04592323303222656, -0.04090118408203125, -0.03587913513183594, -0.030857086181640625, -0.025835037231445312, -0.02081298828125, -0.015790939331054688, -0.010768890380859375, -0.0057468414306640625, -0.00072479248046875, 0.0042972564697265625, 0.009319305419921875, 0.014341354370117188, 0.0193634033203125, 0.024385452270507812, 0.029407501220703125, 0.03442955017089844, 0.03945159912109375, 0.04447364807128906, 0.049495697021484375, 0.05451774597167969, 0.059539794921875, 0.06456184387207031, 0.06958389282226562, 0.07460594177246094, 0.07962799072265625, 0.08465003967285156, 0.08967208862304688, 0.09469413757324219, 0.0997161865234375, 0.10473823547363281, 0.10976028442382812, 0.11478233337402344, 0.11980438232421875, 0.12482643127441406, 0.12984848022460938, 0.1348705291748047, 0.139892578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 4.0, 10.0, 21.0, 26.0, 49.0, 55.0, 77.0, 145.0, 218.0, 430.0, 812.0, 1600.0, 3705.0, 9746.0, 30362.0, 152243.0, 672667.0, 132208.0, 28203.0, 9098.0, 3447.0, 1612.0, 783.0, 380.0, 244.0, 121.0, 93.0, 53.0, 31.0, 31.0, 23.0, 12.0, 9.0, 6.0, 4.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.66455078125, -0.641998291015625, -0.61944580078125, -0.596893310546875, -0.5743408203125, -0.551788330078125, -0.52923583984375, -0.506683349609375, -0.484130859375, -0.461578369140625, -0.43902587890625, -0.416473388671875, -0.3939208984375, -0.371368408203125, -0.34881591796875, -0.326263427734375, -0.3037109375, -0.281158447265625, -0.25860595703125, -0.236053466796875, -0.2135009765625, -0.190948486328125, -0.16839599609375, -0.145843505859375, -0.123291015625, -0.100738525390625, -0.07818603515625, -0.055633544921875, -0.0330810546875, -0.010528564453125, 0.01202392578125, 0.034576416015625, 0.05712890625, 0.079681396484375, 0.10223388671875, 0.124786376953125, 0.1473388671875, 0.169891357421875, 0.19244384765625, 0.214996337890625, 0.237548828125, 0.260101318359375, 0.28265380859375, 0.305206298828125, 0.3277587890625, 0.350311279296875, 0.37286376953125, 0.395416259765625, 0.41796875, 0.440521240234375, 0.46307373046875, 0.485626220703125, 0.5081787109375, 0.530731201171875, 0.55328369140625, 0.575836181640625, 0.598388671875, 0.620941162109375, 0.64349365234375, 0.666046142578125, 0.6885986328125, 0.711151123046875, 0.73370361328125, 0.756256103515625, 0.77880859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 5.0, 4.0, 7.0, 8.0, 4.0, 8.0, 11.0, 14.0, 15.0, 26.0, 17.0, 36.0, 35.0, 36.0, 37.0, 41.0, 48.0, 52.0, 53.0, 65.0, 52.0, 50.0, 54.0, 50.0, 36.0, 38.0, 36.0, 30.0, 32.0, 20.0, 16.0, 15.0, 12.0, 9.0, 7.0, 1.0, 5.0, 3.0, 4.0, 6.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.541015625, -0.5224609375, -0.50390625, -0.4853515625, -0.466796875, -0.4482421875, -0.4296875, -0.4111328125, -0.392578125, -0.3740234375, -0.35546875, -0.3369140625, -0.318359375, -0.2998046875, -0.28125, -0.2626953125, -0.244140625, -0.2255859375, -0.20703125, -0.1884765625, -0.169921875, -0.1513671875, -0.1328125, -0.1142578125, -0.095703125, -0.0771484375, -0.05859375, -0.0400390625, -0.021484375, -0.0029296875, 0.015625, 0.0341796875, 0.052734375, 0.0712890625, 0.08984375, 0.1083984375, 0.126953125, 0.1455078125, 0.1640625, 0.1826171875, 0.201171875, 0.2197265625, 0.23828125, 0.2568359375, 0.275390625, 0.2939453125, 0.3125, 0.3310546875, 0.349609375, 0.3681640625, 0.38671875, 0.4052734375, 0.423828125, 0.4423828125, 0.4609375, 0.4794921875, 0.498046875, 0.5166015625, 0.53515625, 0.5537109375, 0.572265625, 0.5908203125, 0.609375, 0.6279296875, 0.646484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 9.0, 4.0, 4.0, 7.0, 7.0, 12.0, 25.0, 34.0, 60.0, 87.0, 128.0, 237.0, 418.0, 672.0, 1250.0, 2208.0, 4020.0, 7489.0, 14341.0, 29056.0, 64393.0, 187013.0, 460129.0, 162554.0, 58755.0, 26699.0, 13317.0, 6958.0, 3797.0, 2062.0, 1165.0, 681.0, 359.0, 223.0, 151.0, 86.0, 53.0, 41.0, 15.0, 11.0, 5.0, 13.0, 10.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1434326171875, -0.13820648193359375, -0.1329803466796875, -0.12775421142578125, -0.122528076171875, -0.11730194091796875, -0.1120758056640625, -0.10684967041015625, -0.10162353515625, -0.09639739990234375, -0.0911712646484375, -0.08594512939453125, -0.080718994140625, -0.07549285888671875, -0.0702667236328125, -0.06504058837890625, -0.059814453125, -0.05458831787109375, -0.0493621826171875, -0.04413604736328125, -0.038909912109375, -0.03368377685546875, -0.0284576416015625, -0.02323150634765625, -0.01800537109375, -0.01277923583984375, -0.0075531005859375, -0.00232696533203125, 0.002899169921875, 0.00812530517578125, 0.0133514404296875, 0.01857757568359375, 0.0238037109375, 0.02902984619140625, 0.0342559814453125, 0.03948211669921875, 0.044708251953125, 0.04993438720703125, 0.0551605224609375, 0.06038665771484375, 0.06561279296875, 0.07083892822265625, 0.0760650634765625, 0.08129119873046875, 0.086517333984375, 0.09174346923828125, 0.0969696044921875, 0.10219573974609375, 0.107421875, 0.11264801025390625, 0.1178741455078125, 0.12310028076171875, 0.128326416015625, 0.13355255126953125, 0.1387786865234375, 0.14400482177734375, 0.14923095703125, 0.15445709228515625, 0.1596832275390625, 0.16490936279296875, 0.170135498046875, 0.17536163330078125, 0.1805877685546875, 0.18581390380859375, 0.1910400390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 7.0, 5.0, 2.0, 10.0, 8.0, 20.0, 28.0, 24.0, 41.0, 42.0, 71.0, 111.0, 170.0, 141.0, 93.0, 52.0, 36.0, 35.0, 9.0, 17.0, 18.0, 12.0, 7.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9948692321777344e-05, -4.8073939979076385e-05, -4.619918763637543e-05, -4.432443529367447e-05, -4.244968295097351e-05, -4.057493060827255e-05, -3.8700178265571594e-05, -3.6825425922870636e-05, -3.495067358016968e-05, -3.307592123746872e-05, -3.120116889476776e-05, -2.9326416552066803e-05, -2.7451664209365845e-05, -2.5576911866664886e-05, -2.3702159523963928e-05, -2.182740718126297e-05, -1.9952654838562012e-05, -1.8077902495861053e-05, -1.6203150153160095e-05, -1.4328397810459137e-05, -1.2453645467758179e-05, -1.057889312505722e-05, -8.704140782356262e-06, -6.829388439655304e-06, -4.954636096954346e-06, -3.0798837542533875e-06, -1.2051314115524292e-06, 6.69620931148529e-07, 2.5443732738494873e-06, 4.4191256165504456e-06, 6.293877959251404e-06, 8.168630301952362e-06, 1.004338264465332e-05, 1.1918134987354279e-05, 1.3792887330055237e-05, 1.5667639672756195e-05, 1.7542392015457153e-05, 1.941714435815811e-05, 2.129189670085907e-05, 2.3166649043560028e-05, 2.5041401386260986e-05, 2.6916153728961945e-05, 2.8790906071662903e-05, 3.066565841436386e-05, 3.254041075706482e-05, 3.441516309976578e-05, 3.6289915442466736e-05, 3.8164667785167694e-05, 4.003942012786865e-05, 4.191417247056961e-05, 4.378892481327057e-05, 4.566367715597153e-05, 4.7538429498672485e-05, 4.9413181841373444e-05, 5.12879341840744e-05, 5.316268652677536e-05, 5.503743886947632e-05, 5.6912191212177277e-05, 5.8786943554878235e-05, 6.066169589757919e-05, 6.253644824028015e-05, 6.441120058298111e-05, 6.628595292568207e-05, 6.816070526838303e-05, 7.003545761108398e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 6.0, 7.0, 22.0, 28.0, 38.0, 38.0, 99.0, 135.0, 209.0, 360.0, 667.0, 1432.0, 3021.0, 7535.0, 21071.0, 65769.0, 289174.0, 491760.0, 114363.0, 33160.0, 11427.0, 4320.0, 1865.0, 854.0, 473.0, 281.0, 165.0, 81.0, 49.0, 44.0, 34.0, 21.0, 13.0, 6.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2269287109375, -0.2200946807861328, -0.21326065063476562, -0.20642662048339844, -0.19959259033203125, -0.19275856018066406, -0.18592453002929688, -0.1790904998779297, -0.1722564697265625, -0.1654224395751953, -0.15858840942382812, -0.15175437927246094, -0.14492034912109375, -0.13808631896972656, -0.13125228881835938, -0.12441825866699219, -0.117584228515625, -0.11075019836425781, -0.10391616821289062, -0.09708213806152344, -0.09024810791015625, -0.08341407775878906, -0.07658004760742188, -0.06974601745605469, -0.0629119873046875, -0.05607795715332031, -0.049243927001953125, -0.04240989685058594, -0.03557586669921875, -0.028741836547851562, -0.021907806396484375, -0.015073776245117188, -0.00823974609375, -0.0014057159423828125, 0.005428314208984375, 0.012262344360351562, 0.01909637451171875, 0.025930404663085938, 0.032764434814453125, 0.03959846496582031, 0.0464324951171875, 0.05326652526855469, 0.060100555419921875, 0.06693458557128906, 0.07376861572265625, 0.08060264587402344, 0.08743667602539062, 0.09427070617675781, 0.101104736328125, 0.10793876647949219, 0.11477279663085938, 0.12160682678222656, 0.12844085693359375, 0.13527488708496094, 0.14210891723632812, 0.1489429473876953, 0.1557769775390625, 0.1626110076904297, 0.16944503784179688, 0.17627906799316406, 0.18311309814453125, 0.18994712829589844, 0.19678115844726562, 0.2036151885986328, 0.21044921875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 4.0, 3.0, 9.0, 7.0, 14.0, 7.0, 11.0, 17.0, 17.0, 26.0, 36.0, 46.0, 54.0, 69.0, 80.0, 87.0, 84.0, 87.0, 69.0, 55.0, 41.0, 31.0, 28.0, 22.0, 21.0, 16.0, 8.0, 9.0, 12.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1385498046875, -0.13326644897460938, -0.12798309326171875, -0.12269973754882812, -0.1174163818359375, -0.11213302612304688, -0.10684967041015625, -0.10156631469726562, -0.096282958984375, -0.09099960327148438, -0.08571624755859375, -0.08043289184570312, -0.0751495361328125, -0.06986618041992188, -0.06458282470703125, -0.059299468994140625, -0.05401611328125, -0.048732757568359375, -0.04344940185546875, -0.038166046142578125, -0.0328826904296875, -0.027599334716796875, -0.02231597900390625, -0.017032623291015625, -0.011749267578125, -0.006465911865234375, -0.00118255615234375, 0.004100799560546875, 0.0093841552734375, 0.014667510986328125, 0.01995086669921875, 0.025234222412109375, 0.030517578125, 0.035800933837890625, 0.04108428955078125, 0.046367645263671875, 0.0516510009765625, 0.056934356689453125, 0.06221771240234375, 0.06750106811523438, 0.072784423828125, 0.07806777954101562, 0.08335113525390625, 0.08863449096679688, 0.0939178466796875, 0.09920120239257812, 0.10448455810546875, 0.10976791381835938, 0.11505126953125, 0.12033462524414062, 0.12561798095703125, 0.13090133666992188, 0.1361846923828125, 0.14146804809570312, 0.14675140380859375, 0.15203475952148438, 0.157318115234375, 0.16260147094726562, 0.16788482666015625, 0.17316818237304688, 0.1784515380859375, 0.18373489379882812, 0.18901824951171875, 0.19430160522460938, 0.1995849609375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 10.0, 26.0, 51.0, 100.0, 167.0, 189.0, 174.0, 130.0, 72.0, 33.0, 19.0, 11.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6679210662841797, -2.5510668754577637, -2.4342126846313477, -2.3173584938049316, -2.2005043029785156, -2.0836501121520996, -1.966795802116394, -1.849941611289978, -1.733087420463562, -1.616233229637146, -1.49937903881073, -1.3825247287750244, -1.2656705379486084, -1.1488163471221924, -1.0319621562957764, -0.9151079654693604, -0.7982537746429443, -0.6813995838165283, -0.5645453929901123, -0.4476911425590515, -0.3308369517326355, -0.21398276090621948, -0.09712851047515869, 0.019725680351257324, 0.13657987117767334, 0.25343406200408936, 0.37028828263282776, 0.48714250326156616, 0.6039966940879822, 0.7208508849143982, 0.837705135345459, 0.954559326171875, 1.071413516998291, 1.188267707824707, 1.305121898651123, 1.421976089477539, 1.538830280303955, 1.655684471130371, 1.7725387811660767, 1.8893929719924927, 2.006247043609619, 2.123101234436035, 2.239955425262451, 2.356809616088867, 2.473663806915283, 2.590517997741699, 2.7073721885681152, 2.8242263793945312, 2.9410808086395264, 3.0579349994659424, 3.1747891902923584, 3.2916433811187744, 3.4084975719451904, 3.5253517627716064, 3.6422061920166016, 3.7590603828430176, 3.8759145736694336, 3.9927687644958496, 4.109622955322266, 4.226477146148682, 4.343331336975098, 4.460185527801514, 4.57703971862793, 4.693893909454346, 4.810748100280762]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 7.0, 8.0, 10.0, 12.0, 10.0, 23.0, 17.0, 25.0, 16.0, 29.0, 31.0, 40.0, 38.0, 42.0, 34.0, 49.0, 42.0, 46.0, 46.0, 59.0, 45.0, 47.0, 40.0, 43.0, 26.0, 38.0, 29.0, 30.0, 18.0, 13.0, 15.0, 24.0, 11.0, 7.0, 4.0, 6.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1940765380859375, -1.1514370441436768, -1.108797550201416, -1.0661580562591553, -1.023518443107605, -0.9808789491653442, -0.9382394552230835, -0.8955999612808228, -0.8529604077339172, -0.8103209137916565, -0.767681360244751, -0.7250418663024902, -0.6824023723602295, -0.639762818813324, -0.5971233248710632, -0.5544837713241577, -0.511844277381897, -0.46920475363731384, -0.4265652298927307, -0.38392573595046997, -0.34128621220588684, -0.2986466884613037, -0.25600719451904297, -0.21336767077445984, -0.1707281470298767, -0.12808862328529358, -0.08544911444187164, -0.04280960559844971, -0.00017008185386657715, 0.04246944189071655, 0.0851089358329773, 0.12774845957756042, 0.17038798332214355, 0.21302750706672668, 0.2556670308113098, 0.29830652475357056, 0.3409460484981537, 0.3835855722427368, 0.42622506618499756, 0.4688645899295807, 0.5115041136741638, 0.5541436076164246, 0.5967831611633301, 0.6394226551055908, 0.6820621490478516, 0.7247017025947571, 0.7673411965370178, 0.8099807500839233, 0.8526202440261841, 0.8952597379684448, 0.9378992915153503, 0.9805387854576111, 1.0231783390045166, 1.0658178329467773, 1.108457326889038, 1.1510968208312988, 1.1937363147735596, 1.2363758087158203, 1.279015302658081, 1.3216547966003418, 1.364294409751892, 1.4069339036941528, 1.4495733976364136, 1.4922128915786743, 1.5348525047302246]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 5.0, 7.0, 16.0, 16.0, 13.0, 36.0, 43.0, 70.0, 114.0, 172.0, 325.0, 547.0, 1067.0, 2169.0, 4920.0, 12402.0, 35932.0, 126108.0, 574099.0, 2177728.0, 982409.0, 196702.0, 51431.0, 16377.0, 6122.0, 2601.0, 1265.0, 693.0, 324.0, 193.0, 127.0, 73.0, 56.0, 31.0, 25.0, 14.0, 8.0, 6.0, 10.0, 3.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27294921875, -0.2637443542480469, -0.25453948974609375, -0.24533462524414062, -0.2361297607421875, -0.22692489624023438, -0.21772003173828125, -0.20851516723632812, -0.199310302734375, -0.19010543823242188, -0.18090057373046875, -0.17169570922851562, -0.1624908447265625, -0.15328598022460938, -0.14408111572265625, -0.13487625122070312, -0.12567138671875, -0.11646652221679688, -0.10726165771484375, -0.09805679321289062, -0.0888519287109375, -0.07964706420898438, -0.07044219970703125, -0.061237335205078125, -0.052032470703125, -0.042827606201171875, -0.03362274169921875, -0.024417877197265625, -0.0152130126953125, -0.006008148193359375, 0.00319671630859375, 0.012401580810546875, 0.0216064453125, 0.030811309814453125, 0.04001617431640625, 0.049221038818359375, 0.0584259033203125, 0.06763076782226562, 0.07683563232421875, 0.08604049682617188, 0.095245361328125, 0.10445022583007812, 0.11365509033203125, 0.12285995483398438, 0.1320648193359375, 0.14126968383789062, 0.15047454833984375, 0.15967941284179688, 0.16888427734375, 0.17808914184570312, 0.18729400634765625, 0.19649887084960938, 0.2057037353515625, 0.21490859985351562, 0.22411346435546875, 0.23331832885742188, 0.242523193359375, 0.2517280578613281, 0.26093292236328125, 0.2701377868652344, 0.2793426513671875, 0.2885475158691406, 0.29775238037109375, 0.3069572448730469, 0.316162109375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 6.0, 7.0, 14.0, 10.0, 9.0, 8.0, 18.0, 22.0, 19.0, 21.0, 36.0, 26.0, 35.0, 36.0, 40.0, 45.0, 54.0, 42.0, 49.0, 39.0, 35.0, 45.0, 40.0, 33.0, 33.0, 43.0, 20.0, 30.0, 25.0, 16.0, 16.0, 27.0, 17.0, 17.0, 5.0, 13.0, 8.0, 7.0, 4.0, 5.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1500244140625, -0.1452198028564453, -0.14041519165039062, -0.13561058044433594, -0.13080596923828125, -0.12600135803222656, -0.12119674682617188, -0.11639213562011719, -0.1115875244140625, -0.10678291320800781, -0.10197830200195312, -0.09717369079589844, -0.09236907958984375, -0.08756446838378906, -0.08275985717773438, -0.07795524597167969, -0.073150634765625, -0.06834602355957031, -0.06354141235351562, -0.05873680114746094, -0.05393218994140625, -0.04912757873535156, -0.044322967529296875, -0.03951835632324219, -0.0347137451171875, -0.029909133911132812, -0.025104522705078125, -0.020299911499023438, -0.01549530029296875, -0.010690689086914062, -0.005886077880859375, -0.0010814666748046875, 0.00372314453125, 0.008527755737304688, 0.013332366943359375, 0.018136978149414062, 0.02294158935546875, 0.027746200561523438, 0.032550811767578125, 0.03735542297363281, 0.0421600341796875, 0.04696464538574219, 0.051769256591796875, 0.05657386779785156, 0.06137847900390625, 0.06618309020996094, 0.07098770141601562, 0.07579231262207031, 0.080596923828125, 0.08540153503417969, 0.09020614624023438, 0.09501075744628906, 0.09981536865234375, 0.10461997985839844, 0.10942459106445312, 0.11422920227050781, 0.1190338134765625, 0.12383842468261719, 0.12864303588867188, 0.13344764709472656, 0.13825225830078125, 0.14305686950683594, 0.14786148071289062, 0.1526660919189453, 0.157470703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 2.0, 5.0, 6.0, 4.0, 12.0, 20.0, 20.0, 35.0, 36.0, 56.0, 81.0, 134.0, 275.0, 567.0, 1213.0, 3223.0, 10885.0, 68548.0, 1591558.0, 2410642.0, 88037.0, 12695.0, 3630.0, 1275.0, 612.0, 280.0, 147.0, 98.0, 53.0, 27.0, 30.0, 20.0, 18.0, 14.0, 6.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.90185546875, -0.8718490600585938, -0.8418426513671875, -0.8118362426757812, -0.781829833984375, -0.7518234252929688, -0.7218170166015625, -0.6918106079101562, -0.66180419921875, -0.6317977905273438, -0.6017913818359375, -0.5717849731445312, -0.541778564453125, -0.5117721557617188, -0.4817657470703125, -0.45175933837890625, -0.4217529296875, -0.39174652099609375, -0.3617401123046875, -0.33173370361328125, -0.301727294921875, -0.27172088623046875, -0.2417144775390625, -0.21170806884765625, -0.18170166015625, -0.15169525146484375, -0.1216888427734375, -0.09168243408203125, -0.061676025390625, -0.03166961669921875, -0.0016632080078125, 0.02834320068359375, 0.058349609375, 0.08835601806640625, 0.1183624267578125, 0.14836883544921875, 0.178375244140625, 0.20838165283203125, 0.2383880615234375, 0.26839447021484375, 0.29840087890625, 0.32840728759765625, 0.3584136962890625, 0.38842010498046875, 0.418426513671875, 0.44843292236328125, 0.4784393310546875, 0.5084457397460938, 0.5384521484375, 0.5684585571289062, 0.5984649658203125, 0.6284713745117188, 0.658477783203125, 0.6884841918945312, 0.7184906005859375, 0.7484970092773438, 0.77850341796875, 0.8085098266601562, 0.8385162353515625, 0.8685226440429688, 0.898529052734375, 0.9285354614257812, 0.9585418701171875, 0.9885482788085938, 1.0185546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 11.0, 21.0, 30.0, 62.0, 91.0, 192.0, 325.0, 755.0, 1287.0, 659.0, 307.0, 155.0, 70.0, 46.0, 29.0, 9.0, 9.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1357421875, -1.1089706420898438, -1.0821990966796875, -1.0554275512695312, -1.028656005859375, -1.0018844604492188, -0.9751129150390625, -0.9483413696289062, -0.92156982421875, -0.8947982788085938, -0.8680267333984375, -0.8412551879882812, -0.814483642578125, -0.7877120971679688, -0.7609405517578125, -0.7341690063476562, -0.7073974609375, -0.6806259155273438, -0.6538543701171875, -0.6270828247070312, -0.600311279296875, -0.5735397338867188, -0.5467681884765625, -0.5199966430664062, -0.49322509765625, -0.46645355224609375, -0.4396820068359375, -0.41291046142578125, -0.386138916015625, -0.35936737060546875, -0.3325958251953125, -0.30582427978515625, -0.279052734375, -0.25228118896484375, -0.2255096435546875, -0.19873809814453125, -0.171966552734375, -0.14519500732421875, -0.1184234619140625, -0.09165191650390625, -0.06488037109375, -0.03810882568359375, -0.0113372802734375, 0.01543426513671875, 0.042205810546875, 0.06897735595703125, 0.0957489013671875, 0.12252044677734375, 0.1492919921875, 0.17606353759765625, 0.2028350830078125, 0.22960662841796875, 0.256378173828125, 0.28314971923828125, 0.3099212646484375, 0.33669281005859375, 0.36346435546875, 0.39023590087890625, 0.4170074462890625, 0.44377899169921875, 0.470550537109375, 0.49732208251953125, 0.5240936279296875, 0.5508651733398438, 0.57763671875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 7.0, 11.0, 21.0, 45.0, 65.0, 131.0, 157.0, 165.0, 158.0, 110.0, 70.0, 21.0, 14.0, 9.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.241469383239746, -6.104079246520996, -5.966689586639404, -5.829299449920654, -5.6919097900390625, -5.5545196533203125, -5.4171295166015625, -5.279739856719971, -5.142349720001221, -5.004959583282471, -4.867569923400879, -4.730179786682129, -4.592789649963379, -4.455399990081787, -4.318009853363037, -4.180620193481445, -4.043230056762695, -3.9058401584625244, -3.7684502601623535, -3.6310601234436035, -3.4936702251434326, -3.3562803268432617, -3.2188901901245117, -3.081500291824341, -2.94411039352417, -2.806720495223999, -2.669330596923828, -2.531940460205078, -2.3945505619049072, -2.2571606636047363, -2.1197705268859863, -1.9823806285858154, -1.8449907302856445, -1.7076008319854736, -1.5702108144760132, -1.4328207969665527, -1.2954308986663818, -1.158041000366211, -1.0206509828567505, -0.8832610249519348, -0.7458710670471191, -0.6084811091423035, -0.4710911512374878, -0.3337011933326721, -0.19631123542785645, -0.05892127752304077, 0.0784686803817749, 0.21585863828659058, 0.35324859619140625, 0.4906385540962219, 0.6280285120010376, 0.7654184699058533, 0.902808427810669, 1.0401983261108398, 1.1775883436203003, 1.3149783611297607, 1.4523682594299316, 1.5897581577301025, 1.727148175239563, 1.8645381927490234, 2.0019280910491943, 2.1393179893493652, 2.2767081260681152, 2.414098024368286, 2.551487922668457]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 9.0, 6.0, 14.0, 9.0, 11.0, 13.0, 21.0, 29.0, 18.0, 21.0, 31.0, 19.0, 27.0, 33.0, 39.0, 37.0, 32.0, 43.0, 41.0, 43.0, 32.0, 30.0, 47.0, 46.0, 29.0, 42.0, 29.0, 37.0, 28.0, 28.0, 9.0, 19.0, 20.0, 19.0, 16.0, 9.0, 10.0, 8.0, 14.0, 9.0, 5.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2509021759033203, -1.2080273628234863, -1.1651525497436523, -1.1222777366638184, -1.0794029235839844, -1.03652822971344, -0.993653416633606, -0.950778603553772, -0.907903790473938, -0.865028977394104, -0.82215416431427, -0.7792794108390808, -0.7364045977592468, -0.6935297846794128, -0.6506550312042236, -0.6077802181243896, -0.5649054050445557, -0.5220305919647217, -0.4791558086872101, -0.4362810254096985, -0.3934062123298645, -0.3505313992500305, -0.3076566159725189, -0.2647818326950073, -0.22190701961517334, -0.17903222143650055, -0.13615742325782776, -0.09328262507915497, -0.05040782690048218, -0.007533028721809387, 0.0353417694568634, 0.078216552734375, 0.12109136581420898, 0.16396616399288177, 0.20684096217155457, 0.24971576035022736, 0.29259055852890015, 0.33546537160873413, 0.3783401548862457, 0.4212149381637573, 0.4640897512435913, 0.5069645643234253, 0.5498393774032593, 0.5927141308784485, 0.6355889439582825, 0.6784637570381165, 0.7213385105133057, 0.7642133235931396, 0.8070881366729736, 0.8499629497528076, 0.8928377628326416, 0.9357125163078308, 0.9785873293876648, 1.021462082862854, 1.064336895942688, 1.107211709022522, 1.150086522102356, 1.19296133518219, 1.235836148262024, 1.278710961341858, 1.3215856552124023, 1.3644604682922363, 1.4073352813720703, 1.4502100944519043, 1.4930849075317383]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 10.0, 16.0, 30.0, 41.0, 67.0, 115.0, 217.0, 370.0, 688.0, 1408.0, 3055.0, 7280.0, 20885.0, 77673.0, 289393.0, 426563.0, 159512.0, 40089.0, 12206.0, 4728.0, 2056.0, 969.0, 523.0, 273.0, 129.0, 90.0, 55.0, 31.0, 15.0, 15.0, 13.0, 8.0, 10.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432373046875, -0.41854095458984375, -0.4047088623046875, -0.39087677001953125, -0.377044677734375, -0.36321258544921875, -0.3493804931640625, -0.33554840087890625, -0.32171630859375, -0.30788421630859375, -0.2940521240234375, -0.28022003173828125, -0.266387939453125, -0.25255584716796875, -0.2387237548828125, -0.22489166259765625, -0.2110595703125, -0.19722747802734375, -0.1833953857421875, -0.16956329345703125, -0.155731201171875, -0.14189910888671875, -0.1280670166015625, -0.11423492431640625, -0.10040283203125, -0.08657073974609375, -0.0727386474609375, -0.05890655517578125, -0.045074462890625, -0.03124237060546875, -0.0174102783203125, -0.00357818603515625, 0.01025390625, 0.02408599853515625, 0.0379180908203125, 0.05175018310546875, 0.065582275390625, 0.07941436767578125, 0.0932464599609375, 0.10707855224609375, 0.12091064453125, 0.13474273681640625, 0.1485748291015625, 0.16240692138671875, 0.176239013671875, 0.19007110595703125, 0.2039031982421875, 0.21773529052734375, 0.2315673828125, 0.24539947509765625, 0.2592315673828125, 0.27306365966796875, 0.286895751953125, 0.30072784423828125, 0.3145599365234375, 0.32839202880859375, 0.34222412109375, 0.35605621337890625, 0.3698883056640625, 0.38372039794921875, 0.397552490234375, 0.41138458251953125, 0.4252166748046875, 0.43904876708984375, 0.452880859375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 7.0, 7.0, 11.0, 18.0, 13.0, 9.0, 22.0, 16.0, 24.0, 24.0, 26.0, 27.0, 34.0, 35.0, 32.0, 49.0, 37.0, 50.0, 35.0, 33.0, 35.0, 38.0, 38.0, 34.0, 39.0, 35.0, 31.0, 34.0, 30.0, 27.0, 16.0, 20.0, 10.0, 19.0, 20.0, 13.0, 10.0, 6.0, 3.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.1795654296875, -0.17431259155273438, -0.16905975341796875, -0.16380691528320312, -0.1585540771484375, -0.15330123901367188, -0.14804840087890625, -0.14279556274414062, -0.137542724609375, -0.13228988647460938, -0.12703704833984375, -0.12178421020507812, -0.1165313720703125, -0.11127853393554688, -0.10602569580078125, -0.10077285766601562, -0.09552001953125, -0.09026718139648438, -0.08501434326171875, -0.07976150512695312, -0.0745086669921875, -0.06925582885742188, -0.06400299072265625, -0.058750152587890625, -0.053497314453125, -0.048244476318359375, -0.04299163818359375, -0.037738800048828125, -0.0324859619140625, -0.027233123779296875, -0.02198028564453125, -0.016727447509765625, -0.011474609375, -0.006221771240234375, -0.00096893310546875, 0.004283905029296875, 0.0095367431640625, 0.014789581298828125, 0.02004241943359375, 0.025295257568359375, 0.030548095703125, 0.035800933837890625, 0.04105377197265625, 0.046306610107421875, 0.0515594482421875, 0.056812286376953125, 0.06206512451171875, 0.06731796264648438, 0.07257080078125, 0.07782363891601562, 0.08307647705078125, 0.08832931518554688, 0.0935821533203125, 0.09883499145507812, 0.10408782958984375, 0.10934066772460938, 0.114593505859375, 0.11984634399414062, 0.12509918212890625, 0.13035202026367188, 0.1356048583984375, 0.14085769653320312, 0.14611053466796875, 0.15136337280273438, 0.1566162109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 7.0, 10.0, 16.0, 25.0, 35.0, 73.0, 149.0, 305.0, 684.0, 1655.0, 4915.0, 17382.0, 74259.0, 342551.0, 453863.0, 116445.0, 25156.0, 7115.0, 2349.0, 863.0, 334.0, 158.0, 81.0, 36.0, 25.0, 13.0, 16.0, 4.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453369140625, -0.4366645812988281, -0.41996002197265625, -0.4032554626464844, -0.3865509033203125, -0.3698463439941406, -0.35314178466796875, -0.3364372253417969, -0.319732666015625, -0.3030281066894531, -0.28632354736328125, -0.2696189880371094, -0.2529144287109375, -0.23620986938476562, -0.21950531005859375, -0.20280075073242188, -0.18609619140625, -0.16939163208007812, -0.15268707275390625, -0.13598251342773438, -0.1192779541015625, -0.10257339477539062, -0.08586883544921875, -0.06916427612304688, -0.052459716796875, -0.035755157470703125, -0.01905059814453125, -0.002346038818359375, 0.0143585205078125, 0.031063079833984375, 0.04776763916015625, 0.06447219848632812, 0.0811767578125, 0.09788131713867188, 0.11458587646484375, 0.13129043579101562, 0.1479949951171875, 0.16469955444335938, 0.18140411376953125, 0.19810867309570312, 0.214813232421875, 0.23151779174804688, 0.24822235107421875, 0.2649269104003906, 0.2816314697265625, 0.2983360290527344, 0.31504058837890625, 0.3317451477050781, 0.34844970703125, 0.3651542663574219, 0.38185882568359375, 0.3985633850097656, 0.4152679443359375, 0.4319725036621094, 0.44867706298828125, 0.4653816223144531, 0.482086181640625, 0.4987907409667969, 0.5154953002929688, 0.5321998596191406, 0.5489044189453125, 0.5656089782714844, 0.5823135375976562, 0.5990180969238281, 0.61572265625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 12.0, 3.0, 16.0, 13.0, 16.0, 14.0, 22.0, 28.0, 19.0, 30.0, 44.0, 38.0, 45.0, 48.0, 51.0, 52.0, 41.0, 49.0, 36.0, 39.0, 51.0, 49.0, 31.0, 27.0, 38.0, 30.0, 30.0, 22.0, 19.0, 20.0, 12.0, 10.0, 13.0, 2.0, 5.0, 1.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56591796875, -0.5464859008789062, -0.5270538330078125, -0.5076217651367188, -0.488189697265625, -0.46875762939453125, -0.4493255615234375, -0.42989349365234375, -0.41046142578125, -0.39102935791015625, -0.3715972900390625, -0.35216522216796875, -0.332733154296875, -0.31330108642578125, -0.2938690185546875, -0.27443695068359375, -0.2550048828125, -0.23557281494140625, -0.2161407470703125, -0.19670867919921875, -0.177276611328125, -0.15784454345703125, -0.1384124755859375, -0.11898040771484375, -0.09954833984375, -0.08011627197265625, -0.0606842041015625, -0.04125213623046875, -0.021820068359375, -0.00238800048828125, 0.0170440673828125, 0.03647613525390625, 0.055908203125, 0.07534027099609375, 0.0947723388671875, 0.11420440673828125, 0.133636474609375, 0.15306854248046875, 0.1725006103515625, 0.19193267822265625, 0.21136474609375, 0.23079681396484375, 0.2502288818359375, 0.26966094970703125, 0.289093017578125, 0.30852508544921875, 0.3279571533203125, 0.34738922119140625, 0.3668212890625, 0.38625335693359375, 0.4056854248046875, 0.42511749267578125, 0.444549560546875, 0.46398162841796875, 0.4834136962890625, 0.5028457641601562, 0.52227783203125, 0.5417098999023438, 0.5611419677734375, 0.5805740356445312, 0.600006103515625, 0.6194381713867188, 0.6388702392578125, 0.6583023071289062, 0.677734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 18.0, 18.0, 28.0, 42.0, 72.0, 116.0, 191.0, 321.0, 530.0, 1016.0, 1835.0, 3721.0, 7628.0, 17017.0, 43313.0, 135000.0, 388760.0, 300624.0, 91115.0, 31741.0, 12969.0, 6079.0, 2925.0, 1491.0, 831.0, 459.0, 270.0, 160.0, 90.0, 56.0, 43.0, 27.0, 16.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267822265625, -0.2603492736816406, -0.25287628173828125, -0.24540328979492188, -0.2379302978515625, -0.23045730590820312, -0.22298431396484375, -0.21551132202148438, -0.208038330078125, -0.20056533813476562, -0.19309234619140625, -0.18561935424804688, -0.1781463623046875, -0.17067337036132812, -0.16320037841796875, -0.15572738647460938, -0.14825439453125, -0.14078140258789062, -0.13330841064453125, -0.12583541870117188, -0.1183624267578125, -0.11088943481445312, -0.10341644287109375, -0.09594345092773438, -0.088470458984375, -0.08099746704101562, -0.07352447509765625, -0.06605148315429688, -0.0585784912109375, -0.051105499267578125, -0.04363250732421875, -0.036159515380859375, -0.0286865234375, -0.021213531494140625, -0.01374053955078125, -0.006267547607421875, 0.0012054443359375, 0.008678436279296875, 0.01615142822265625, 0.023624420166015625, 0.031097412109375, 0.038570404052734375, 0.04604339599609375, 0.053516387939453125, 0.0609893798828125, 0.06846237182617188, 0.07593536376953125, 0.08340835571289062, 0.09088134765625, 0.09835433959960938, 0.10582733154296875, 0.11330032348632812, 0.1207733154296875, 0.12824630737304688, 0.13571929931640625, 0.14319229125976562, 0.150665283203125, 0.15813827514648438, 0.16561126708984375, 0.17308425903320312, 0.1805572509765625, 0.18803024291992188, 0.19550323486328125, 0.20297622680664062, 0.21044921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 9.0, 10.0, 2.0, 8.0, 18.0, 24.0, 37.0, 56.0, 75.0, 97.0, 114.0, 137.0, 134.0, 90.0, 47.0, 31.0, 34.0, 29.0, 13.0, 14.0, 10.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.449222564697266e-05, -6.221514195203781e-05, -5.9938058257102966e-05, -5.766097456216812e-05, -5.5383890867233276e-05, -5.310680717229843e-05, -5.0829723477363586e-05, -4.855263978242874e-05, -4.6275556087493896e-05, -4.399847239255905e-05, -4.1721388697624207e-05, -3.944430500268936e-05, -3.7167221307754517e-05, -3.489013761281967e-05, -3.261305391788483e-05, -3.033597022294998e-05, -2.8058886528015137e-05, -2.5781802833080292e-05, -2.3504719138145447e-05, -2.1227635443210602e-05, -1.8950551748275757e-05, -1.6673468053340912e-05, -1.4396384358406067e-05, -1.2119300663471222e-05, -9.842216968536377e-06, -7.565133273601532e-06, -5.288049578666687e-06, -3.010965883731842e-06, -7.338821887969971e-07, 1.543201506137848e-06, 3.820285201072693e-06, 6.097368896007538e-06, 8.374452590942383e-06, 1.0651536285877228e-05, 1.2928619980812073e-05, 1.5205703675746918e-05, 1.7482787370681763e-05, 1.9759871065616608e-05, 2.2036954760551453e-05, 2.4314038455486298e-05, 2.6591122150421143e-05, 2.8868205845355988e-05, 3.114528954029083e-05, 3.342237323522568e-05, 3.569945693016052e-05, 3.797654062509537e-05, 4.025362432003021e-05, 4.253070801496506e-05, 4.48077917098999e-05, 4.708487540483475e-05, 4.936195909976959e-05, 5.163904279470444e-05, 5.391612648963928e-05, 5.619321018457413e-05, 5.847029387950897e-05, 6.074737757444382e-05, 6.302446126937866e-05, 6.530154496431351e-05, 6.757862865924835e-05, 6.98557123541832e-05, 7.213279604911804e-05, 7.440987974405289e-05, 7.668696343898773e-05, 7.896404713392258e-05, 8.124113082885742e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 7.0, 9.0, 12.0, 17.0, 16.0, 33.0, 44.0, 81.0, 141.0, 210.0, 360.0, 686.0, 1342.0, 2564.0, 5529.0, 12895.0, 36999.0, 146561.0, 469310.0, 272449.0, 64565.0, 19515.0, 7857.0, 3464.0, 1800.0, 900.0, 463.0, 250.0, 176.0, 99.0, 67.0, 33.0, 21.0, 20.0, 19.0, 9.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307373046875, -0.2979774475097656, -0.28858184814453125, -0.2791862487792969, -0.2697906494140625, -0.2603950500488281, -0.25099945068359375, -0.24160385131835938, -0.232208251953125, -0.22281265258789062, -0.21341705322265625, -0.20402145385742188, -0.1946258544921875, -0.18523025512695312, -0.17583465576171875, -0.16643905639648438, -0.15704345703125, -0.14764785766601562, -0.13825225830078125, -0.12885665893554688, -0.1194610595703125, -0.11006546020507812, -0.10066986083984375, -0.09127426147460938, -0.081878662109375, -0.07248306274414062, -0.06308746337890625, -0.053691864013671875, -0.0442962646484375, -0.034900665283203125, -0.02550506591796875, -0.016109466552734375, -0.0067138671875, 0.002681732177734375, 0.01207733154296875, 0.021472930908203125, 0.0308685302734375, 0.040264129638671875, 0.04965972900390625, 0.059055328369140625, 0.068450927734375, 0.07784652709960938, 0.08724212646484375, 0.09663772583007812, 0.1060333251953125, 0.11542892456054688, 0.12482452392578125, 0.13422012329101562, 0.14361572265625, 0.15301132202148438, 0.16240692138671875, 0.17180252075195312, 0.1811981201171875, 0.19059371948242188, 0.19998931884765625, 0.20938491821289062, 0.218780517578125, 0.22817611694335938, 0.23757171630859375, 0.24696731567382812, 0.2563629150390625, 0.2657585144042969, 0.27515411376953125, 0.2845497131347656, 0.2939453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 6.0, 8.0, 12.0, 9.0, 19.0, 17.0, 23.0, 23.0, 42.0, 50.0, 51.0, 62.0, 82.0, 81.0, 93.0, 75.0, 69.0, 58.0, 34.0, 33.0, 23.0, 26.0, 19.0, 13.0, 12.0, 16.0, 7.0, 4.0, 6.0, 4.0, 1.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.194580078125, -0.18806076049804688, -0.18154144287109375, -0.17502212524414062, -0.1685028076171875, -0.16198348999023438, -0.15546417236328125, -0.14894485473632812, -0.142425537109375, -0.13590621948242188, -0.12938690185546875, -0.12286758422851562, -0.1163482666015625, -0.10982894897460938, -0.10330963134765625, -0.09679031372070312, -0.09027099609375, -0.08375167846679688, -0.07723236083984375, -0.07071304321289062, -0.0641937255859375, -0.057674407958984375, -0.05115509033203125, -0.044635772705078125, -0.038116455078125, -0.031597137451171875, -0.02507781982421875, -0.018558502197265625, -0.0120391845703125, -0.005519866943359375, 0.00099945068359375, 0.007518768310546875, 0.0140380859375, 0.020557403564453125, 0.02707672119140625, 0.033596038818359375, 0.0401153564453125, 0.046634674072265625, 0.05315399169921875, 0.059673309326171875, 0.066192626953125, 0.07271194458007812, 0.07923126220703125, 0.08575057983398438, 0.0922698974609375, 0.09878921508789062, 0.10530853271484375, 0.11182785034179688, 0.11834716796875, 0.12486648559570312, 0.13138580322265625, 0.13790512084960938, 0.1444244384765625, 0.15094375610351562, 0.15746307373046875, 0.16398239135742188, 0.170501708984375, 0.17702102661132812, 0.18354034423828125, 0.19005966186523438, 0.1965789794921875, 0.20309829711914062, 0.20961761474609375, 0.21613693237304688, 0.22265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 14.0, 38.0, 89.0, 172.0, 234.0, 220.0, 124.0, 64.0, 22.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.845476150512695, -5.6986165046691895, -5.551756858825684, -5.404897689819336, -5.25803804397583, -5.111178398132324, -4.964318752288818, -4.8174591064453125, -4.670599460601807, -4.523739814758301, -4.376880168914795, -4.230020523071289, -4.083161354064941, -3.9363017082214355, -3.7894420623779297, -3.642582416534424, -3.495723009109497, -3.348863363265991, -3.2020039558410645, -3.0551443099975586, -2.9082846641540527, -2.761425018310547, -2.61456561088562, -2.4677059650421143, -2.3208465576171875, -2.1739869117736816, -2.027127504348755, -1.880267858505249, -1.7334082126617432, -1.5865486860275269, -1.4396891593933105, -1.2928295135498047, -1.145970106124878, -0.9991105198860168, -0.8522509336471558, -0.7053914070129395, -0.5585318207740784, -0.4116722345352173, -0.264812707901001, -0.11795306205749512, 0.02890646457672119, 0.17576603591442108, 0.32262560725212097, 0.46948516368865967, 0.6163447499275208, 0.7632043361663818, 0.9100638628005981, 1.056923508644104, 1.2037830352783203, 1.3506425619125366, 1.4975022077560425, 1.6443617343902588, 1.7912213802337646, 1.938080906867981, 2.0849404335021973, 2.231800079345703, 2.378659725189209, 2.525519371032715, 2.6723787784576416, 2.8192384243011475, 2.9660980701446533, 3.11295747756958, 3.259817123413086, 3.406676769256592, 3.5535361766815186]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 12.0, 11.0, 18.0, 16.0, 11.0, 16.0, 21.0, 38.0, 29.0, 31.0, 26.0, 34.0, 32.0, 42.0, 26.0, 42.0, 43.0, 47.0, 38.0, 39.0, 33.0, 45.0, 39.0, 38.0, 26.0, 32.0, 18.0, 23.0, 22.0, 22.0, 15.0, 20.0, 15.0, 10.0, 5.0, 8.0, 10.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.6498146057128906, -1.5995581150054932, -1.5493016242980957, -1.4990451335906982, -1.4487886428833008, -1.3985321521759033, -1.3482756614685059, -1.2980191707611084, -1.247762680053711, -1.1975061893463135, -1.147249698638916, -1.0969932079315186, -1.046736717224121, -0.9964802265167236, -0.9462236762046814, -0.8959671854972839, -0.8457106351852417, -0.7954541444778442, -0.7451976537704468, -0.6949411630630493, -0.6446846723556519, -0.5944281816482544, -0.5441716313362122, -0.4939151406288147, -0.44365864992141724, -0.3934021592140198, -0.3431456685066223, -0.29288914799690247, -0.242632657289505, -0.19237616658210754, -0.1421196460723877, -0.09186315536499023, -0.04160666465759277, 0.008649833500385284, 0.05890633165836334, 0.109162837266922, 0.15941932797431946, 0.20967581868171692, 0.25993233919143677, 0.31018882989883423, 0.3604453206062317, 0.41070181131362915, 0.4609583020210266, 0.5112148523330688, 0.5614713430404663, 0.6117278337478638, 0.6619843244552612, 0.7122408151626587, 0.7624973058700562, 0.8127537965774536, 0.8630102872848511, 0.9132667779922485, 0.963523268699646, 1.0137797594070435, 1.0640363693237305, 1.114292860031128, 1.1645493507385254, 1.2148058414459229, 1.2650623321533203, 1.3153188228607178, 1.3655753135681152, 1.4158318042755127, 1.4660882949829102, 1.5163447856903076, 1.566601276397705]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 12.0, 15.0, 26.0, 18.0, 39.0, 43.0, 68.0, 85.0, 135.0, 193.0, 275.0, 433.0, 644.0, 998.0, 1691.0, 2833.0, 5192.0, 10374.0, 24255.0, 74940.0, 327328.0, 1555616.0, 1696971.0, 357166.0, 84006.0, 27261.0, 11080.0, 5392.0, 2824.0, 1601.0, 1031.0, 612.0, 352.0, 250.0, 166.0, 107.0, 75.0, 57.0, 44.0, 22.0, 14.0, 9.0, 8.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0], "bins": [-0.35546875, -0.34560394287109375, -0.3357391357421875, -0.32587432861328125, -0.316009521484375, -0.30614471435546875, -0.2962799072265625, -0.28641510009765625, -0.27655029296875, -0.26668548583984375, -0.2568206787109375, -0.24695587158203125, -0.237091064453125, -0.22722625732421875, -0.2173614501953125, -0.20749664306640625, -0.1976318359375, -0.18776702880859375, -0.1779022216796875, -0.16803741455078125, -0.158172607421875, -0.14830780029296875, -0.1384429931640625, -0.12857818603515625, -0.11871337890625, -0.10884857177734375, -0.0989837646484375, -0.08911895751953125, -0.079254150390625, -0.06938934326171875, -0.0595245361328125, -0.04965972900390625, -0.039794921875, -0.02993011474609375, -0.0200653076171875, -0.01020050048828125, -0.000335693359375, 0.00952911376953125, 0.0193939208984375, 0.02925872802734375, 0.03912353515625, 0.04898834228515625, 0.0588531494140625, 0.06871795654296875, 0.078582763671875, 0.08844757080078125, 0.0983123779296875, 0.10817718505859375, 0.1180419921875, 0.12790679931640625, 0.1377716064453125, 0.14763641357421875, 0.157501220703125, 0.16736602783203125, 0.1772308349609375, 0.18709564208984375, 0.19696044921875, 0.20682525634765625, 0.2166900634765625, 0.22655487060546875, 0.236419677734375, 0.24628448486328125, 0.2561492919921875, 0.26601409912109375, 0.27587890625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 5.0, 5.0, 12.0, 8.0, 18.0, 16.0, 12.0, 17.0, 27.0, 31.0, 36.0, 31.0, 44.0, 36.0, 49.0, 50.0, 60.0, 50.0, 48.0, 36.0, 32.0, 42.0, 45.0, 43.0, 37.0, 32.0, 18.0, 29.0, 25.0, 12.0, 17.0, 15.0, 11.0, 13.0, 8.0, 4.0, 10.0, 4.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-0.2454833984375, -0.23904037475585938, -0.23259735107421875, -0.22615432739257812, -0.2197113037109375, -0.21326828002929688, -0.20682525634765625, -0.20038223266601562, -0.193939208984375, -0.18749618530273438, -0.18105316162109375, -0.17461013793945312, -0.1681671142578125, -0.16172409057617188, -0.15528106689453125, -0.14883804321289062, -0.14239501953125, -0.13595199584960938, -0.12950897216796875, -0.12306594848632812, -0.1166229248046875, -0.11017990112304688, -0.10373687744140625, -0.09729385375976562, -0.090850830078125, -0.08440780639648438, -0.07796478271484375, -0.07152175903320312, -0.0650787353515625, -0.058635711669921875, -0.05219268798828125, -0.045749664306640625, -0.039306640625, -0.032863616943359375, -0.02642059326171875, -0.019977569580078125, -0.0135345458984375, -0.007091522216796875, -0.00064849853515625, 0.005794525146484375, 0.012237548828125, 0.018680572509765625, 0.02512359619140625, 0.031566619873046875, 0.0380096435546875, 0.044452667236328125, 0.05089569091796875, 0.057338714599609375, 0.06378173828125, 0.07022476196289062, 0.07666778564453125, 0.08311080932617188, 0.0895538330078125, 0.09599685668945312, 0.10243988037109375, 0.10888290405273438, 0.115325927734375, 0.12176895141601562, 0.12821197509765625, 0.13465499877929688, 0.1410980224609375, 0.14754104614257812, 0.15398406982421875, 0.16042709350585938, 0.1668701171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 14.0, 9.0, 12.0, 24.0, 18.0, 36.0, 48.0, 57.0, 106.0, 147.0, 234.0, 349.0, 549.0, 913.0, 1730.0, 3723.0, 9052.0, 28752.0, 146011.0, 1909489.0, 1902036.0, 145253.0, 28707.0, 9085.0, 3670.0, 1724.0, 985.0, 553.0, 304.0, 234.0, 143.0, 93.0, 57.0, 34.0, 39.0, 23.0, 22.0, 15.0, 12.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.57861328125, -0.5563583374023438, -0.5341033935546875, -0.5118484497070312, -0.489593505859375, -0.46733856201171875, -0.4450836181640625, -0.42282867431640625, -0.40057373046875, -0.37831878662109375, -0.3560638427734375, -0.33380889892578125, -0.311553955078125, -0.28929901123046875, -0.2670440673828125, -0.24478912353515625, -0.2225341796875, -0.20027923583984375, -0.1780242919921875, -0.15576934814453125, -0.133514404296875, -0.11125946044921875, -0.0890045166015625, -0.06674957275390625, -0.04449462890625, -0.02223968505859375, 1.52587890625e-05, 0.02227020263671875, 0.044525146484375, 0.06678009033203125, 0.0890350341796875, 0.11128997802734375, 0.133544921875, 0.15579986572265625, 0.1780548095703125, 0.20030975341796875, 0.222564697265625, 0.24481964111328125, 0.2670745849609375, 0.28932952880859375, 0.31158447265625, 0.33383941650390625, 0.3560943603515625, 0.37834930419921875, 0.400604248046875, 0.42285919189453125, 0.4451141357421875, 0.46736907958984375, 0.4896240234375, 0.5118789672851562, 0.5341339111328125, 0.5563888549804688, 0.578643798828125, 0.6008987426757812, 0.6231536865234375, 0.6454086303710938, 0.66766357421875, 0.6899185180664062, 0.7121734619140625, 0.7344284057617188, 0.756683349609375, 0.7789382934570312, 0.8011932373046875, 0.8234481811523438, 0.845703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 8.0, 3.0, 4.0, 13.0, 29.0, 34.0, 38.0, 82.0, 103.0, 175.0, 266.0, 487.0, 804.0, 866.0, 494.0, 239.0, 141.0, 96.0, 69.0, 34.0, 22.0, 23.0, 12.0, 12.0, 0.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.7998046875, -0.7802886962890625, -0.760772705078125, -0.7412567138671875, -0.72174072265625, -0.7022247314453125, -0.682708740234375, -0.6631927490234375, -0.6436767578125, -0.6241607666015625, -0.604644775390625, -0.5851287841796875, -0.56561279296875, -0.5460968017578125, -0.526580810546875, -0.5070648193359375, -0.487548828125, -0.4680328369140625, -0.448516845703125, -0.4290008544921875, -0.40948486328125, -0.3899688720703125, -0.370452880859375, -0.3509368896484375, -0.3314208984375, -0.3119049072265625, -0.292388916015625, -0.2728729248046875, -0.25335693359375, -0.2338409423828125, -0.214324951171875, -0.1948089599609375, -0.17529296875, -0.1557769775390625, -0.136260986328125, -0.1167449951171875, -0.09722900390625, -0.0777130126953125, -0.058197021484375, -0.0386810302734375, -0.0191650390625, 0.0003509521484375, 0.019866943359375, 0.0393829345703125, 0.05889892578125, 0.0784149169921875, 0.097930908203125, 0.1174468994140625, 0.136962890625, 0.1564788818359375, 0.175994873046875, 0.1955108642578125, 0.21502685546875, 0.2345428466796875, 0.254058837890625, 0.2735748291015625, 0.2930908203125, 0.3126068115234375, 0.332122802734375, 0.3516387939453125, 0.37115478515625, 0.3906707763671875, 0.410186767578125, 0.4297027587890625, 0.44921875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 7.0, 16.0, 13.0, 30.0, 42.0, 136.0, 238.0, 243.0, 155.0, 81.0, 28.0, 11.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.802663803100586, -7.630014419555664, -7.457364559173584, -7.284715175628662, -7.11206579208374, -6.939416408538818, -6.766766548156738, -6.594117164611816, -6.4214677810668945, -6.248818397521973, -6.076168537139893, -5.903519153594971, -5.730869770050049, -5.558220386505127, -5.385570526123047, -5.212921142578125, -5.040271759033203, -4.867622375488281, -4.694972515106201, -4.522323131561279, -4.349673748016357, -4.1770243644714355, -4.0043745040893555, -3.8317251205444336, -3.6590752601623535, -3.4864256381988525, -3.3137762546539307, -3.1411266326904297, -2.968477249145508, -2.795827627182007, -2.623178005218506, -2.450528621673584, -2.277879238128662, -2.105229616165161, -1.9325802326202393, -1.7599306106567383, -1.5872812271118164, -1.4146316051483154, -1.241982102394104, -1.0693325996398926, -0.8966830968856812, -0.7240335941314697, -0.5513840913772583, -0.3787345290184021, -0.20608502626419067, -0.03343552350997925, 0.13921403884887695, 0.3118635416030884, 0.4845130443572998, 0.6571625471115112, 0.8298120498657227, 1.0024616718292236, 1.1751110553741455, 1.3477606773376465, 1.520410180091858, 1.6930596828460693, 1.8657091856002808, 2.038358688354492, 2.211008310317993, 2.383657693862915, 2.556307315826416, 2.728956699371338, 2.901606321334839, 3.07425594329834, 3.2469053268432617]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 1.0, 3.0, 4.0, 2.0, 13.0, 9.0, 11.0, 6.0, 17.0, 10.0, 20.0, 18.0, 19.0, 28.0, 33.0, 32.0, 29.0, 24.0, 29.0, 41.0, 33.0, 44.0, 37.0, 30.0, 38.0, 44.0, 45.0, 30.0, 40.0, 38.0, 30.0, 31.0, 24.0, 25.0, 23.0, 19.0, 22.0, 21.0, 12.0, 13.0, 8.0, 12.0, 6.0, 8.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.2920538187026978, -1.2525336742401123, -1.2130136489868164, -1.173493504524231, -1.1339733600616455, -1.0944533348083496, -1.0549331903457642, -1.0154130458831787, -0.9758930206298828, -0.9363729357719421, -0.8968528509140015, -0.857332706451416, -0.8178126215934753, -0.7782925367355347, -0.7387723922729492, -0.6992523074150085, -0.6597322225570679, -0.6202121376991272, -0.5806920528411865, -0.5411719083786011, -0.5016518235206604, -0.4621317386627197, -0.42261162400245667, -0.3830915093421936, -0.34357142448425293, -0.30405133962631226, -0.2645312249660492, -0.22501112520694733, -0.18549102544784546, -0.1459709256887436, -0.10645082592964172, -0.06693071126937866, -0.02741062641143799, 0.01210947334766388, 0.05162957310676575, 0.09114967286586761, 0.13066977262496948, 0.17018987238407135, 0.20970997214317322, 0.24923008680343628, 0.28875017166137695, 0.3282702565193176, 0.3677903711795807, 0.40731048583984375, 0.4468305706977844, 0.4863506555557251, 0.5258708000183105, 0.5653908848762512, 0.6049109697341919, 0.6444310545921326, 0.6839511394500732, 0.7234712839126587, 0.7629913687705994, 0.80251145362854, 0.8420315980911255, 0.8815516829490662, 0.9210717678070068, 0.9605918526649475, 1.0001119375228882, 1.0396320819854736, 1.0791521072387695, 1.118672251701355, 1.1581923961639404, 1.1977124214172363, 1.2372325658798218]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 16.0, 23.0, 20.0, 36.0, 79.0, 112.0, 172.0, 276.0, 443.0, 725.0, 1314.0, 2350.0, 4350.0, 8770.0, 18687.0, 45650.0, 134330.0, 346117.0, 306532.0, 107597.0, 38025.0, 16371.0, 7787.0, 3883.0, 2042.0, 1147.0, 631.0, 414.0, 240.0, 127.0, 95.0, 71.0, 46.0, 29.0, 15.0, 12.0, 9.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.45361328125, -0.4393959045410156, -0.42517852783203125, -0.4109611511230469, -0.3967437744140625, -0.3825263977050781, -0.36830902099609375, -0.3540916442871094, -0.339874267578125, -0.3256568908691406, -0.31143951416015625, -0.2972221374511719, -0.2830047607421875, -0.2687873840332031, -0.25457000732421875, -0.24035263061523438, -0.22613525390625, -0.21191787719726562, -0.19770050048828125, -0.18348312377929688, -0.1692657470703125, -0.15504837036132812, -0.14083099365234375, -0.12661361694335938, -0.112396240234375, -0.09817886352539062, -0.08396148681640625, -0.06974411010742188, -0.0555267333984375, -0.041309356689453125, -0.02709197998046875, -0.012874603271484375, 0.0013427734375, 0.015560150146484375, 0.02977752685546875, 0.043994903564453125, 0.0582122802734375, 0.07242965698242188, 0.08664703369140625, 0.10086441040039062, 0.115081787109375, 0.12929916381835938, 0.14351654052734375, 0.15773391723632812, 0.1719512939453125, 0.18616867065429688, 0.20038604736328125, 0.21460342407226562, 0.22882080078125, 0.24303817749023438, 0.25725555419921875, 0.2714729309082031, 0.2856903076171875, 0.2999076843261719, 0.31412506103515625, 0.3283424377441406, 0.342559814453125, 0.3567771911621094, 0.37099456787109375, 0.3852119445800781, 0.3994293212890625, 0.4136466979980469, 0.42786407470703125, 0.4420814514160156, 0.456298828125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 3.0, 2.0, 12.0, 9.0, 12.0, 11.0, 21.0, 20.0, 19.0, 24.0, 32.0, 28.0, 28.0, 50.0, 31.0, 43.0, 52.0, 43.0, 35.0, 49.0, 44.0, 54.0, 39.0, 41.0, 34.0, 35.0, 28.0, 28.0, 29.0, 22.0, 23.0, 20.0, 19.0, 10.0, 10.0, 7.0, 6.0, 3.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0], "bins": [-0.248779296875, -0.241973876953125, -0.23516845703125, -0.228363037109375, -0.2215576171875, -0.214752197265625, -0.20794677734375, -0.201141357421875, -0.1943359375, -0.187530517578125, -0.18072509765625, -0.173919677734375, -0.1671142578125, -0.160308837890625, -0.15350341796875, -0.146697998046875, -0.139892578125, -0.133087158203125, -0.12628173828125, -0.119476318359375, -0.1126708984375, -0.105865478515625, -0.09906005859375, -0.092254638671875, -0.08544921875, -0.078643798828125, -0.07183837890625, -0.065032958984375, -0.0582275390625, -0.051422119140625, -0.04461669921875, -0.037811279296875, -0.031005859375, -0.024200439453125, -0.01739501953125, -0.010589599609375, -0.0037841796875, 0.003021240234375, 0.00982666015625, 0.016632080078125, 0.0234375, 0.030242919921875, 0.03704833984375, 0.043853759765625, 0.0506591796875, 0.057464599609375, 0.06427001953125, 0.071075439453125, 0.077880859375, 0.084686279296875, 0.09149169921875, 0.098297119140625, 0.1051025390625, 0.111907958984375, 0.11871337890625, 0.125518798828125, 0.13232421875, 0.139129638671875, 0.14593505859375, 0.152740478515625, 0.1595458984375, 0.166351318359375, 0.17315673828125, 0.179962158203125, 0.186767578125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 8.0, 14.0, 28.0, 33.0, 58.0, 88.0, 135.0, 176.0, 266.0, 407.0, 675.0, 1087.0, 1806.0, 3180.0, 5323.0, 9886.0, 19250.0, 46786.0, 142864.0, 383623.0, 280472.0, 88077.0, 31695.0, 14467.0, 7502.0, 4125.0, 2466.0, 1492.0, 890.0, 592.0, 351.0, 214.0, 157.0, 106.0, 88.0, 46.0, 40.0, 24.0, 10.0, 14.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.474853515625, -0.4599189758300781, -0.44498443603515625, -0.4300498962402344, -0.4151153564453125, -0.4001808166503906, -0.38524627685546875, -0.3703117370605469, -0.355377197265625, -0.3404426574707031, -0.32550811767578125, -0.3105735778808594, -0.2956390380859375, -0.2807044982910156, -0.26576995849609375, -0.2508354187011719, -0.23590087890625, -0.22096633911132812, -0.20603179931640625, -0.19109725952148438, -0.1761627197265625, -0.16122817993164062, -0.14629364013671875, -0.13135910034179688, -0.116424560546875, -0.10149002075195312, -0.08655548095703125, -0.07162094116210938, -0.0566864013671875, -0.041751861572265625, -0.02681732177734375, -0.011882781982421875, 0.0030517578125, 0.017986297607421875, 0.03292083740234375, 0.047855377197265625, 0.0627899169921875, 0.07772445678710938, 0.09265899658203125, 0.10759353637695312, 0.122528076171875, 0.13746261596679688, 0.15239715576171875, 0.16733169555664062, 0.1822662353515625, 0.19720077514648438, 0.21213531494140625, 0.22706985473632812, 0.24200439453125, 0.2569389343261719, 0.27187347412109375, 0.2868080139160156, 0.3017425537109375, 0.3166770935058594, 0.33161163330078125, 0.3465461730957031, 0.361480712890625, 0.3764152526855469, 0.39134979248046875, 0.4062843322753906, 0.4212188720703125, 0.4361534118652344, 0.45108795166015625, 0.4660224914550781, 0.48095703125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 8.0, 7.0, 11.0, 14.0, 8.0, 16.0, 15.0, 19.0, 21.0, 28.0, 36.0, 27.0, 34.0, 43.0, 43.0, 34.0, 52.0, 39.0, 44.0, 59.0, 40.0, 46.0, 32.0, 34.0, 32.0, 48.0, 42.0, 34.0, 20.0, 20.0, 8.0, 17.0, 7.0, 14.0, 7.0, 11.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75, -0.7263717651367188, -0.7027435302734375, -0.6791152954101562, -0.655487060546875, -0.6318588256835938, -0.6082305908203125, -0.5846023559570312, -0.56097412109375, -0.5373458862304688, -0.5137176513671875, -0.49008941650390625, -0.466461181640625, -0.44283294677734375, -0.4192047119140625, -0.39557647705078125, -0.3719482421875, -0.34832000732421875, -0.3246917724609375, -0.30106353759765625, -0.277435302734375, -0.25380706787109375, -0.2301788330078125, -0.20655059814453125, -0.18292236328125, -0.15929412841796875, -0.1356658935546875, -0.11203765869140625, -0.088409423828125, -0.06478118896484375, -0.0411529541015625, -0.01752471923828125, 0.006103515625, 0.02973175048828125, 0.0533599853515625, 0.07698822021484375, 0.100616455078125, 0.12424468994140625, 0.1478729248046875, 0.17150115966796875, 0.19512939453125, 0.21875762939453125, 0.2423858642578125, 0.26601409912109375, 0.289642333984375, 0.31327056884765625, 0.3368988037109375, 0.36052703857421875, 0.3841552734375, 0.40778350830078125, 0.4314117431640625, 0.45503997802734375, 0.478668212890625, 0.5022964477539062, 0.5259246826171875, 0.5495529174804688, 0.57318115234375, 0.5968093872070312, 0.6204376220703125, 0.6440658569335938, 0.667694091796875, 0.6913223266601562, 0.7149505615234375, 0.7385787963867188, 0.76220703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 12.0, 21.0, 21.0, 42.0, 56.0, 92.0, 129.0, 188.0, 255.0, 403.0, 588.0, 937.0, 1380.0, 2200.0, 3424.0, 5399.0, 8973.0, 15350.0, 27956.0, 55244.0, 124366.0, 299346.0, 275702.0, 112154.0, 51022.0, 26213.0, 14349.0, 8458.0, 5058.0, 3141.0, 2111.0, 1347.0, 898.0, 614.0, 343.0, 248.0, 175.0, 105.0, 84.0, 50.0, 37.0, 20.0, 11.0, 7.0, 12.0, 6.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1513671875, -0.1459503173828125, -0.140533447265625, -0.1351165771484375, -0.12969970703125, -0.1242828369140625, -0.118865966796875, -0.1134490966796875, -0.1080322265625, -0.1026153564453125, -0.097198486328125, -0.0917816162109375, -0.08636474609375, -0.0809478759765625, -0.075531005859375, -0.0701141357421875, -0.064697265625, -0.0592803955078125, -0.053863525390625, -0.0484466552734375, -0.04302978515625, -0.0376129150390625, -0.032196044921875, -0.0267791748046875, -0.0213623046875, -0.0159454345703125, -0.010528564453125, -0.0051116943359375, 0.00030517578125, 0.0057220458984375, 0.011138916015625, 0.0165557861328125, 0.02197265625, 0.0273895263671875, 0.032806396484375, 0.0382232666015625, 0.04364013671875, 0.0490570068359375, 0.054473876953125, 0.0598907470703125, 0.0653076171875, 0.0707244873046875, 0.076141357421875, 0.0815582275390625, 0.08697509765625, 0.0923919677734375, 0.097808837890625, 0.1032257080078125, 0.108642578125, 0.1140594482421875, 0.119476318359375, 0.1248931884765625, 0.13031005859375, 0.1357269287109375, 0.141143798828125, 0.1465606689453125, 0.1519775390625, 0.1573944091796875, 0.162811279296875, 0.1682281494140625, 0.17364501953125, 0.1790618896484375, 0.184478759765625, 0.1898956298828125, 0.1953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 4.0, 7.0, 14.0, 16.0, 24.0, 28.0, 38.0, 50.0, 72.0, 135.0, 161.0, 121.0, 88.0, 53.0, 40.0, 23.0, 26.0, 16.0, 15.0, 11.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.022785186767578e-05, -7.783900946378708e-05, -7.545016705989838e-05, -7.306132465600967e-05, -7.067248225212097e-05, -6.828363984823227e-05, -6.589479744434357e-05, -6.350595504045486e-05, -6.111711263656616e-05, -5.872827023267746e-05, -5.633942782878876e-05, -5.3950585424900055e-05, -5.156174302101135e-05, -4.917290061712265e-05, -4.678405821323395e-05, -4.4395215809345245e-05, -4.200637340545654e-05, -3.961753100156784e-05, -3.722868859767914e-05, -3.4839846193790436e-05, -3.2451003789901733e-05, -3.006216138601303e-05, -2.767331898212433e-05, -2.5284476578235626e-05, -2.2895634174346924e-05, -2.050679177045822e-05, -1.811794936656952e-05, -1.5729106962680817e-05, -1.3340264558792114e-05, -1.0951422154903412e-05, -8.56257975101471e-06, -6.173737347126007e-06, -3.7848949432373047e-06, -1.3960525393486023e-06, 9.927898645401e-07, 3.3816322684288025e-06, 5.770474672317505e-06, 8.159317076206207e-06, 1.054815948009491e-05, 1.2937001883983612e-05, 1.5325844287872314e-05, 1.7714686691761017e-05, 2.010352909564972e-05, 2.249237149953842e-05, 2.4881213903427124e-05, 2.7270056307315826e-05, 2.965889871120453e-05, 3.204774111509323e-05, 3.4436583518981934e-05, 3.6825425922870636e-05, 3.921426832675934e-05, 4.160311073064804e-05, 4.399195313453674e-05, 4.6380795538425446e-05, 4.876963794231415e-05, 5.115848034620285e-05, 5.354732275009155e-05, 5.5936165153980255e-05, 5.832500755786896e-05, 6.071384996175766e-05, 6.310269236564636e-05, 6.549153476953506e-05, 6.788037717342377e-05, 7.026921957731247e-05, 7.265806198120117e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 13.0, 9.0, 11.0, 34.0, 34.0, 57.0, 92.0, 139.0, 207.0, 337.0, 529.0, 949.0, 1511.0, 2569.0, 4637.0, 8431.0, 16506.0, 34166.0, 74069.0, 166784.0, 312321.0, 229342.0, 102582.0, 46522.0, 22004.0, 10924.0, 5726.0, 3317.0, 1820.0, 1101.0, 663.0, 416.0, 247.0, 158.0, 98.0, 79.0, 37.0, 36.0, 22.0, 17.0, 11.0, 8.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.17626953125, -0.17087936401367188, -0.16548919677734375, -0.16009902954101562, -0.1547088623046875, -0.14931869506835938, -0.14392852783203125, -0.13853836059570312, -0.133148193359375, -0.12775802612304688, -0.12236785888671875, -0.11697769165039062, -0.1115875244140625, -0.10619735717773438, -0.10080718994140625, -0.09541702270507812, -0.09002685546875, -0.08463668823242188, -0.07924652099609375, -0.07385635375976562, -0.0684661865234375, -0.06307601928710938, -0.05768585205078125, -0.052295684814453125, -0.046905517578125, -0.041515350341796875, -0.03612518310546875, -0.030735015869140625, -0.0253448486328125, -0.019954681396484375, -0.01456451416015625, -0.009174346923828125, -0.0037841796875, 0.001605987548828125, 0.00699615478515625, 0.012386322021484375, 0.0177764892578125, 0.023166656494140625, 0.02855682373046875, 0.033946990966796875, 0.039337158203125, 0.044727325439453125, 0.05011749267578125, 0.055507659912109375, 0.0608978271484375, 0.06628799438476562, 0.07167816162109375, 0.07706832885742188, 0.08245849609375, 0.08784866333007812, 0.09323883056640625, 0.09862899780273438, 0.1040191650390625, 0.10940933227539062, 0.11479949951171875, 0.12018966674804688, 0.125579833984375, 0.13097000122070312, 0.13636016845703125, 0.14175033569335938, 0.1471405029296875, 0.15253067016601562, 0.15792083740234375, 0.16331100463867188, 0.168701171875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 4.0, 6.0, 9.0, 14.0, 14.0, 23.0, 33.0, 29.0, 35.0, 44.0, 48.0, 73.0, 80.0, 64.0, 91.0, 82.0, 61.0, 47.0, 49.0, 34.0, 28.0, 23.0, 19.0, 18.0, 11.0, 13.0, 6.0, 6.0, 1.0, 3.0, 5.0, 8.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.200927734375, -0.1944255828857422, -0.18792343139648438, -0.18142127990722656, -0.17491912841796875, -0.16841697692871094, -0.16191482543945312, -0.1554126739501953, -0.1489105224609375, -0.1424083709716797, -0.13590621948242188, -0.12940406799316406, -0.12290191650390625, -0.11639976501464844, -0.10989761352539062, -0.10339546203613281, -0.096893310546875, -0.09039115905761719, -0.08388900756835938, -0.07738685607910156, -0.07088470458984375, -0.06438255310058594, -0.057880401611328125, -0.05137825012207031, -0.0448760986328125, -0.03837394714355469, -0.031871795654296875, -0.025369644165039062, -0.01886749267578125, -0.012365341186523438, -0.005863189697265625, 0.0006389617919921875, 0.00714111328125, 0.013643264770507812, 0.020145416259765625, 0.026647567749023438, 0.03314971923828125, 0.03965187072753906, 0.046154022216796875, 0.05265617370605469, 0.0591583251953125, 0.06566047668457031, 0.07216262817382812, 0.07866477966308594, 0.08516693115234375, 0.09166908264160156, 0.09817123413085938, 0.10467338562011719, 0.111175537109375, 0.11767768859863281, 0.12417984008789062, 0.13068199157714844, 0.13718414306640625, 0.14368629455566406, 0.15018844604492188, 0.1566905975341797, 0.1631927490234375, 0.1696949005126953, 0.17619705200195312, 0.18269920349121094, 0.18920135498046875, 0.19570350646972656, 0.20220565795898438, 0.2087078094482422, 0.2152099609375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 9.0, 6.0, 12.0, 27.0, 45.0, 64.0, 98.0, 125.0, 132.0, 129.0, 108.0, 74.0, 57.0, 44.0, 27.0, 12.0, 6.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.774855613708496, -2.675018310546875, -2.575181007385254, -2.475343704223633, -2.3755064010620117, -2.2756690979003906, -2.1758317947387695, -2.0759944915771484, -1.9761570692062378, -1.8763197660446167, -1.7764824628829956, -1.676645040512085, -1.5768077373504639, -1.4769704341888428, -1.3771331310272217, -1.2772958278656006, -1.1774585247039795, -1.0776212215423584, -0.9777839183807373, -0.8779465556144714, -0.7781092524528503, -0.6782719492912292, -0.5784345865249634, -0.4785972833633423, -0.3787599802017212, -0.2789226770401001, -0.17908534407615662, -0.07924801111221313, 0.02058929204940796, 0.12042659521102905, 0.22026395797729492, 0.320101261138916, 0.4199388027191162, 0.5197761058807373, 0.6196134090423584, 0.7194507718086243, 0.8192880749702454, 0.9191253781318665, 1.0189627408981323, 1.1188000440597534, 1.2186373472213745, 1.3184746503829956, 1.4183119535446167, 1.5181493759155273, 1.6179866790771484, 1.7178239822387695, 1.8176612854003906, 1.9174985885620117, 2.017335891723633, 2.117173194885254, 2.217010498046875, 2.316847801208496, 2.416685104370117, 2.5165224075317383, 2.6163597106933594, 2.7161970138549805, 2.8160343170166016, 2.9158716201782227, 3.0157089233398438, 3.115546226501465, 3.215383529663086, 3.315220832824707, 3.415058135986328, 3.514895439147949, 3.6147329807281494]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 5.0, 3.0, 5.0, 4.0, 7.0, 10.0, 12.0, 21.0, 18.0, 16.0, 23.0, 24.0, 36.0, 35.0, 26.0, 27.0, 28.0, 39.0, 37.0, 50.0, 45.0, 43.0, 43.0, 38.0, 34.0, 34.0, 34.0, 31.0, 30.0, 30.0, 28.0, 22.0, 23.0, 25.0, 16.0, 10.0, 17.0, 10.0, 13.0, 10.0, 8.0, 9.0, 5.0, 6.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5864137411117554, -1.5318446159362793, -1.4772756099700928, -1.4227064847946167, -1.3681373596191406, -1.313568353652954, -1.258999228477478, -1.204430103302002, -1.1498610973358154, -1.0952919721603394, -1.0407229661941528, -0.9861538410186768, -0.9315847754478455, -0.8770157098770142, -0.8224465847015381, -0.7678775191307068, -0.7133084535598755, -0.6587393879890442, -0.6041703224182129, -0.5496011972427368, -0.4950321316719055, -0.4404630661010742, -0.38589397072792053, -0.33132487535476685, -0.27675580978393555, -0.22218672931194305, -0.16761764883995056, -0.11304856836795807, -0.058479487895965576, -0.003910422325134277, 0.05065867304801941, 0.1052277684211731, 0.1597968339920044, 0.2143659144639969, 0.2689349949359894, 0.32350409030914307, 0.37807315587997437, 0.43264222145080566, 0.48721131682395935, 0.541780412197113, 0.5963494777679443, 0.6509185433387756, 0.7054876089096069, 0.760056734085083, 0.8146257996559143, 0.8691948652267456, 0.9237639904022217, 0.978333055973053, 1.0329021215438843, 1.0874712467193604, 1.1420402526855469, 1.196609377861023, 1.251178503036499, 1.3057475090026855, 1.3603166341781616, 1.4148857593536377, 1.4694547653198242, 1.5240238904953003, 1.5785928964614868, 1.633162021636963, 1.6877310276031494, 1.7423001527786255, 1.7968692779541016, 1.851438283920288, 1.9060074090957642]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 6.0, 8.0, 18.0, 15.0, 33.0, 20.0, 44.0, 66.0, 80.0, 79.0, 122.0, 171.0, 208.0, 333.0, 444.0, 740.0, 1287.0, 2007.0, 3771.0, 7148.0, 15882.0, 40382.0, 126260.0, 459388.0, 1507619.0, 1411146.0, 430578.0, 120045.0, 37909.0, 14326.0, 6274.0, 3131.0, 1657.0, 971.0, 702.0, 421.0, 277.0, 167.0, 152.0, 110.0, 65.0, 67.0, 23.0, 25.0, 24.0, 25.0, 12.0, 15.0, 8.0, 4.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.2958984375, -0.2863426208496094, -0.27678680419921875, -0.2672309875488281, -0.2576751708984375, -0.24811935424804688, -0.23856353759765625, -0.22900772094726562, -0.219451904296875, -0.20989608764648438, -0.20034027099609375, -0.19078445434570312, -0.1812286376953125, -0.17167282104492188, -0.16211700439453125, -0.15256118774414062, -0.14300537109375, -0.13344955444335938, -0.12389373779296875, -0.11433792114257812, -0.1047821044921875, -0.09522628784179688, -0.08567047119140625, -0.07611465454101562, -0.066558837890625, -0.057003021240234375, -0.04744720458984375, -0.037891387939453125, -0.0283355712890625, -0.018779754638671875, -0.00922393798828125, 0.000331878662109375, 0.0098876953125, 0.019443511962890625, 0.02899932861328125, 0.038555145263671875, 0.0481109619140625, 0.057666778564453125, 0.06722259521484375, 0.07677841186523438, 0.086334228515625, 0.09589004516601562, 0.10544586181640625, 0.11500167846679688, 0.1245574951171875, 0.13411331176757812, 0.14366912841796875, 0.15322494506835938, 0.16278076171875, 0.17233657836914062, 0.18189239501953125, 0.19144821166992188, 0.2010040283203125, 0.21055984497070312, 0.22011566162109375, 0.22967147827148438, 0.239227294921875, 0.24878311157226562, 0.25833892822265625, 0.2678947448730469, 0.2774505615234375, 0.2870063781738281, 0.29656219482421875, 0.3061180114746094, 0.315673828125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 4.0, 5.0, 4.0, 17.0, 15.0, 22.0, 21.0, 17.0, 20.0, 22.0, 25.0, 27.0, 30.0, 36.0, 40.0, 41.0, 44.0, 53.0, 42.0, 47.0, 38.0, 51.0, 40.0, 28.0, 37.0, 37.0, 36.0, 28.0, 37.0, 22.0, 15.0, 22.0, 12.0, 12.0, 14.0, 5.0, 7.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19873046875, -0.19141387939453125, -0.1840972900390625, -0.17678070068359375, -0.169464111328125, -0.16214752197265625, -0.1548309326171875, -0.14751434326171875, -0.14019775390625, -0.13288116455078125, -0.1255645751953125, -0.11824798583984375, -0.110931396484375, -0.10361480712890625, -0.0962982177734375, -0.08898162841796875, -0.0816650390625, -0.07434844970703125, -0.0670318603515625, -0.05971527099609375, -0.052398681640625, -0.04508209228515625, -0.0377655029296875, -0.03044891357421875, -0.02313232421875, -0.01581573486328125, -0.0084991455078125, -0.00118255615234375, 0.006134033203125, 0.01345062255859375, 0.0207672119140625, 0.02808380126953125, 0.035400390625, 0.04271697998046875, 0.0500335693359375, 0.05735015869140625, 0.064666748046875, 0.07198333740234375, 0.0792999267578125, 0.08661651611328125, 0.09393310546875, 0.10124969482421875, 0.1085662841796875, 0.11588287353515625, 0.123199462890625, 0.13051605224609375, 0.1378326416015625, 0.14514923095703125, 0.1524658203125, 0.15978240966796875, 0.1670989990234375, 0.17441558837890625, 0.181732177734375, 0.18904876708984375, 0.1963653564453125, 0.20368194580078125, 0.21099853515625, 0.21831512451171875, 0.2256317138671875, 0.23294830322265625, 0.240264892578125, 0.24758148193359375, 0.2548980712890625, 0.26221466064453125, 0.26953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 7.0, 8.0, 7.0, 29.0, 39.0, 40.0, 55.0, 77.0, 107.0, 199.0, 242.0, 360.0, 576.0, 943.0, 1444.0, 2361.0, 4266.0, 8146.0, 17933.0, 47143.0, 164703.0, 927631.0, 2410399.0, 448169.0, 98936.0, 31994.0, 13123.0, 6418.0, 3439.0, 2002.0, 1227.0, 726.0, 512.0, 311.0, 232.0, 138.0, 91.0, 71.0, 48.0, 37.0, 26.0, 23.0, 16.0, 14.0, 10.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.59619140625, -0.57977294921875, -0.5633544921875, -0.54693603515625, -0.530517578125, -0.51409912109375, -0.4976806640625, -0.48126220703125, -0.46484375, -0.44842529296875, -0.4320068359375, -0.41558837890625, -0.399169921875, -0.38275146484375, -0.3663330078125, -0.34991455078125, -0.33349609375, -0.31707763671875, -0.3006591796875, -0.28424072265625, -0.267822265625, -0.25140380859375, -0.2349853515625, -0.21856689453125, -0.2021484375, -0.18572998046875, -0.1693115234375, -0.15289306640625, -0.136474609375, -0.12005615234375, -0.1036376953125, -0.08721923828125, -0.07080078125, -0.05438232421875, -0.0379638671875, -0.02154541015625, -0.005126953125, 0.01129150390625, 0.0277099609375, 0.04412841796875, 0.060546875, 0.07696533203125, 0.0933837890625, 0.10980224609375, 0.126220703125, 0.14263916015625, 0.1590576171875, 0.17547607421875, 0.19189453125, 0.20831298828125, 0.2247314453125, 0.24114990234375, 0.257568359375, 0.27398681640625, 0.2904052734375, 0.30682373046875, 0.3232421875, 0.33966064453125, 0.3560791015625, 0.37249755859375, 0.388916015625, 0.40533447265625, 0.4217529296875, 0.43817138671875, 0.45458984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 1.0, 6.0, 9.0, 15.0, 17.0, 25.0, 27.0, 47.0, 73.0, 120.0, 200.0, 307.0, 557.0, 837.0, 678.0, 427.0, 261.0, 136.0, 92.0, 61.0, 49.0, 34.0, 25.0, 17.0, 10.0, 5.0, 10.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.693359375, -0.6728363037109375, -0.652313232421875, -0.6317901611328125, -0.61126708984375, -0.5907440185546875, -0.570220947265625, -0.5496978759765625, -0.5291748046875, -0.5086517333984375, -0.488128662109375, -0.4676055908203125, -0.44708251953125, -0.4265594482421875, -0.406036376953125, -0.3855133056640625, -0.364990234375, -0.3444671630859375, -0.323944091796875, -0.3034210205078125, -0.28289794921875, -0.2623748779296875, -0.241851806640625, -0.2213287353515625, -0.2008056640625, -0.1802825927734375, -0.159759521484375, -0.1392364501953125, -0.11871337890625, -0.0981903076171875, -0.077667236328125, -0.0571441650390625, -0.03662109375, -0.0160980224609375, 0.004425048828125, 0.0249481201171875, 0.04547119140625, 0.0659942626953125, 0.086517333984375, 0.1070404052734375, 0.1275634765625, 0.1480865478515625, 0.168609619140625, 0.1891326904296875, 0.20965576171875, 0.2301788330078125, 0.250701904296875, 0.2712249755859375, 0.291748046875, 0.3122711181640625, 0.332794189453125, 0.3533172607421875, 0.37384033203125, 0.3943634033203125, 0.414886474609375, 0.4354095458984375, 0.4559326171875, 0.4764556884765625, 0.496978759765625, 0.5175018310546875, 0.53802490234375, 0.5585479736328125, 0.579071044921875, 0.5995941162109375, 0.6201171875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 8.0, 3.0, 5.0, 4.0, 5.0, 20.0, 41.0, 66.0, 78.0, 112.0, 133.0, 164.0, 110.0, 104.0, 62.0, 38.0, 22.0, 9.0, 8.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.158179998397827, -2.038081407546997, -1.9179826974868774, -1.7978839874267578, -1.6777853965759277, -1.5576868057250977, -1.437588095664978, -1.3174893856048584, -1.1973907947540283, -1.0772922039031982, -0.9571934938430786, -0.8370948433876038, -0.7169961929321289, -0.596897542476654, -0.4767988920211792, -0.35670024156570435, -0.2366015911102295, -0.11650294065475464, 0.003595709800720215, 0.12369436025619507, 0.24379301071166992, 0.3638916611671448, 0.48399031162261963, 0.6040889620780945, 0.7241876125335693, 0.8442862629890442, 0.964384913444519, 1.0844836235046387, 1.2045822143554688, 1.3246808052062988, 1.4447795152664185, 1.564878225326538, 1.6849770545959473, 1.8050756454467773, 1.925174355506897, 2.0452730655670166, 2.1653716564178467, 2.2854702472686768, 2.405569076538086, 2.525667667388916, 2.645766258239746, 2.765864849090576, 2.8859634399414062, 3.0060622692108154, 3.1261608600616455, 3.2462594509124756, 3.3663582801818848, 3.486456871032715, 3.606555461883545, 3.726654052734375, 3.846752643585205, 3.9668514728546143, 4.086950302124023, 4.2070488929748535, 4.327147483825684, 4.447246074676514, 4.567344665527344, 4.687443256378174, 4.807541847229004, 4.927640438079834, 5.047739028930664, 5.167838096618652, 5.287936687469482, 5.4080352783203125, 5.528133869171143]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 7.0, 7.0, 13.0, 11.0, 15.0, 12.0, 22.0, 26.0, 23.0, 28.0, 20.0, 35.0, 31.0, 34.0, 46.0, 45.0, 35.0, 38.0, 52.0, 44.0, 48.0, 38.0, 34.0, 34.0, 45.0, 30.0, 24.0, 26.0, 19.0, 25.0, 25.0, 18.0, 16.0, 17.0, 11.0, 6.0, 8.0, 2.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.6161739826202393, -1.5630261898040771, -1.5098782777786255, -1.4567304849624634, -1.4035825729370117, -1.3504347801208496, -1.2972869873046875, -1.2441390752792358, -1.1909911632537842, -1.137843370437622, -1.0846954584121704, -1.0315476655960083, -0.9783997535705566, -0.9252519607543945, -0.8721041083335876, -0.8189562559127808, -0.7658084630966187, -0.7126606106758118, -0.6595127582550049, -0.6063649654388428, -0.5532170534133911, -0.500069260597229, -0.4469214081764221, -0.39377355575561523, -0.34062570333480835, -0.28747785091400146, -0.23433001339435577, -0.18118217587471008, -0.1280343234539032, -0.07488647103309631, -0.021738648414611816, 0.03140920400619507, 0.0845571756362915, 0.1377050280570984, 0.19085286557674408, 0.24400070309638977, 0.29714855551719666, 0.35029640793800354, 0.40344423055648804, 0.4565920829772949, 0.5097399353981018, 0.5628877878189087, 0.6160356402397156, 0.6691834926605225, 0.7223312854766846, 0.7754791975021362, 0.8286269903182983, 0.8817748427391052, 0.9349226951599121, 0.988070547580719, 1.0412184000015259, 1.094366192817688, 1.1475141048431396, 1.2006618976593018, 1.2538096904754639, 1.3069576025009155, 1.3601055145263672, 1.4132533073425293, 1.466401219367981, 1.519549012184143, 1.5726969242095947, 1.6258447170257568, 1.678992509841919, 1.7321404218673706, 1.7852882146835327]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 13.0, 12.0, 10.0, 30.0, 33.0, 44.0, 71.0, 84.0, 104.0, 174.0, 254.0, 395.0, 646.0, 953.0, 1629.0, 2746.0, 4774.0, 8607.0, 16776.0, 36053.0, 93584.0, 242293.0, 337289.0, 179134.0, 65346.0, 27238.0, 13244.0, 6948.0, 3793.0, 2357.0, 1420.0, 841.0, 544.0, 386.0, 202.0, 171.0, 112.0, 61.0, 45.0, 41.0, 33.0, 18.0, 16.0, 11.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.456298828125, -0.4407386779785156, -0.42517852783203125, -0.4096183776855469, -0.3940582275390625, -0.3784980773925781, -0.36293792724609375, -0.3473777770996094, -0.331817626953125, -0.3162574768066406, -0.30069732666015625, -0.2851371765136719, -0.2695770263671875, -0.2540168762207031, -0.23845672607421875, -0.22289657592773438, -0.20733642578125, -0.19177627563476562, -0.17621612548828125, -0.16065597534179688, -0.1450958251953125, -0.12953567504882812, -0.11397552490234375, -0.09841537475585938, -0.082855224609375, -0.06729507446289062, -0.05173492431640625, -0.036174774169921875, -0.0206146240234375, -0.005054473876953125, 0.01050567626953125, 0.026065826416015625, 0.0416259765625, 0.057186126708984375, 0.07274627685546875, 0.08830642700195312, 0.1038665771484375, 0.11942672729492188, 0.13498687744140625, 0.15054702758789062, 0.166107177734375, 0.18166732788085938, 0.19722747802734375, 0.21278762817382812, 0.2283477783203125, 0.24390792846679688, 0.25946807861328125, 0.2750282287597656, 0.29058837890625, 0.3061485290527344, 0.32170867919921875, 0.3372688293457031, 0.3528289794921875, 0.3683891296386719, 0.38394927978515625, 0.3995094299316406, 0.415069580078125, 0.4306297302246094, 0.44618988037109375, 0.4617500305175781, 0.4773101806640625, 0.4928703308105469, 0.5084304809570312, 0.5239906311035156, 0.53955078125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 3.0, 5.0, 3.0, 9.0, 11.0, 18.0, 14.0, 14.0, 22.0, 28.0, 26.0, 42.0, 39.0, 41.0, 34.0, 38.0, 46.0, 46.0, 66.0, 52.0, 56.0, 62.0, 33.0, 44.0, 35.0, 23.0, 32.0, 28.0, 21.0, 20.0, 19.0, 19.0, 9.0, 9.0, 8.0, 9.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255615234375, -0.24728775024414062, -0.23896026611328125, -0.23063278198242188, -0.2223052978515625, -0.21397781372070312, -0.20565032958984375, -0.19732284545898438, -0.188995361328125, -0.18066787719726562, -0.17234039306640625, -0.16401290893554688, -0.1556854248046875, -0.14735794067382812, -0.13903045654296875, -0.13070297241210938, -0.12237548828125, -0.11404800415039062, -0.10572052001953125, -0.09739303588867188, -0.0890655517578125, -0.08073806762695312, -0.07241058349609375, -0.06408309936523438, -0.055755615234375, -0.047428131103515625, -0.03910064697265625, -0.030773162841796875, -0.0224456787109375, -0.014118194580078125, -0.00579071044921875, 0.002536773681640625, 0.0108642578125, 0.019191741943359375, 0.02751922607421875, 0.035846710205078125, 0.0441741943359375, 0.052501678466796875, 0.06082916259765625, 0.06915664672851562, 0.077484130859375, 0.08581161499023438, 0.09413909912109375, 0.10246658325195312, 0.1107940673828125, 0.11912155151367188, 0.12744903564453125, 0.13577651977539062, 0.14410400390625, 0.15243148803710938, 0.16075897216796875, 0.16908645629882812, 0.1774139404296875, 0.18574142456054688, 0.19406890869140625, 0.20239639282226562, 0.210723876953125, 0.21905136108398438, 0.22737884521484375, 0.23570632934570312, 0.2440338134765625, 0.2523612976074219, 0.26068878173828125, 0.2690162658691406, 0.27734375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 2.0, 6.0, 13.0, 16.0, 23.0, 35.0, 47.0, 78.0, 139.0, 213.0, 390.0, 671.0, 1298.0, 2573.0, 5465.0, 12954.0, 34033.0, 105465.0, 334983.0, 364135.0, 121646.0, 38142.0, 14257.0, 6022.0, 2817.0, 1394.0, 674.0, 403.0, 262.0, 143.0, 97.0, 50.0, 38.0, 24.0, 19.0, 8.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4755859375, -0.45660400390625, -0.4376220703125, -0.41864013671875, -0.399658203125, -0.38067626953125, -0.3616943359375, -0.34271240234375, -0.32373046875, -0.30474853515625, -0.2857666015625, -0.26678466796875, -0.247802734375, -0.22882080078125, -0.2098388671875, -0.19085693359375, -0.171875, -0.15289306640625, -0.1339111328125, -0.11492919921875, -0.095947265625, -0.07696533203125, -0.0579833984375, -0.03900146484375, -0.02001953125, -0.00103759765625, 0.0179443359375, 0.03692626953125, 0.055908203125, 0.07489013671875, 0.0938720703125, 0.11285400390625, 0.1318359375, 0.15081787109375, 0.1697998046875, 0.18878173828125, 0.207763671875, 0.22674560546875, 0.2457275390625, 0.26470947265625, 0.28369140625, 0.30267333984375, 0.3216552734375, 0.34063720703125, 0.359619140625, 0.37860107421875, 0.3975830078125, 0.41656494140625, 0.435546875, 0.45452880859375, 0.4735107421875, 0.49249267578125, 0.511474609375, 0.53045654296875, 0.5494384765625, 0.56842041015625, 0.58740234375, 0.60638427734375, 0.6253662109375, 0.64434814453125, 0.663330078125, 0.68231201171875, 0.7012939453125, 0.72027587890625, 0.7392578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 5.0, 5.0, 8.0, 9.0, 10.0, 17.0, 17.0, 18.0, 19.0, 30.0, 19.0, 37.0, 28.0, 24.0, 29.0, 37.0, 31.0, 36.0, 34.0, 34.0, 34.0, 44.0, 48.0, 27.0, 33.0, 44.0, 35.0, 36.0, 32.0, 27.0, 31.0, 17.0, 19.0, 22.0, 16.0, 14.0, 11.0, 6.0, 8.0, 5.0, 9.0, 9.0, 7.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.71923828125, -0.6988601684570312, -0.6784820556640625, -0.6581039428710938, -0.637725830078125, -0.6173477172851562, -0.5969696044921875, -0.5765914916992188, -0.55621337890625, -0.5358352661132812, -0.5154571533203125, -0.49507904052734375, -0.474700927734375, -0.45432281494140625, -0.4339447021484375, -0.41356658935546875, -0.3931884765625, -0.37281036376953125, -0.3524322509765625, -0.33205413818359375, -0.311676025390625, -0.29129791259765625, -0.2709197998046875, -0.25054168701171875, -0.23016357421875, -0.20978546142578125, -0.1894073486328125, -0.16902923583984375, -0.148651123046875, -0.12827301025390625, -0.1078948974609375, -0.08751678466796875, -0.067138671875, -0.04676055908203125, -0.0263824462890625, -0.00600433349609375, 0.014373779296875, 0.03475189208984375, 0.0551300048828125, 0.07550811767578125, 0.09588623046875, 0.11626434326171875, 0.1366424560546875, 0.15702056884765625, 0.177398681640625, 0.19777679443359375, 0.2181549072265625, 0.23853302001953125, 0.2589111328125, 0.27928924560546875, 0.2996673583984375, 0.32004547119140625, 0.340423583984375, 0.36080169677734375, 0.3811798095703125, 0.40155792236328125, 0.42193603515625, 0.44231414794921875, 0.4626922607421875, 0.48307037353515625, 0.503448486328125, 0.5238265991210938, 0.5442047119140625, 0.5645828247070312, 0.5849609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 6.0, 12.0, 13.0, 18.0, 38.0, 47.0, 71.0, 104.0, 120.0, 212.0, 337.0, 518.0, 796.0, 1232.0, 2013.0, 3430.0, 6113.0, 11515.0, 23684.0, 53499.0, 137723.0, 328869.0, 282681.0, 108740.0, 43344.0, 20192.0, 9965.0, 5304.0, 2997.0, 1782.0, 1091.0, 705.0, 487.0, 301.0, 182.0, 117.0, 114.0, 46.0, 47.0, 30.0, 15.0, 13.0, 5.0, 13.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.230712890625, -0.222991943359375, -0.21527099609375, -0.207550048828125, -0.1998291015625, -0.192108154296875, -0.18438720703125, -0.176666259765625, -0.1689453125, -0.161224365234375, -0.15350341796875, -0.145782470703125, -0.1380615234375, -0.130340576171875, -0.12261962890625, -0.114898681640625, -0.107177734375, -0.099456787109375, -0.09173583984375, -0.084014892578125, -0.0762939453125, -0.068572998046875, -0.06085205078125, -0.053131103515625, -0.04541015625, -0.037689208984375, -0.02996826171875, -0.022247314453125, -0.0145263671875, -0.006805419921875, 0.00091552734375, 0.008636474609375, 0.016357421875, 0.024078369140625, 0.03179931640625, 0.039520263671875, 0.0472412109375, 0.054962158203125, 0.06268310546875, 0.070404052734375, 0.078125, 0.085845947265625, 0.09356689453125, 0.101287841796875, 0.1090087890625, 0.116729736328125, 0.12445068359375, 0.132171630859375, 0.139892578125, 0.147613525390625, 0.15533447265625, 0.163055419921875, 0.1707763671875, 0.178497314453125, 0.18621826171875, 0.193939208984375, 0.20166015625, 0.209381103515625, 0.21710205078125, 0.224822998046875, 0.2325439453125, 0.240264892578125, 0.24798583984375, 0.255706787109375, 0.263427734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 13.0, 11.0, 10.0, 20.0, 24.0, 39.0, 64.0, 90.0, 121.0, 127.0, 124.0, 93.0, 57.0, 46.0, 33.0, 28.0, 15.0, 15.0, 10.0, 10.0, 6.0, 3.0, 3.0, 5.0, 3.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.22083854675293e-05, -8.912384510040283e-05, -8.603930473327637e-05, -8.29547643661499e-05, -7.987022399902344e-05, -7.678568363189697e-05, -7.370114326477051e-05, -7.061660289764404e-05, -6.753206253051758e-05, -6.444752216339111e-05, -6.136298179626465e-05, -5.8278441429138184e-05, -5.519390106201172e-05, -5.2109360694885254e-05, -4.902482032775879e-05, -4.5940279960632324e-05, -4.285573959350586e-05, -3.9771199226379395e-05, -3.668665885925293e-05, -3.3602118492126465e-05, -3.0517578125e-05, -2.7433037757873535e-05, -2.434849739074707e-05, -2.1263957023620605e-05, -1.817941665649414e-05, -1.5094876289367676e-05, -1.2010335922241211e-05, -8.925795555114746e-06, -5.841255187988281e-06, -2.7567148208618164e-06, 3.2782554626464844e-07, 3.4123659133911133e-06, 6.496906280517578e-06, 9.581446647644043e-06, 1.2665987014770508e-05, 1.5750527381896973e-05, 1.8835067749023438e-05, 2.1919608116149902e-05, 2.5004148483276367e-05, 2.8088688850402832e-05, 3.11732292175293e-05, 3.425776958465576e-05, 3.7342309951782227e-05, 4.042685031890869e-05, 4.3511390686035156e-05, 4.659593105316162e-05, 4.9680471420288086e-05, 5.276501178741455e-05, 5.5849552154541016e-05, 5.893409252166748e-05, 6.201863288879395e-05, 6.510317325592041e-05, 6.818771362304688e-05, 7.127225399017334e-05, 7.43567943572998e-05, 7.744133472442627e-05, 8.052587509155273e-05, 8.36104154586792e-05, 8.669495582580566e-05, 8.977949619293213e-05, 9.28640365600586e-05, 9.594857692718506e-05, 9.903311729431152e-05, 0.00010211765766143799, 0.00010520219802856445]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 7.0, 11.0, 21.0, 13.0, 22.0, 46.0, 57.0, 110.0, 123.0, 180.0, 257.0, 357.0, 553.0, 870.0, 1344.0, 2197.0, 3704.0, 6297.0, 11322.0, 22210.0, 45974.0, 99983.0, 209946.0, 284832.0, 186743.0, 86168.0, 40461.0, 19641.0, 10435.0, 5692.0, 3323.0, 1986.0, 1232.0, 773.0, 544.0, 353.0, 225.0, 159.0, 96.0, 72.0, 49.0, 42.0, 38.0, 32.0, 14.0, 12.0, 9.0, 8.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2027587890625, -0.196502685546875, -0.19024658203125, -0.183990478515625, -0.177734375, -0.171478271484375, -0.16522216796875, -0.158966064453125, -0.1527099609375, -0.146453857421875, -0.14019775390625, -0.133941650390625, -0.127685546875, -0.121429443359375, -0.11517333984375, -0.108917236328125, -0.1026611328125, -0.096405029296875, -0.09014892578125, -0.083892822265625, -0.07763671875, -0.071380615234375, -0.06512451171875, -0.058868408203125, -0.0526123046875, -0.046356201171875, -0.04010009765625, -0.033843994140625, -0.027587890625, -0.021331787109375, -0.01507568359375, -0.008819580078125, -0.0025634765625, 0.003692626953125, 0.00994873046875, 0.016204833984375, 0.0224609375, 0.028717041015625, 0.03497314453125, 0.041229248046875, 0.0474853515625, 0.053741455078125, 0.05999755859375, 0.066253662109375, 0.072509765625, 0.078765869140625, 0.08502197265625, 0.091278076171875, 0.0975341796875, 0.103790283203125, 0.11004638671875, 0.116302490234375, 0.12255859375, 0.128814697265625, 0.13507080078125, 0.141326904296875, 0.1475830078125, 0.153839111328125, 0.16009521484375, 0.166351318359375, 0.172607421875, 0.178863525390625, 0.18511962890625, 0.191375732421875, 0.1976318359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 6.0, 5.0, 8.0, 16.0, 14.0, 18.0, 26.0, 23.0, 31.0, 33.0, 39.0, 49.0, 57.0, 63.0, 68.0, 63.0, 82.0, 51.0, 46.0, 55.0, 35.0, 28.0, 37.0, 22.0, 19.0, 18.0, 14.0, 9.0, 13.0, 7.0, 6.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2423095703125, -0.23499488830566406, -0.22768020629882812, -0.2203655242919922, -0.21305084228515625, -0.2057361602783203, -0.19842147827148438, -0.19110679626464844, -0.1837921142578125, -0.17647743225097656, -0.16916275024414062, -0.1618480682373047, -0.15453338623046875, -0.1472187042236328, -0.13990402221679688, -0.13258934020996094, -0.125274658203125, -0.11795997619628906, -0.11064529418945312, -0.10333061218261719, -0.09601593017578125, -0.08870124816894531, -0.08138656616210938, -0.07407188415527344, -0.0667572021484375, -0.05944252014160156, -0.052127838134765625, -0.04481315612792969, -0.03749847412109375, -0.030183792114257812, -0.022869110107421875, -0.015554428100585938, -0.00823974609375, -0.0009250640869140625, 0.006389617919921875, 0.013704299926757812, 0.02101898193359375, 0.028333663940429688, 0.035648345947265625, 0.04296302795410156, 0.0502777099609375, 0.05759239196777344, 0.06490707397460938, 0.07222175598144531, 0.07953643798828125, 0.08685111999511719, 0.09416580200195312, 0.10148048400878906, 0.108795166015625, 0.11610984802246094, 0.12342453002929688, 0.1307392120361328, 0.13805389404296875, 0.1453685760498047, 0.15268325805664062, 0.15999794006347656, 0.1673126220703125, 0.17462730407714844, 0.18194198608398438, 0.1892566680908203, 0.19657135009765625, 0.2038860321044922, 0.21120071411132812, 0.21851539611816406, 0.225830078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 7.0, 12.0, 7.0, 47.0, 95.0, 154.0, 222.0, 199.0, 134.0, 61.0, 30.0, 13.0, 5.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1180877685546875, -6.924006462097168, -6.729925155639648, -6.535843849182129, -6.341762542724609, -6.14768123626709, -5.95359992980957, -5.759518623352051, -5.565437316894531, -5.371356010437012, -5.177274703979492, -4.983193397521973, -4.789112091064453, -4.595030784606934, -4.400949478149414, -4.2068681716918945, -4.012786865234375, -3.8187055587768555, -3.624624252319336, -3.4305429458618164, -3.236461639404297, -3.0423803329467773, -2.848299026489258, -2.6542177200317383, -2.4601359367370605, -2.266054630279541, -2.0719733238220215, -1.877892017364502, -1.6838107109069824, -1.489729404449463, -1.2956479787826538, -1.1015666723251343, -0.9074854850769043, -0.7134041786193848, -0.5193228721618652, -0.3252415060997009, -0.1311601996421814, 0.06292110681533813, 0.25700247287750244, 0.451083779335022, 0.6451650857925415, 0.839246392250061, 1.0333276987075806, 1.2274091243743896, 1.4214904308319092, 1.6155717372894287, 1.8096530437469482, 2.0037343502044678, 2.1978156566619873, 2.391896963119507, 2.5859782695770264, 2.780059576034546, 2.9741408824920654, 3.168222188949585, 3.3623037338256836, 3.556385040283203, 3.7504663467407227, 3.944547653198242, 4.138628959655762, 4.332710266113281, 4.526791572570801, 4.72087287902832, 4.91495418548584, 5.109035491943359, 5.303116798400879]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 10.0, 11.0, 11.0, 13.0, 18.0, 13.0, 11.0, 18.0, 25.0, 24.0, 28.0, 24.0, 33.0, 29.0, 40.0, 38.0, 39.0, 43.0, 41.0, 44.0, 33.0, 37.0, 32.0, 27.0, 39.0, 40.0, 29.0, 36.0, 37.0, 25.0, 26.0, 21.0, 17.0, 14.0, 21.0, 4.0, 9.0, 9.0, 5.0, 5.0, 9.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6392848491668701, -1.5844029188156128, -1.529520869255066, -1.4746389389038086, -1.4197568893432617, -1.3648749589920044, -1.309993028640747, -1.2551109790802002, -1.2002290487289429, -1.1453471183776855, -1.0904650688171387, -1.0355831384658813, -0.9807011485099792, -0.9258191585540771, -0.8709372282028198, -0.8160552382469177, -0.7611732482910156, -0.7062912583351135, -0.6514092683792114, -0.5965273380279541, -0.541645348072052, -0.4867633581161499, -0.4318813979625702, -0.3769994378089905, -0.3221174478530884, -0.2672354578971863, -0.21235349774360657, -0.15747152268886566, -0.10258954763412476, -0.047707557678222656, 0.007174402475357056, 0.06205636262893677, 0.11693823337554932, 0.17182020843029022, 0.22670218348503113, 0.28158414363861084, 0.33646613359451294, 0.39134812355041504, 0.44623008370399475, 0.5011120438575745, 0.5559940338134766, 0.6108760237693787, 0.6657580137252808, 0.7206399440765381, 0.7755219340324402, 0.8304039239883423, 0.8852858543395996, 0.9401678442955017, 0.9950498342514038, 1.0499317646026611, 1.104813814163208, 1.1596957445144653, 1.2145776748657227, 1.2694597244262695, 1.3243416547775269, 1.3792235851287842, 1.434105634689331, 1.4889875650405884, 1.5438696146011353, 1.5987515449523926, 1.6536335945129395, 1.7085155248641968, 1.763397455215454, 1.818279504776001, 1.8731614351272583]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 10.0, 15.0, 17.0, 29.0, 44.0, 68.0, 101.0, 134.0, 180.0, 250.0, 384.0, 557.0, 816.0, 1202.0, 2126.0, 3523.0, 6493.0, 13432.0, 31728.0, 91680.0, 325470.0, 1113615.0, 1673050.0, 650410.0, 179982.0, 55362.0, 21258.0, 9719.0, 4997.0, 2798.0, 1668.0, 1040.0, 715.0, 428.0, 285.0, 212.0, 154.0, 102.0, 69.0, 46.0, 38.0, 22.0, 16.0, 9.0, 5.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.3359375, -0.3248405456542969, -0.31374359130859375, -0.3026466369628906, -0.2915496826171875, -0.2804527282714844, -0.26935577392578125, -0.2582588195800781, -0.247161865234375, -0.23606491088867188, -0.22496795654296875, -0.21387100219726562, -0.2027740478515625, -0.19167709350585938, -0.18058013916015625, -0.16948318481445312, -0.15838623046875, -0.14728927612304688, -0.13619232177734375, -0.12509536743164062, -0.1139984130859375, -0.10290145874023438, -0.09180450439453125, -0.08070755004882812, -0.069610595703125, -0.058513641357421875, -0.04741668701171875, -0.036319732666015625, -0.0252227783203125, -0.014125823974609375, -0.00302886962890625, 0.008068084716796875, 0.0191650390625, 0.030261993408203125, 0.04135894775390625, 0.052455902099609375, 0.0635528564453125, 0.07464981079101562, 0.08574676513671875, 0.09684371948242188, 0.107940673828125, 0.11903762817382812, 0.13013458251953125, 0.14123153686523438, 0.1523284912109375, 0.16342544555664062, 0.17452239990234375, 0.18561935424804688, 0.19671630859375, 0.20781326293945312, 0.21891021728515625, 0.23000717163085938, 0.2411041259765625, 0.2522010803222656, 0.26329803466796875, 0.2743949890136719, 0.285491943359375, 0.2965888977050781, 0.30768585205078125, 0.3187828063964844, 0.3298797607421875, 0.3409767150878906, 0.35207366943359375, 0.3631706237792969, 0.374267578125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 3.0, 7.0, 6.0, 6.0, 14.0, 15.0, 8.0, 20.0, 18.0, 14.0, 22.0, 27.0, 17.0, 28.0, 33.0, 33.0, 31.0, 36.0, 35.0, 42.0, 40.0, 45.0, 39.0, 42.0, 27.0, 41.0, 37.0, 24.0, 25.0, 38.0, 25.0, 22.0, 17.0, 30.0, 20.0, 14.0, 16.0, 21.0, 13.0, 9.0, 8.0, 4.0, 5.0, 7.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2186279296875, -0.21173477172851562, -0.20484161376953125, -0.19794845581054688, -0.1910552978515625, -0.18416213989257812, -0.17726898193359375, -0.17037582397460938, -0.163482666015625, -0.15658950805664062, -0.14969635009765625, -0.14280319213867188, -0.1359100341796875, -0.12901687622070312, -0.12212371826171875, -0.11523056030273438, -0.10833740234375, -0.10144424438476562, -0.09455108642578125, -0.08765792846679688, -0.0807647705078125, -0.07387161254882812, -0.06697845458984375, -0.060085296630859375, -0.053192138671875, -0.046298980712890625, -0.03940582275390625, -0.032512664794921875, -0.0256195068359375, -0.018726348876953125, -0.01183319091796875, -0.004940032958984375, 0.001953125, 0.008846282958984375, 0.01573944091796875, 0.022632598876953125, 0.0295257568359375, 0.036418914794921875, 0.04331207275390625, 0.050205230712890625, 0.057098388671875, 0.06399154663085938, 0.07088470458984375, 0.07777786254882812, 0.0846710205078125, 0.09156417846679688, 0.09845733642578125, 0.10535049438476562, 0.11224365234375, 0.11913681030273438, 0.12602996826171875, 0.13292312622070312, 0.1398162841796875, 0.14670944213867188, 0.15360260009765625, 0.16049575805664062, 0.167388916015625, 0.17428207397460938, 0.18117523193359375, 0.18806838989257812, 0.1949615478515625, 0.20185470581054688, 0.20874786376953125, 0.21564102172851562, 0.2225341796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 7.0, 10.0, 8.0, 25.0, 29.0, 39.0, 63.0, 81.0, 113.0, 176.0, 283.0, 435.0, 768.0, 1265.0, 2234.0, 4462.0, 9894.0, 25793.0, 84803.0, 398928.0, 2384233.0, 1036954.0, 169912.0, 44605.0, 15529.0, 6326.0, 3159.0, 1639.0, 950.0, 541.0, 323.0, 217.0, 150.0, 101.0, 58.0, 52.0, 25.0, 21.0, 15.0, 15.0, 11.0, 11.0, 7.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5693359375, -0.5501937866210938, -0.5310516357421875, -0.5119094848632812, -0.492767333984375, -0.47362518310546875, -0.4544830322265625, -0.43534088134765625, -0.41619873046875, -0.39705657958984375, -0.3779144287109375, -0.35877227783203125, -0.339630126953125, -0.32048797607421875, -0.3013458251953125, -0.28220367431640625, -0.2630615234375, -0.24391937255859375, -0.2247772216796875, -0.20563507080078125, -0.186492919921875, -0.16735076904296875, -0.1482086181640625, -0.12906646728515625, -0.10992431640625, -0.09078216552734375, -0.0716400146484375, -0.05249786376953125, -0.033355712890625, -0.01421356201171875, 0.0049285888671875, 0.02407073974609375, 0.043212890625, 0.06235504150390625, 0.0814971923828125, 0.10063934326171875, 0.119781494140625, 0.13892364501953125, 0.1580657958984375, 0.17720794677734375, 0.19635009765625, 0.21549224853515625, 0.2346343994140625, 0.25377655029296875, 0.272918701171875, 0.29206085205078125, 0.3112030029296875, 0.33034515380859375, 0.3494873046875, 0.36862945556640625, 0.3877716064453125, 0.40691375732421875, 0.426055908203125, 0.44519805908203125, 0.4643402099609375, 0.48348236083984375, 0.50262451171875, 0.5217666625976562, 0.5409088134765625, 0.5600509643554688, 0.579193115234375, 0.5983352661132812, 0.6174774169921875, 0.6366195678710938, 0.65576171875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 7.0, 4.0, 7.0, 10.0, 16.0, 27.0, 26.0, 31.0, 41.0, 50.0, 77.0, 89.0, 117.0, 170.0, 264.0, 348.0, 502.0, 557.0, 497.0, 343.0, 231.0, 143.0, 115.0, 87.0, 61.0, 70.0, 45.0, 20.0, 22.0, 24.0, 16.0, 15.0, 7.0, 6.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.5078125, -0.49213409423828125, -0.4764556884765625, -0.46077728271484375, -0.445098876953125, -0.42942047119140625, -0.4137420654296875, -0.39806365966796875, -0.38238525390625, -0.36670684814453125, -0.3510284423828125, -0.33535003662109375, -0.319671630859375, -0.30399322509765625, -0.2883148193359375, -0.27263641357421875, -0.2569580078125, -0.24127960205078125, -0.2256011962890625, -0.20992279052734375, -0.194244384765625, -0.17856597900390625, -0.1628875732421875, -0.14720916748046875, -0.13153076171875, -0.11585235595703125, -0.1001739501953125, -0.08449554443359375, -0.068817138671875, -0.05313873291015625, -0.0374603271484375, -0.02178192138671875, -0.006103515625, 0.00957489013671875, 0.0252532958984375, 0.04093170166015625, 0.056610107421875, 0.07228851318359375, 0.0879669189453125, 0.10364532470703125, 0.11932373046875, 0.13500213623046875, 0.1506805419921875, 0.16635894775390625, 0.182037353515625, 0.19771575927734375, 0.2133941650390625, 0.22907257080078125, 0.2447509765625, 0.26042938232421875, 0.2761077880859375, 0.29178619384765625, 0.307464599609375, 0.32314300537109375, 0.3388214111328125, 0.35449981689453125, 0.37017822265625, 0.38585662841796875, 0.4015350341796875, 0.41721343994140625, 0.432891845703125, 0.44857025146484375, 0.4642486572265625, 0.47992706298828125, 0.49560546875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 6.0, 4.0, 6.0, 18.0, 30.0, 45.0, 65.0, 119.0, 115.0, 180.0, 154.0, 93.0, 82.0, 31.0, 19.0, 14.0, 10.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7933478355407715, -3.649268865585327, -3.505189895629883, -3.3611106872558594, -3.217031717300415, -3.0729527473449707, -2.9288735389709473, -2.784794569015503, -2.6407155990600586, -2.4966366291046143, -2.35255765914917, -2.2084784507751465, -2.064399480819702, -1.9203205108642578, -1.776241421699524, -1.63216233253479, -1.4880833625793457, -1.3440043926239014, -1.1999253034591675, -1.0558462142944336, -0.9117672443389893, -0.7676882147789001, -0.623609185218811, -0.47953009605407715, -0.3354511260986328, -0.1913720965385437, -0.04729306697845459, 0.09678596258163452, 0.24086499214172363, 0.38494402170181274, 0.5290230512619019, 0.6731021404266357, 0.8171811103820801, 0.9612601399421692, 1.1053391695022583, 1.2494182586669922, 1.3934972286224365, 1.5375761985778809, 1.6816552877426147, 1.8257343769073486, 1.969813346862793, 2.1138923168182373, 2.2579712867736816, 2.402050495147705, 2.5461294651031494, 2.6902084350585938, 2.834287643432617, 2.9783666133880615, 3.122445583343506, 3.26652455329895, 3.4106035232543945, 3.554682731628418, 3.6987617015838623, 3.8428406715393066, 3.98691987991333, 4.130998611450195, 4.275077819824219, 4.419157028198242, 4.563235759735107, 4.707314968109131, 4.851393699645996, 4.9954729080200195, 5.139552116394043, 5.283631324768066, 5.427710056304932]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 6.0, 8.0, 11.0, 10.0, 14.0, 20.0, 16.0, 16.0, 21.0, 19.0, 29.0, 23.0, 32.0, 36.0, 37.0, 28.0, 35.0, 27.0, 28.0, 36.0, 44.0, 26.0, 31.0, 32.0, 39.0, 38.0, 36.0, 35.0, 29.0, 34.0, 33.0, 20.0, 24.0, 18.0, 10.0, 17.0, 14.0, 10.0, 11.0, 10.0, 4.0, 10.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5321400165557861, -1.485368251800537, -1.438596487045288, -1.391824722290039, -1.34505295753479, -1.298281192779541, -1.251509428024292, -1.204737663269043, -1.157965898513794, -1.111194133758545, -1.064422369003296, -1.0176506042480469, -0.9708788394927979, -0.9241070747375488, -0.877335250377655, -0.830563485622406, -0.7837916612625122, -0.7370198965072632, -0.6902481317520142, -0.6434763669967651, -0.5967046022415161, -0.5499328374862671, -0.5031610131263733, -0.45638924837112427, -0.40961748361587524, -0.3628457188606262, -0.3160739541053772, -0.2693021595478058, -0.22253039479255676, -0.17575863003730774, -0.12898683547973633, -0.0822150707244873, -0.03544342517852783, 0.011328347027301788, 0.05810011923313141, 0.10487189888954163, 0.15164366364479065, 0.19841542840003967, 0.24518722295761108, 0.2919589877128601, 0.33873075246810913, 0.38550251722335815, 0.4322742819786072, 0.4790460765361786, 0.52581787109375, 0.572589635848999, 0.619361400604248, 0.6661331653594971, 0.7129049301147461, 0.7596766948699951, 0.8064484596252441, 0.8532202243804932, 0.8999919891357422, 0.9467637538909912, 0.993535578250885, 1.0403072834014893, 1.0870790481567383, 1.1338508129119873, 1.1806225776672363, 1.2273943424224854, 1.2741661071777344, 1.3209378719329834, 1.3677096366882324, 1.4144814014434814, 1.46125328540802]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 4.0, 8.0, 16.0, 13.0, 29.0, 32.0, 59.0, 63.0, 91.0, 145.0, 221.0, 310.0, 432.0, 649.0, 979.0, 1634.0, 2692.0, 4463.0, 8613.0, 18235.0, 42246.0, 104633.0, 233815.0, 303695.0, 185127.0, 77609.0, 31516.0, 14316.0, 6932.0, 3787.0, 2143.0, 1417.0, 874.0, 521.0, 384.0, 271.0, 193.0, 121.0, 76.0, 50.0, 37.0, 38.0, 11.0, 15.0, 10.0, 10.0, 11.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.429443359375, -0.4157371520996094, -0.40203094482421875, -0.3883247375488281, -0.3746185302734375, -0.3609123229980469, -0.34720611572265625, -0.3334999084472656, -0.319793701171875, -0.3060874938964844, -0.29238128662109375, -0.2786750793457031, -0.2649688720703125, -0.2512626647949219, -0.23755645751953125, -0.22385025024414062, -0.21014404296875, -0.19643783569335938, -0.18273162841796875, -0.16902542114257812, -0.1553192138671875, -0.14161300659179688, -0.12790679931640625, -0.11420059204101562, -0.100494384765625, -0.08678817749023438, -0.07308197021484375, -0.059375762939453125, -0.0456695556640625, -0.031963348388671875, -0.01825714111328125, -0.004550933837890625, 0.0091552734375, 0.022861480712890625, 0.03656768798828125, 0.050273895263671875, 0.0639801025390625, 0.07768630981445312, 0.09139251708984375, 0.10509872436523438, 0.118804931640625, 0.13251113891601562, 0.14621734619140625, 0.15992355346679688, 0.1736297607421875, 0.18733596801757812, 0.20104217529296875, 0.21474838256835938, 0.22845458984375, 0.24216079711914062, 0.25586700439453125, 0.2695732116699219, 0.2832794189453125, 0.2969856262207031, 0.31069183349609375, 0.3243980407714844, 0.338104248046875, 0.3518104553222656, 0.36551666259765625, 0.3792228698730469, 0.3929290771484375, 0.4066352844238281, 0.42034149169921875, 0.4340476989746094, 0.44775390625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 7.0, 11.0, 11.0, 18.0, 15.0, 16.0, 22.0, 18.0, 28.0, 39.0, 31.0, 28.0, 22.0, 29.0, 38.0, 38.0, 41.0, 27.0, 40.0, 33.0, 32.0, 37.0, 41.0, 42.0, 41.0, 37.0, 22.0, 22.0, 30.0, 25.0, 27.0, 23.0, 13.0, 11.0, 18.0, 13.0, 9.0, 8.0, 3.0, 5.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.25830078125, -0.25070953369140625, -0.2431182861328125, -0.23552703857421875, -0.227935791015625, -0.22034454345703125, -0.2127532958984375, -0.20516204833984375, -0.19757080078125, -0.18997955322265625, -0.1823883056640625, -0.17479705810546875, -0.167205810546875, -0.15961456298828125, -0.1520233154296875, -0.14443206787109375, -0.1368408203125, -0.12924957275390625, -0.1216583251953125, -0.11406707763671875, -0.106475830078125, -0.09888458251953125, -0.0912933349609375, -0.08370208740234375, -0.07611083984375, -0.06851959228515625, -0.0609283447265625, -0.05333709716796875, -0.045745849609375, -0.03815460205078125, -0.0305633544921875, -0.02297210693359375, -0.015380859375, -0.00778961181640625, -0.0001983642578125, 0.00739288330078125, 0.014984130859375, 0.02257537841796875, 0.0301666259765625, 0.03775787353515625, 0.04534912109375, 0.05294036865234375, 0.0605316162109375, 0.06812286376953125, 0.075714111328125, 0.08330535888671875, 0.0908966064453125, 0.09848785400390625, 0.1060791015625, 0.11367034912109375, 0.1212615966796875, 0.12885284423828125, 0.136444091796875, 0.14403533935546875, 0.1516265869140625, 0.15921783447265625, 0.16680908203125, 0.17440032958984375, 0.1819915771484375, 0.18958282470703125, 0.197174072265625, 0.20476531982421875, 0.2123565673828125, 0.21994781494140625, 0.2275390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 10.0, 12.0, 20.0, 25.0, 37.0, 67.0, 98.0, 154.0, 215.0, 450.0, 724.0, 1267.0, 2378.0, 4913.0, 10178.0, 23784.0, 63107.0, 176463.0, 341401.0, 258171.0, 100668.0, 35897.0, 14607.0, 6709.0, 3186.0, 1703.0, 933.0, 516.0, 337.0, 190.0, 114.0, 65.0, 52.0, 32.0, 23.0, 13.0, 11.0, 9.0, 7.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5, -0.4855995178222656, -0.47119903564453125, -0.4567985534667969, -0.4423980712890625, -0.4279975891113281, -0.41359710693359375, -0.3991966247558594, -0.384796142578125, -0.3703956604003906, -0.35599517822265625, -0.3415946960449219, -0.3271942138671875, -0.3127937316894531, -0.29839324951171875, -0.2839927673339844, -0.26959228515625, -0.2551918029785156, -0.24079132080078125, -0.22639083862304688, -0.2119903564453125, -0.19758987426757812, -0.18318939208984375, -0.16878890991210938, -0.154388427734375, -0.13998794555664062, -0.12558746337890625, -0.11118698120117188, -0.0967864990234375, -0.08238601684570312, -0.06798553466796875, -0.053585052490234375, -0.0391845703125, -0.024784088134765625, -0.01038360595703125, 0.004016876220703125, 0.0184173583984375, 0.032817840576171875, 0.04721832275390625, 0.061618804931640625, 0.076019287109375, 0.09041976928710938, 0.10482025146484375, 0.11922073364257812, 0.1336212158203125, 0.14802169799804688, 0.16242218017578125, 0.17682266235351562, 0.19122314453125, 0.20562362670898438, 0.22002410888671875, 0.23442459106445312, 0.2488250732421875, 0.2632255554199219, 0.27762603759765625, 0.2920265197753906, 0.306427001953125, 0.3208274841308594, 0.33522796630859375, 0.3496284484863281, 0.3640289306640625, 0.3784294128417969, 0.39282989501953125, 0.4072303771972656, 0.421630859375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 8.0, 5.0, 6.0, 12.0, 14.0, 18.0, 18.0, 22.0, 24.0, 33.0, 39.0, 31.0, 44.0, 47.0, 50.0, 62.0, 39.0, 56.0, 57.0, 43.0, 48.0, 32.0, 27.0, 39.0, 45.0, 31.0, 26.0, 20.0, 21.0, 21.0, 18.0, 8.0, 11.0, 6.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87109375, -0.844970703125, -0.81884765625, -0.792724609375, -0.7666015625, -0.740478515625, -0.71435546875, -0.688232421875, -0.662109375, -0.635986328125, -0.60986328125, -0.583740234375, -0.5576171875, -0.531494140625, -0.50537109375, -0.479248046875, -0.453125, -0.427001953125, -0.40087890625, -0.374755859375, -0.3486328125, -0.322509765625, -0.29638671875, -0.270263671875, -0.244140625, -0.218017578125, -0.19189453125, -0.165771484375, -0.1396484375, -0.113525390625, -0.08740234375, -0.061279296875, -0.03515625, -0.009033203125, 0.01708984375, 0.043212890625, 0.0693359375, 0.095458984375, 0.12158203125, 0.147705078125, 0.173828125, 0.199951171875, 0.22607421875, 0.252197265625, 0.2783203125, 0.304443359375, 0.33056640625, 0.356689453125, 0.3828125, 0.408935546875, 0.43505859375, 0.461181640625, 0.4873046875, 0.513427734375, 0.53955078125, 0.565673828125, 0.591796875, 0.617919921875, 0.64404296875, 0.670166015625, 0.6962890625, 0.722412109375, 0.74853515625, 0.774658203125, 0.80078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 8.0, 2.0, 7.0, 11.0, 19.0, 28.0, 47.0, 58.0, 88.0, 148.0, 202.0, 354.0, 542.0, 866.0, 1459.0, 2572.0, 4519.0, 8680.0, 17459.0, 37608.0, 85885.0, 202042.0, 318720.0, 204679.0, 87209.0, 38182.0, 17444.0, 8707.0, 4580.0, 2658.0, 1391.0, 864.0, 544.0, 369.0, 214.0, 119.0, 110.0, 60.0, 35.0, 29.0, 15.0, 12.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1971435546875, -0.1915912628173828, -0.18603897094726562, -0.18048667907714844, -0.17493438720703125, -0.16938209533691406, -0.16382980346679688, -0.1582775115966797, -0.1527252197265625, -0.1471729278564453, -0.14162063598632812, -0.13606834411621094, -0.13051605224609375, -0.12496376037597656, -0.11941146850585938, -0.11385917663574219, -0.108306884765625, -0.10275459289550781, -0.09720230102539062, -0.09165000915527344, -0.08609771728515625, -0.08054542541503906, -0.07499313354492188, -0.06944084167480469, -0.0638885498046875, -0.05833625793457031, -0.052783966064453125, -0.04723167419433594, -0.04167938232421875, -0.03612709045410156, -0.030574798583984375, -0.025022506713867188, -0.01947021484375, -0.013917922973632812, -0.008365631103515625, -0.0028133392333984375, 0.00273895263671875, 0.008291244506835938, 0.013843536376953125, 0.019395828247070312, 0.0249481201171875, 0.030500411987304688, 0.036052703857421875, 0.04160499572753906, 0.04715728759765625, 0.05270957946777344, 0.058261871337890625, 0.06381416320800781, 0.069366455078125, 0.07491874694824219, 0.08047103881835938, 0.08602333068847656, 0.09157562255859375, 0.09712791442871094, 0.10268020629882812, 0.10823249816894531, 0.1137847900390625, 0.11933708190917969, 0.12488937377929688, 0.13044166564941406, 0.13599395751953125, 0.14154624938964844, 0.14709854125976562, 0.1526508331298828, 0.158203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 11.0, 5.0, 16.0, 19.0, 15.0, 40.0, 36.0, 49.0, 50.0, 85.0, 93.0, 109.0, 95.0, 88.0, 58.0, 43.0, 40.0, 31.0, 23.0, 14.0, 14.0, 9.0, 8.0, 7.0, 4.0, 3.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.0677528381347656e-05, -5.8564357459545135e-05, -5.6451186537742615e-05, -5.4338015615940094e-05, -5.222484469413757e-05, -5.011167377233505e-05, -4.799850285053253e-05, -4.588533192873001e-05, -4.377216100692749e-05, -4.165899008512497e-05, -3.954581916332245e-05, -3.743264824151993e-05, -3.531947731971741e-05, -3.3206306397914886e-05, -3.1093135476112366e-05, -2.8979964554309845e-05, -2.6866793632507324e-05, -2.4753622710704803e-05, -2.2640451788902283e-05, -2.0527280867099762e-05, -1.841410994529724e-05, -1.630093902349472e-05, -1.41877681016922e-05, -1.2074597179889679e-05, -9.961426258087158e-06, -7.848255336284637e-06, -5.735084414482117e-06, -3.621913492679596e-06, -1.5087425708770752e-06, 6.044283509254456e-07, 2.7175992727279663e-06, 4.830770194530487e-06, 6.943941116333008e-06, 9.057112038135529e-06, 1.117028295993805e-05, 1.328345388174057e-05, 1.539662480354309e-05, 1.750979572534561e-05, 1.9622966647148132e-05, 2.1736137568950653e-05, 2.3849308490753174e-05, 2.5962479412555695e-05, 2.8075650334358215e-05, 3.0188821256160736e-05, 3.230199217796326e-05, 3.441516309976578e-05, 3.65283340215683e-05, 3.864150494337082e-05, 4.075467586517334e-05, 4.286784678697586e-05, 4.498101770877838e-05, 4.70941886305809e-05, 4.920735955238342e-05, 5.1320530474185944e-05, 5.3433701395988464e-05, 5.5546872317790985e-05, 5.7660043239593506e-05, 5.9773214161396027e-05, 6.188638508319855e-05, 6.399955600500107e-05, 6.611272692680359e-05, 6.822589784860611e-05, 7.033906877040863e-05, 7.245223969221115e-05, 7.456541061401367e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 16.0, 18.0, 22.0, 30.0, 31.0, 59.0, 86.0, 130.0, 203.0, 312.0, 466.0, 765.0, 1239.0, 1903.0, 3109.0, 4933.0, 7859.0, 13276.0, 22626.0, 39405.0, 70163.0, 122539.0, 190666.0, 209918.0, 149748.0, 88356.0, 50058.0, 28355.0, 16436.0, 9813.0, 6109.0, 3648.0, 2285.0, 1480.0, 852.0, 550.0, 346.0, 250.0, 176.0, 105.0, 77.0, 40.0, 30.0, 26.0, 13.0, 9.0, 4.0, 6.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11175537109375, -0.10792827606201172, -0.10410118103027344, -0.10027408599853516, -0.09644699096679688, -0.0926198959350586, -0.08879280090332031, -0.08496570587158203, -0.08113861083984375, -0.07731151580810547, -0.07348442077636719, -0.0696573257446289, -0.06583023071289062, -0.062003135681152344, -0.05817604064941406, -0.05434894561767578, -0.0505218505859375, -0.04669475555419922, -0.04286766052246094, -0.039040565490722656, -0.035213470458984375, -0.031386375427246094, -0.027559280395507812, -0.02373218536376953, -0.01990509033203125, -0.01607799530029297, -0.012250900268554688, -0.008423805236816406, -0.004596710205078125, -0.0007696151733398438, 0.0030574798583984375, 0.006884574890136719, 0.010711669921875, 0.014538764953613281, 0.018365859985351562, 0.022192955017089844, 0.026020050048828125, 0.029847145080566406, 0.03367424011230469, 0.03750133514404297, 0.04132843017578125, 0.04515552520751953, 0.04898262023925781, 0.052809715270996094, 0.056636810302734375, 0.060463905334472656, 0.06429100036621094, 0.06811809539794922, 0.0719451904296875, 0.07577228546142578, 0.07959938049316406, 0.08342647552490234, 0.08725357055664062, 0.0910806655883789, 0.09490776062011719, 0.09873485565185547, 0.10256195068359375, 0.10638904571533203, 0.11021614074707031, 0.1140432357788086, 0.11787033081054688, 0.12169742584228516, 0.12552452087402344, 0.12935161590576172, 0.1331787109375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 15.0, 9.0, 16.0, 20.0, 17.0, 15.0, 20.0, 31.0, 38.0, 38.0, 58.0, 53.0, 60.0, 47.0, 52.0, 66.0, 58.0, 43.0, 49.0, 33.0, 23.0, 24.0, 25.0, 26.0, 22.0, 24.0, 13.0, 12.0, 11.0, 9.0, 7.0, 4.0, 13.0, 4.0, 5.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1829833984375, -0.1775360107421875, -0.172088623046875, -0.1666412353515625, -0.16119384765625, -0.1557464599609375, -0.150299072265625, -0.1448516845703125, -0.139404296875, -0.1339569091796875, -0.128509521484375, -0.1230621337890625, -0.11761474609375, -0.1121673583984375, -0.106719970703125, -0.1012725830078125, -0.0958251953125, -0.0903778076171875, -0.084930419921875, -0.0794830322265625, -0.07403564453125, -0.0685882568359375, -0.063140869140625, -0.0576934814453125, -0.05224609375, -0.0467987060546875, -0.041351318359375, -0.0359039306640625, -0.03045654296875, -0.0250091552734375, -0.019561767578125, -0.0141143798828125, -0.0086669921875, -0.0032196044921875, 0.002227783203125, 0.0076751708984375, 0.01312255859375, 0.0185699462890625, 0.024017333984375, 0.0294647216796875, 0.034912109375, 0.0403594970703125, 0.045806884765625, 0.0512542724609375, 0.05670166015625, 0.0621490478515625, 0.067596435546875, 0.0730438232421875, 0.0784912109375, 0.0839385986328125, 0.089385986328125, 0.0948333740234375, 0.10028076171875, 0.1057281494140625, 0.111175537109375, 0.1166229248046875, 0.1220703125, 0.1275177001953125, 0.132965087890625, 0.1384124755859375, 0.14385986328125, 0.1493072509765625, 0.154754638671875, 0.1602020263671875, 0.1656494140625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 19.0, 28.0, 113.0, 195.0, 225.0, 206.0, 119.0, 50.0, 19.0, 10.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.889909744262695, -8.674944877624512, -8.459980010986328, -8.245015144348145, -8.030050277709961, -7.815085411071777, -7.600120544433594, -7.385156154632568, -7.170191287994385, -6.955226421356201, -6.740261554718018, -6.525296688079834, -6.31033182144165, -6.095367431640625, -5.880402565002441, -5.665437698364258, -5.450472831726074, -5.235507965087891, -5.020543098449707, -4.805578231811523, -4.59061336517334, -4.375648498535156, -4.160683631896973, -3.9457192420959473, -3.7307538986206055, -3.515789031982422, -3.3008241653442383, -3.0858592987060547, -2.87089467048645, -2.6559298038482666, -2.440964937210083, -2.2260003089904785, -2.011035442352295, -1.7960705757141113, -1.5811058282852173, -1.3661409616470337, -1.1511762142181396, -0.936211347579956, -0.7212464809417725, -0.5062817335128784, -0.2913168668746948, -0.07635204493999481, 0.1386127769947052, 0.3535776138305664, 0.5685424208641052, 0.783507227897644, 0.9984720945358276, 1.2134368419647217, 1.4284017086029053, 1.6433665752410889, 1.858331322669983, 2.073296070098877, 2.2882609367370605, 2.503225803375244, 2.7181906700134277, 2.9331555366516113, 3.148120403289795, 3.3630852699279785, 3.578050136566162, 3.7930150032043457, 4.007979869842529, 4.222944259643555, 4.437909126281738, 4.652873992919922, 4.8678388595581055]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 6.0, 12.0, 11.0, 11.0, 12.0, 16.0, 18.0, 21.0, 25.0, 20.0, 22.0, 30.0, 31.0, 29.0, 31.0, 36.0, 31.0, 48.0, 30.0, 39.0, 47.0, 45.0, 34.0, 33.0, 38.0, 42.0, 32.0, 26.0, 28.0, 35.0, 17.0, 25.0, 31.0, 7.0, 14.0, 14.0, 7.0, 5.0, 4.0, 4.0, 5.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6282906532287598, -1.573364019393921, -1.5184375047683716, -1.4635108709335327, -1.4085842370986938, -1.3536577224731445, -1.2987310886383057, -1.2438044548034668, -1.1888779401779175, -1.1339513063430786, -1.0790247917175293, -1.0240981578826904, -0.9691715836524963, -0.9142450094223022, -0.8593183755874634, -0.8043918013572693, -0.7494651675224304, -0.6945385932922363, -0.6396119594573975, -0.5846853852272034, -0.5297588109970093, -0.4748322069644928, -0.4199056029319763, -0.3649790287017822, -0.31005242466926575, -0.25512582063674927, -0.20019924640655518, -0.1452726423740387, -0.09034605324268341, -0.035419464111328125, 0.019507139921188354, 0.07443371415138245, 0.12936031818389893, 0.1842869073152542, 0.2392134964466095, 0.294140100479126, 0.34906667470932007, 0.40399327874183655, 0.458919882774353, 0.5138464570045471, 0.5687730312347412, 0.6236996054649353, 0.6786262392997742, 0.7335528135299683, 0.7884793877601624, 0.8434059619903564, 0.8983325958251953, 0.9532591700553894, 1.008185863494873, 1.063112497329712, 1.1180390119552612, 1.1729656457901, 1.227892279624939, 1.2828187942504883, 1.3377454280853271, 1.392672061920166, 1.4475985765457153, 1.5025252103805542, 1.5574517250061035, 1.6123783588409424, 1.6673049926757812, 1.7222315073013306, 1.7771581411361694, 1.8320846557617188, 1.8870112895965576]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 3.0, 9.0, 4.0, 4.0, 15.0, 8.0, 30.0, 32.0, 51.0, 52.0, 98.0, 103.0, 141.0, 185.0, 277.0, 400.0, 633.0, 1063.0, 1803.0, 3130.0, 5997.0, 12554.0, 30390.0, 95868.0, 415304.0, 1652136.0, 1481583.0, 353373.0, 85524.0, 28176.0, 11611.0, 5718.0, 3028.0, 1768.0, 1066.0, 688.0, 394.0, 297.0, 210.0, 157.0, 97.0, 75.0, 65.0, 45.0, 26.0, 13.0, 17.0, 24.0, 11.0, 10.0, 4.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.400146484375, -0.3863258361816406, -0.37250518798828125, -0.3586845397949219, -0.3448638916015625, -0.3310432434082031, -0.31722259521484375, -0.3034019470214844, -0.289581298828125, -0.2757606506347656, -0.26194000244140625, -0.24811935424804688, -0.2342987060546875, -0.22047805786132812, -0.20665740966796875, -0.19283676147460938, -0.17901611328125, -0.16519546508789062, -0.15137481689453125, -0.13755416870117188, -0.1237335205078125, -0.10991287231445312, -0.09609222412109375, -0.08227157592773438, -0.068450927734375, -0.054630279541015625, -0.04080963134765625, -0.026988983154296875, -0.0131683349609375, 0.000652313232421875, 0.01447296142578125, 0.028293609619140625, 0.0421142578125, 0.055934906005859375, 0.06975555419921875, 0.08357620239257812, 0.0973968505859375, 0.11121749877929688, 0.12503814697265625, 0.13885879516601562, 0.152679443359375, 0.16650009155273438, 0.18032073974609375, 0.19414138793945312, 0.2079620361328125, 0.22178268432617188, 0.23560333251953125, 0.24942398071289062, 0.26324462890625, 0.2770652770996094, 0.29088592529296875, 0.3047065734863281, 0.3185272216796875, 0.3323478698730469, 0.34616851806640625, 0.3599891662597656, 0.373809814453125, 0.3876304626464844, 0.40145111083984375, 0.4152717590332031, 0.4290924072265625, 0.4429130554199219, 0.45673370361328125, 0.4705543518066406, 0.484375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 8.0, 7.0, 6.0, 13.0, 9.0, 18.0, 16.0, 21.0, 25.0, 32.0, 23.0, 25.0, 39.0, 37.0, 46.0, 46.0, 52.0, 35.0, 34.0, 31.0, 42.0, 45.0, 33.0, 37.0, 33.0, 32.0, 27.0, 35.0, 37.0, 28.0, 29.0, 14.0, 17.0, 16.0, 11.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.287841796875, -0.2797889709472656, -0.27173614501953125, -0.2636833190917969, -0.2556304931640625, -0.24757766723632812, -0.23952484130859375, -0.23147201538085938, -0.223419189453125, -0.21536636352539062, -0.20731353759765625, -0.19926071166992188, -0.1912078857421875, -0.18315505981445312, -0.17510223388671875, -0.16704940795898438, -0.15899658203125, -0.15094375610351562, -0.14289093017578125, -0.13483810424804688, -0.1267852783203125, -0.11873245239257812, -0.11067962646484375, -0.10262680053710938, -0.094573974609375, -0.08652114868164062, -0.07846832275390625, -0.07041549682617188, -0.0623626708984375, -0.054309844970703125, -0.04625701904296875, -0.038204193115234375, -0.0301513671875, -0.022098541259765625, -0.01404571533203125, -0.005992889404296875, 0.0020599365234375, 0.010112762451171875, 0.01816558837890625, 0.026218414306640625, 0.034271240234375, 0.042324066162109375, 0.05037689208984375, 0.058429718017578125, 0.0664825439453125, 0.07453536987304688, 0.08258819580078125, 0.09064102172851562, 0.09869384765625, 0.10674667358398438, 0.11479949951171875, 0.12285232543945312, 0.1309051513671875, 0.13895797729492188, 0.14701080322265625, 0.15506362915039062, 0.163116455078125, 0.17116928100585938, 0.17922210693359375, 0.18727493286132812, 0.1953277587890625, 0.20338058471679688, 0.21143341064453125, 0.21948623657226562, 0.2275390625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 14.0, 7.0, 10.0, 11.0, 18.0, 43.0, 42.0, 68.0, 79.0, 123.0, 196.0, 268.0, 383.0, 545.0, 865.0, 1290.0, 1966.0, 3172.0, 5190.0, 9084.0, 17002.0, 33708.0, 76096.0, 204619.0, 743618.0, 2026978.0, 721687.0, 199408.0, 74479.0, 33313.0, 16686.0, 8951.0, 5260.0, 3175.0, 1977.0, 1268.0, 825.0, 583.0, 393.0, 258.0, 177.0, 141.0, 93.0, 63.0, 52.0, 22.0, 25.0, 11.0, 12.0, 10.0, 8.0, 2.0, 2.0, 5.0, 2.0, 3.0], "bins": [-0.40625, -0.3941192626953125, -0.381988525390625, -0.3698577880859375, -0.35772705078125, -0.3455963134765625, -0.333465576171875, -0.3213348388671875, -0.3092041015625, -0.2970733642578125, -0.284942626953125, -0.2728118896484375, -0.26068115234375, -0.2485504150390625, -0.236419677734375, -0.2242889404296875, -0.212158203125, -0.2000274658203125, -0.187896728515625, -0.1757659912109375, -0.16363525390625, -0.1515045166015625, -0.139373779296875, -0.1272430419921875, -0.1151123046875, -0.1029815673828125, -0.090850830078125, -0.0787200927734375, -0.06658935546875, -0.0544586181640625, -0.042327880859375, -0.0301971435546875, -0.01806640625, -0.0059356689453125, 0.006195068359375, 0.0183258056640625, 0.03045654296875, 0.0425872802734375, 0.054718017578125, 0.0668487548828125, 0.0789794921875, 0.0911102294921875, 0.103240966796875, 0.1153717041015625, 0.12750244140625, 0.1396331787109375, 0.151763916015625, 0.1638946533203125, 0.176025390625, 0.1881561279296875, 0.200286865234375, 0.2124176025390625, 0.22454833984375, 0.2366790771484375, 0.248809814453125, 0.2609405517578125, 0.2730712890625, 0.2852020263671875, 0.297332763671875, 0.3094635009765625, 0.32159423828125, 0.3337249755859375, 0.345855712890625, 0.3579864501953125, 0.3701171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 5.0, 5.0, 10.0, 13.0, 28.0, 25.0, 30.0, 40.0, 65.0, 93.0, 130.0, 183.0, 266.0, 491.0, 644.0, 667.0, 420.0, 320.0, 187.0, 119.0, 84.0, 61.0, 43.0, 29.0, 26.0, 16.0, 16.0, 13.0, 8.0, 7.0, 9.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65673828125, -0.6373977661132812, -0.6180572509765625, -0.5987167358398438, -0.579376220703125, -0.5600357055664062, -0.5406951904296875, -0.5213546752929688, -0.50201416015625, -0.48267364501953125, -0.4633331298828125, -0.44399261474609375, -0.424652099609375, -0.40531158447265625, -0.3859710693359375, -0.36663055419921875, -0.3472900390625, -0.32794952392578125, -0.3086090087890625, -0.28926849365234375, -0.269927978515625, -0.25058746337890625, -0.2312469482421875, -0.21190643310546875, -0.19256591796875, -0.17322540283203125, -0.1538848876953125, -0.13454437255859375, -0.115203857421875, -0.09586334228515625, -0.0765228271484375, -0.05718231201171875, -0.037841796875, -0.01850128173828125, 0.0008392333984375, 0.02017974853515625, 0.039520263671875, 0.05886077880859375, 0.0782012939453125, 0.09754180908203125, 0.11688232421875, 0.13622283935546875, 0.1555633544921875, 0.17490386962890625, 0.194244384765625, 0.21358489990234375, 0.2329254150390625, 0.25226593017578125, 0.2716064453125, 0.29094696044921875, 0.3102874755859375, 0.32962799072265625, 0.348968505859375, 0.36830902099609375, 0.3876495361328125, 0.40699005126953125, 0.42633056640625, 0.44567108154296875, 0.4650115966796875, 0.48435211181640625, 0.503692626953125, 0.5230331420898438, 0.5423736572265625, 0.5617141723632812, 0.5810546875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 9.0, 12.0, 17.0, 31.0, 54.0, 84.0, 111.0, 137.0, 130.0, 122.0, 106.0, 61.0, 35.0, 31.0, 24.0, 11.0, 9.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.198857307434082, -3.0600762367248535, -2.921294927597046, -2.7825136184692383, -2.6437325477600098, -2.5049514770507812, -2.3661701679229736, -2.227388858795166, -2.0886077880859375, -1.9498265981674194, -1.8110454082489014, -1.6722642183303833, -1.5334830284118652, -1.3947018384933472, -1.255920648574829, -1.117139458656311, -0.978358268737793, -0.8395770788192749, -0.7007958889007568, -0.5620146989822388, -0.4232335090637207, -0.28445231914520264, -0.14567112922668457, -0.006889939308166504, 0.13189125061035156, 0.27067244052886963, 0.4094536304473877, 0.5482348203659058, 0.6870160102844238, 0.8257972002029419, 0.96457839012146, 1.103359580039978, 1.242140293121338, 1.380921483039856, 1.519702672958374, 1.658483862876892, 1.7972650527954102, 1.9360462427139282, 2.0748274326324463, 2.213608741760254, 2.3523898124694824, 2.491170883178711, 2.6299521923065186, 2.768733501434326, 2.9075145721435547, 3.046295642852783, 3.185076951980591, 3.3238582611083984, 3.462639331817627, 3.6014204025268555, 3.740201711654663, 3.8789830207824707, 4.017764091491699, 4.156545162200928, 4.295326232910156, 4.434107780456543, 4.5728888511657715, 4.711669921875, 4.850451469421387, 4.989232540130615, 5.128013610839844, 5.266794681549072, 5.405575752258301, 5.5443572998046875, 5.683138370513916]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 9.0, 4.0, 9.0, 5.0, 7.0, 15.0, 16.0, 12.0, 19.0, 21.0, 34.0, 21.0, 26.0, 42.0, 34.0, 39.0, 45.0, 38.0, 38.0, 52.0, 39.0, 39.0, 44.0, 38.0, 42.0, 44.0, 35.0, 24.0, 33.0, 22.0, 30.0, 17.0, 20.0, 17.0, 12.0, 10.0, 11.0, 7.0, 3.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0], "bins": [-2.0705385208129883, -2.0139200687408447, -1.9573014974594116, -1.900683045387268, -1.844064474105835, -1.7874460220336914, -1.7308274507522583, -1.6742089986801147, -1.6175904273986816, -1.560971975326538, -1.504353404045105, -1.4477349519729614, -1.3911163806915283, -1.3344979286193848, -1.2778793573379517, -1.221260905265808, -1.164642333984375, -1.1080238819122314, -1.0514053106307983, -0.99478679895401, -0.9381682872772217, -0.8815498352050781, -0.824931263923645, -0.7683128118515015, -0.7116943597793579, -0.6550758481025696, -0.5984573364257812, -0.5418388247489929, -0.4852203130722046, -0.42860183119773865, -0.3719833195209503, -0.315364807844162, -0.25874626636505127, -0.20212775468826294, -0.1455092430114746, -0.08889074623584747, -0.03227223455905914, 0.024346262216567993, 0.08096477389335632, 0.13758328557014465, 0.19420179724693298, 0.2508203089237213, 0.30743882060050964, 0.3640573024749756, 0.4206758141517639, 0.47729432582855225, 0.5339128375053406, 0.5905313491821289, 0.6471498608589172, 0.7037683725357056, 0.7603868842124939, 0.8170053958892822, 0.8736239075660706, 0.9302424192428589, 0.9868608713150024, 1.0434794425964355, 1.100097894668579, 1.1567163467407227, 1.2133349180221558, 1.2699533700942993, 1.3265719413757324, 1.383190393447876, 1.439808964729309, 1.4964274168014526, 1.5530459880828857]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 10.0, 23.0, 22.0, 29.0, 39.0, 78.0, 104.0, 132.0, 228.0, 329.0, 543.0, 970.0, 1476.0, 2451.0, 4113.0, 7023.0, 11828.0, 20595.0, 35713.0, 62053.0, 102763.0, 157048.0, 193805.0, 167764.0, 114289.0, 69529.0, 39847.0, 22944.0, 13450.0, 7746.0, 4460.0, 2648.0, 1660.0, 988.0, 637.0, 422.0, 266.0, 185.0, 100.0, 90.0, 43.0, 26.0, 33.0, 17.0, 12.0, 10.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.255615234375, -0.24800872802734375, -0.2404022216796875, -0.23279571533203125, -0.225189208984375, -0.21758270263671875, -0.2099761962890625, -0.20236968994140625, -0.19476318359375, -0.18715667724609375, -0.1795501708984375, -0.17194366455078125, -0.164337158203125, -0.15673065185546875, -0.1491241455078125, -0.14151763916015625, -0.1339111328125, -0.12630462646484375, -0.1186981201171875, -0.11109161376953125, -0.103485107421875, -0.09587860107421875, -0.0882720947265625, -0.08066558837890625, -0.07305908203125, -0.06545257568359375, -0.0578460693359375, -0.05023956298828125, -0.042633056640625, -0.03502655029296875, -0.0274200439453125, -0.01981353759765625, -0.01220703125, -0.00460052490234375, 0.0030059814453125, 0.01061248779296875, 0.018218994140625, 0.02582550048828125, 0.0334320068359375, 0.04103851318359375, 0.04864501953125, 0.05625152587890625, 0.0638580322265625, 0.07146453857421875, 0.079071044921875, 0.08667755126953125, 0.0942840576171875, 0.10189056396484375, 0.1094970703125, 0.11710357666015625, 0.1247100830078125, 0.13231658935546875, 0.139923095703125, 0.14752960205078125, 0.1551361083984375, 0.16274261474609375, 0.17034912109375, 0.17795562744140625, 0.1855621337890625, 0.19316864013671875, 0.200775146484375, 0.20838165283203125, 0.2159881591796875, 0.22359466552734375, 0.231201171875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 2.0, 9.0, 6.0, 13.0, 5.0, 13.0, 8.0, 23.0, 20.0, 29.0, 28.0, 20.0, 24.0, 22.0, 37.0, 46.0, 40.0, 51.0, 45.0, 60.0, 42.0, 42.0, 48.0, 37.0, 37.0, 36.0, 28.0, 27.0, 22.0, 27.0, 24.0, 20.0, 23.0, 12.0, 12.0, 6.0, 11.0, 12.0, 7.0, 4.0, 4.0, 3.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.355712890625, -0.3458404541015625, -0.335968017578125, -0.3260955810546875, -0.31622314453125, -0.3063507080078125, -0.296478271484375, -0.2866058349609375, -0.2767333984375, -0.2668609619140625, -0.256988525390625, -0.2471160888671875, -0.23724365234375, -0.2273712158203125, -0.217498779296875, -0.2076263427734375, -0.19775390625, -0.1878814697265625, -0.178009033203125, -0.1681365966796875, -0.15826416015625, -0.1483917236328125, -0.138519287109375, -0.1286468505859375, -0.1187744140625, -0.1089019775390625, -0.099029541015625, -0.0891571044921875, -0.07928466796875, -0.0694122314453125, -0.059539794921875, -0.0496673583984375, -0.039794921875, -0.0299224853515625, -0.020050048828125, -0.0101776123046875, -0.00030517578125, 0.0095672607421875, 0.019439697265625, 0.0293121337890625, 0.0391845703125, 0.0490570068359375, 0.058929443359375, 0.0688018798828125, 0.07867431640625, 0.0885467529296875, 0.098419189453125, 0.1082916259765625, 0.1181640625, 0.1280364990234375, 0.137908935546875, 0.1477813720703125, 0.15765380859375, 0.1675262451171875, 0.177398681640625, 0.1872711181640625, 0.1971435546875, 0.2070159912109375, 0.216888427734375, 0.2267608642578125, 0.23663330078125, 0.2465057373046875, 0.256378173828125, 0.2662506103515625, 0.276123046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 6.0, 8.0, 8.0, 13.0, 36.0, 41.0, 62.0, 102.0, 167.0, 294.0, 481.0, 821.0, 1414.0, 2440.0, 4574.0, 8359.0, 15850.0, 30605.0, 59382.0, 110658.0, 190895.0, 261811.0, 165314.0, 92421.0, 48374.0, 25325.0, 13213.0, 7086.0, 3713.0, 2104.0, 1188.0, 695.0, 418.0, 237.0, 162.0, 90.0, 61.0, 41.0, 26.0, 26.0, 14.0, 4.0, 5.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24365234375, -0.23505783081054688, -0.22646331787109375, -0.21786880493164062, -0.2092742919921875, -0.20067977905273438, -0.19208526611328125, -0.18349075317382812, -0.174896240234375, -0.16630172729492188, -0.15770721435546875, -0.14911270141601562, -0.1405181884765625, -0.13192367553710938, -0.12332916259765625, -0.11473464965820312, -0.10614013671875, -0.09754562377929688, -0.08895111083984375, -0.08035659790039062, -0.0717620849609375, -0.06316757202148438, -0.05457305908203125, -0.045978546142578125, -0.037384033203125, -0.028789520263671875, -0.02019500732421875, -0.011600494384765625, -0.0030059814453125, 0.005588531494140625, 0.01418304443359375, 0.022777557373046875, 0.0313720703125, 0.039966583251953125, 0.04856109619140625, 0.057155609130859375, 0.0657501220703125, 0.07434463500976562, 0.08293914794921875, 0.09153366088867188, 0.100128173828125, 0.10872268676757812, 0.11731719970703125, 0.12591171264648438, 0.1345062255859375, 0.14310073852539062, 0.15169525146484375, 0.16028976440429688, 0.16888427734375, 0.17747879028320312, 0.18607330322265625, 0.19466781616210938, 0.2032623291015625, 0.21185684204101562, 0.22045135498046875, 0.22904586791992188, 0.237640380859375, 0.24623489379882812, 0.25482940673828125, 0.2634239196777344, 0.2720184326171875, 0.2806129455566406, 0.28920745849609375, 0.2978019714355469, 0.306396484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 7.0, 6.0, 7.0, 9.0, 11.0, 16.0, 21.0, 24.0, 24.0, 24.0, 26.0, 30.0, 35.0, 43.0, 31.0, 29.0, 46.0, 49.0, 39.0, 46.0, 41.0, 33.0, 36.0, 46.0, 38.0, 30.0, 34.0, 37.0, 26.0, 25.0, 19.0, 16.0, 22.0, 13.0, 15.0, 10.0, 9.0, 3.0, 4.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81982421875, -0.7932357788085938, -0.7666473388671875, -0.7400588989257812, -0.713470458984375, -0.6868820190429688, -0.6602935791015625, -0.6337051391601562, -0.60711669921875, -0.5805282592773438, -0.5539398193359375, -0.5273513793945312, -0.500762939453125, -0.47417449951171875, -0.4475860595703125, -0.42099761962890625, -0.3944091796875, -0.36782073974609375, -0.3412322998046875, -0.31464385986328125, -0.288055419921875, -0.26146697998046875, -0.2348785400390625, -0.20829010009765625, -0.18170166015625, -0.15511322021484375, -0.1285247802734375, -0.10193634033203125, -0.075347900390625, -0.04875946044921875, -0.0221710205078125, 0.00441741943359375, 0.031005859375, 0.05759429931640625, 0.0841827392578125, 0.11077117919921875, 0.137359619140625, 0.16394805908203125, 0.1905364990234375, 0.21712493896484375, 0.24371337890625, 0.27030181884765625, 0.2968902587890625, 0.32347869873046875, 0.350067138671875, 0.37665557861328125, 0.4032440185546875, 0.42983245849609375, 0.4564208984375, 0.48300933837890625, 0.5095977783203125, 0.5361862182617188, 0.562774658203125, 0.5893630981445312, 0.6159515380859375, 0.6425399780273438, 0.66912841796875, 0.6957168579101562, 0.7223052978515625, 0.7488937377929688, 0.775482177734375, 0.8020706176757812, 0.8286590576171875, 0.8552474975585938, 0.8818359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 5.0, 8.0, 14.0, 20.0, 27.0, 49.0, 77.0, 109.0, 193.0, 338.0, 531.0, 920.0, 1580.0, 3004.0, 5326.0, 10571.0, 21009.0, 43107.0, 89487.0, 174100.0, 302363.0, 195240.0, 101246.0, 49334.0, 24025.0, 11954.0, 6199.0, 3348.0, 1807.0, 1033.0, 613.0, 344.0, 204.0, 138.0, 75.0, 58.0, 34.0, 19.0, 13.0, 9.0, 10.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.0863037109375, -0.08373451232910156, -0.08116531372070312, -0.07859611511230469, -0.07602691650390625, -0.07345771789550781, -0.07088851928710938, -0.06831932067871094, -0.0657501220703125, -0.06318092346191406, -0.060611724853515625, -0.05804252624511719, -0.05547332763671875, -0.05290412902832031, -0.050334930419921875, -0.04776573181152344, -0.045196533203125, -0.04262733459472656, -0.040058135986328125, -0.03748893737792969, -0.03491973876953125, -0.03235054016113281, -0.029781341552734375, -0.027212142944335938, -0.0246429443359375, -0.022073745727539062, -0.019504547119140625, -0.016935348510742188, -0.01436614990234375, -0.011796951293945312, -0.009227752685546875, -0.0066585540771484375, -0.00408935546875, -0.0015201568603515625, 0.001049041748046875, 0.0036182403564453125, 0.00618743896484375, 0.008756637573242188, 0.011325836181640625, 0.013895034790039062, 0.0164642333984375, 0.019033432006835938, 0.021602630615234375, 0.024171829223632812, 0.02674102783203125, 0.029310226440429688, 0.031879425048828125, 0.03444862365722656, 0.037017822265625, 0.03958702087402344, 0.042156219482421875, 0.04472541809082031, 0.04729461669921875, 0.04986381530761719, 0.052433013916015625, 0.05500221252441406, 0.0575714111328125, 0.06014060974121094, 0.06270980834960938, 0.06527900695800781, 0.06784820556640625, 0.07041740417480469, 0.07298660278320312, 0.07555580139160156, 0.078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 7.0, 8.0, 9.0, 12.0, 15.0, 13.0, 21.0, 21.0, 28.0, 40.0, 45.0, 44.0, 51.0, 59.0, 74.0, 64.0, 70.0, 56.0, 65.0, 49.0, 38.0, 37.0, 24.0, 26.0, 21.0, 19.0, 16.0, 12.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.075599670410156e-05, -2.978462725877762e-05, -2.8813257813453674e-05, -2.784188836812973e-05, -2.6870518922805786e-05, -2.5899149477481842e-05, -2.4927780032157898e-05, -2.3956410586833954e-05, -2.298504114151001e-05, -2.2013671696186066e-05, -2.104230225086212e-05, -2.0070932805538177e-05, -1.9099563360214233e-05, -1.812819391489029e-05, -1.7156824469566345e-05, -1.61854550242424e-05, -1.5214085578918457e-05, -1.4242716133594513e-05, -1.3271346688270569e-05, -1.2299977242946625e-05, -1.132860779762268e-05, -1.0357238352298737e-05, -9.385868906974792e-06, -8.414499461650848e-06, -7.443130016326904e-06, -6.47176057100296e-06, -5.500391125679016e-06, -4.529021680355072e-06, -3.557652235031128e-06, -2.586282789707184e-06, -1.6149133443832397e-06, -6.435438990592957e-07, 3.2782554626464844e-07, 1.2991949915885925e-06, 2.2705644369125366e-06, 3.2419338822364807e-06, 4.213303327560425e-06, 5.184672772884369e-06, 6.156042218208313e-06, 7.127411663532257e-06, 8.098781108856201e-06, 9.070150554180145e-06, 1.004151999950409e-05, 1.1012889444828033e-05, 1.1984258890151978e-05, 1.2955628335475922e-05, 1.3926997780799866e-05, 1.489836722612381e-05, 1.5869736671447754e-05, 1.6841106116771698e-05, 1.7812475562095642e-05, 1.8783845007419586e-05, 1.975521445274353e-05, 2.0726583898067474e-05, 2.169795334339142e-05, 2.2669322788715363e-05, 2.3640692234039307e-05, 2.461206167936325e-05, 2.5583431124687195e-05, 2.655480057001114e-05, 2.7526170015335083e-05, 2.8497539460659027e-05, 2.946890890598297e-05, 3.0440278351306915e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 0.0, 4.0, 6.0, 3.0, 21.0, 14.0, 26.0, 51.0, 62.0, 99.0, 122.0, 171.0, 326.0, 482.0, 824.0, 1400.0, 2385.0, 4502.0, 8369.0, 16581.0, 34178.0, 71138.0, 144588.0, 283685.0, 235741.0, 124244.0, 60090.0, 28780.0, 14112.0, 7141.0, 3880.0, 2188.0, 1309.0, 765.0, 449.0, 270.0, 167.0, 146.0, 72.0, 43.0, 31.0, 30.0, 16.0, 17.0, 10.0, 5.0, 5.0, 8.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0809326171875, -0.07803058624267578, -0.07512855529785156, -0.07222652435302734, -0.06932449340820312, -0.0664224624633789, -0.06352043151855469, -0.06061840057373047, -0.05771636962890625, -0.05481433868408203, -0.05191230773925781, -0.049010276794433594, -0.046108245849609375, -0.043206214904785156, -0.04030418395996094, -0.03740215301513672, -0.0345001220703125, -0.03159809112548828, -0.028696060180664062, -0.025794029235839844, -0.022891998291015625, -0.019989967346191406, -0.017087936401367188, -0.014185905456542969, -0.01128387451171875, -0.008381843566894531, -0.0054798126220703125, -0.0025777816772460938, 0.000324249267578125, 0.0032262802124023438, 0.0061283111572265625, 0.009030342102050781, 0.011932373046875, 0.014834403991699219, 0.017736434936523438, 0.020638465881347656, 0.023540496826171875, 0.026442527770996094, 0.029344558715820312, 0.03224658966064453, 0.03514862060546875, 0.03805065155029297, 0.04095268249511719, 0.043854713439941406, 0.046756744384765625, 0.049658775329589844, 0.05256080627441406, 0.05546283721923828, 0.0583648681640625, 0.06126689910888672, 0.06416893005371094, 0.06707096099853516, 0.06997299194335938, 0.0728750228881836, 0.07577705383300781, 0.07867908477783203, 0.08158111572265625, 0.08448314666748047, 0.08738517761230469, 0.0902872085571289, 0.09318923950195312, 0.09609127044677734, 0.09899330139160156, 0.10189533233642578, 0.10479736328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 2.0, 8.0, 7.0, 11.0, 13.0, 13.0, 22.0, 22.0, 18.0, 34.0, 33.0, 51.0, 46.0, 66.0, 64.0, 85.0, 81.0, 59.0, 72.0, 48.0, 44.0, 38.0, 25.0, 30.0, 24.0, 14.0, 10.0, 9.0, 8.0, 13.0, 7.0, 3.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.146484375, -0.1417407989501953, -0.13699722290039062, -0.13225364685058594, -0.12751007080078125, -0.12276649475097656, -0.11802291870117188, -0.11327934265136719, -0.1085357666015625, -0.10379219055175781, -0.09904861450195312, -0.09430503845214844, -0.08956146240234375, -0.08481788635253906, -0.08007431030273438, -0.07533073425292969, -0.070587158203125, -0.06584358215332031, -0.061100006103515625, -0.05635643005371094, -0.05161285400390625, -0.04686927795410156, -0.042125701904296875, -0.03738212585449219, -0.0326385498046875, -0.027894973754882812, -0.023151397705078125, -0.018407821655273438, -0.01366424560546875, -0.008920669555664062, -0.004177093505859375, 0.0005664825439453125, 0.00531005859375, 0.010053634643554688, 0.014797210693359375, 0.019540786743164062, 0.02428436279296875, 0.029027938842773438, 0.033771514892578125, 0.03851509094238281, 0.0432586669921875, 0.04800224304199219, 0.052745819091796875, 0.05748939514160156, 0.06223297119140625, 0.06697654724121094, 0.07172012329101562, 0.07646369934082031, 0.081207275390625, 0.08595085144042969, 0.09069442749023438, 0.09543800354003906, 0.10018157958984375, 0.10492515563964844, 0.10966873168945312, 0.11441230773925781, 0.1191558837890625, 0.12389945983886719, 0.12864303588867188, 0.13338661193847656, 0.13813018798828125, 0.14287376403808594, 0.14761734008789062, 0.1523609161376953, 0.1571044921875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 8.0, 16.0, 25.0, 27.0, 78.0, 94.0, 144.0, 147.0, 156.0, 131.0, 70.0, 42.0, 15.0, 14.0, 12.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.242569923400879, -4.136033535003662, -4.029497146606445, -3.9229609966278076, -3.81642484664917, -3.709888458251953, -3.6033520698547363, -3.4968156814575195, -3.390279531478882, -3.283743143081665, -3.1772069931030273, -3.0706706047058105, -2.9641342163085938, -2.857598066329956, -2.7510616779327393, -2.6445255279541016, -2.5379891395568848, -2.431452751159668, -2.3249166011810303, -2.2183802127838135, -2.111844062805176, -2.005307674407959, -1.8987712860107422, -1.792235016822815, -1.6856987476348877, -1.5791624784469604, -1.4726262092590332, -1.3660898208618164, -1.2595535516738892, -1.153017282485962, -1.0464808940887451, -0.9399446249008179, -0.8334083557128906, -0.7268720865249634, -0.6203357577323914, -0.5137994289398193, -0.4072631597518921, -0.30072689056396484, -0.19419056177139282, -0.0876542329788208, 0.018882036209106445, 0.12541833519935608, 0.2319546341896057, 0.33849093317985535, 0.445027232170105, 0.5515635013580322, 0.6580998301506042, 0.7646361589431763, 0.8711724281311035, 0.9777086973190308, 1.084244966506958, 1.1907813549041748, 1.297317624092102, 1.4038538932800293, 1.510390281677246, 1.6169265508651733, 1.7234628200531006, 1.8299990892410278, 1.936535358428955, 2.043071746826172, 2.1496081352233887, 2.2561442852020264, 2.362680673599243, 2.469216823577881, 2.5757532119750977]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 10.0, 9.0, 9.0, 13.0, 17.0, 23.0, 28.0, 24.0, 27.0, 27.0, 36.0, 35.0, 32.0, 51.0, 40.0, 38.0, 48.0, 56.0, 39.0, 42.0, 41.0, 44.0, 34.0, 41.0, 40.0, 30.0, 24.0, 26.0, 14.0, 18.0, 11.0, 14.0, 6.0, 6.0, 5.0, 6.0, 3.0, 6.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.02490234375, -1.95806884765625, -1.8912352323532104, -1.8244017362594604, -1.757568120956421, -1.690734624862671, -1.623901128768921, -1.5570675134658813, -1.4902338981628418, -1.4234004020690918, -1.3565667867660522, -1.2897332906723022, -1.2228996753692627, -1.1560661792755127, -1.0892326831817627, -1.0223990678787231, -0.9555655717849731, -0.8887320160865784, -0.8218984603881836, -0.7550649642944336, -0.688231348991394, -0.621397852897644, -0.5545642971992493, -0.4877307415008545, -0.4208971858024597, -0.35406363010406494, -0.28723007440567017, -0.22039654850959778, -0.153562992811203, -0.08672943711280823, -0.01989591121673584, 0.046937644481658936, 0.11377120018005371, 0.1806047558784485, 0.24743829667568207, 0.31427183747291565, 0.3811053931713104, 0.4479389488697052, 0.5147724747657776, 0.5816060304641724, 0.6484395861625671, 0.7152731418609619, 0.7821066975593567, 0.8489402532577515, 0.9157737493515015, 0.982607364654541, 1.049440860748291, 1.116274356842041, 1.1831079721450806, 1.2499414682388306, 1.3167750835418701, 1.3836085796356201, 1.4504421949386597, 1.5172756910324097, 1.5841093063354492, 1.6509428024291992, 1.7177762985229492, 1.7846097946166992, 1.8514434099197388, 1.9182769060134888, 1.9851105213165283, 2.0519440174102783, 2.1187775135040283, 2.1856112480163574, 2.2524447441101074]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 4.0, 15.0, 17.0, 17.0, 23.0, 37.0, 58.0, 92.0, 97.0, 165.0, 261.0, 363.0, 598.0, 979.0, 1497.0, 2540.0, 4596.0, 9220.0, 21067.0, 54434.0, 162076.0, 442834.0, 912075.0, 1168746.0, 819447.0, 373995.0, 135724.0, 46654.0, 17874.0, 8025.0, 4253.0, 2458.0, 1450.0, 871.0, 586.0, 364.0, 245.0, 172.0, 97.0, 72.0, 70.0, 38.0, 26.0, 18.0, 13.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.328857421875, -0.3187141418457031, -0.30857086181640625, -0.2984275817871094, -0.2882843017578125, -0.2781410217285156, -0.26799774169921875, -0.2578544616699219, -0.247711181640625, -0.23756790161132812, -0.22742462158203125, -0.21728134155273438, -0.2071380615234375, -0.19699478149414062, -0.18685150146484375, -0.17670822143554688, -0.16656494140625, -0.15642166137695312, -0.14627838134765625, -0.13613510131835938, -0.1259918212890625, -0.11584854125976562, -0.10570526123046875, -0.09556198120117188, -0.085418701171875, -0.07527542114257812, -0.06513214111328125, -0.054988861083984375, -0.0448455810546875, -0.034702301025390625, -0.02455902099609375, -0.014415740966796875, -0.0042724609375, 0.005870819091796875, 0.01601409912109375, 0.026157379150390625, 0.0363006591796875, 0.046443939208984375, 0.05658721923828125, 0.06673049926757812, 0.076873779296875, 0.08701705932617188, 0.09716033935546875, 0.10730361938476562, 0.1174468994140625, 0.12759017944335938, 0.13773345947265625, 0.14787673950195312, 0.15802001953125, 0.16816329956054688, 0.17830657958984375, 0.18844985961914062, 0.1985931396484375, 0.20873641967773438, 0.21887969970703125, 0.22902297973632812, 0.239166259765625, 0.24930953979492188, 0.25945281982421875, 0.2695960998535156, 0.2797393798828125, 0.2898826599121094, 0.30002593994140625, 0.3101692199707031, 0.3203125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 9.0, 11.0, 9.0, 15.0, 15.0, 17.0, 24.0, 20.0, 19.0, 28.0, 30.0, 44.0, 30.0, 45.0, 52.0, 40.0, 42.0, 53.0, 37.0, 42.0, 49.0, 37.0, 37.0, 30.0, 45.0, 42.0, 25.0, 22.0, 16.0, 14.0, 16.0, 10.0, 19.0, 8.0, 10.0, 13.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2496337890625, -0.24025535583496094, -0.23087692260742188, -0.2214984893798828, -0.21212005615234375, -0.2027416229248047, -0.19336318969726562, -0.18398475646972656, -0.1746063232421875, -0.16522789001464844, -0.15584945678710938, -0.1464710235595703, -0.13709259033203125, -0.1277141571044922, -0.11833572387695312, -0.10895729064941406, -0.099578857421875, -0.09020042419433594, -0.08082199096679688, -0.07144355773925781, -0.06206512451171875, -0.05268669128417969, -0.043308258056640625, -0.03392982482910156, -0.0245513916015625, -0.015172958374023438, -0.005794525146484375, 0.0035839080810546875, 0.01296234130859375, 0.022340774536132812, 0.031719207763671875, 0.04109764099121094, 0.05047607421875, 0.05985450744628906, 0.06923294067382812, 0.07861137390136719, 0.08798980712890625, 0.09736824035644531, 0.10674667358398438, 0.11612510681152344, 0.1255035400390625, 0.13488197326660156, 0.14426040649414062, 0.1536388397216797, 0.16301727294921875, 0.1723957061767578, 0.18177413940429688, 0.19115257263183594, 0.200531005859375, 0.20990943908691406, 0.21928787231445312, 0.2286663055419922, 0.23804473876953125, 0.2474231719970703, 0.2568016052246094, 0.26618003845214844, 0.2755584716796875, 0.28493690490722656, 0.2943153381347656, 0.3036937713623047, 0.31307220458984375, 0.3224506378173828, 0.3318290710449219, 0.34120750427246094, 0.3505859375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 8.0, 13.0, 20.0, 27.0, 28.0, 59.0, 77.0, 119.0, 162.0, 259.0, 391.0, 627.0, 1024.0, 1720.0, 3259.0, 6819.0, 16631.0, 51844.0, 216994.0, 1263039.0, 2101204.0, 401786.0, 84791.0, 24844.0, 9251.0, 4139.0, 2136.0, 1158.0, 675.0, 421.0, 261.0, 162.0, 102.0, 59.0, 51.0, 36.0, 25.0, 15.0, 10.0, 11.0, 3.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.48291015625, -0.46691131591796875, -0.4509124755859375, -0.43491363525390625, -0.418914794921875, -0.40291595458984375, -0.3869171142578125, -0.37091827392578125, -0.35491943359375, -0.33892059326171875, -0.3229217529296875, -0.30692291259765625, -0.290924072265625, -0.27492523193359375, -0.2589263916015625, -0.24292755126953125, -0.2269287109375, -0.21092987060546875, -0.1949310302734375, -0.17893218994140625, -0.162933349609375, -0.14693450927734375, -0.1309356689453125, -0.11493682861328125, -0.09893798828125, -0.08293914794921875, -0.0669403076171875, -0.05094146728515625, -0.034942626953125, -0.01894378662109375, -0.0029449462890625, 0.01305389404296875, 0.029052734375, 0.04505157470703125, 0.0610504150390625, 0.07704925537109375, 0.093048095703125, 0.10904693603515625, 0.1250457763671875, 0.14104461669921875, 0.15704345703125, 0.17304229736328125, 0.1890411376953125, 0.20503997802734375, 0.221038818359375, 0.23703765869140625, 0.2530364990234375, 0.26903533935546875, 0.2850341796875, 0.30103302001953125, 0.3170318603515625, 0.33303070068359375, 0.349029541015625, 0.36502838134765625, 0.3810272216796875, 0.39702606201171875, 0.41302490234375, 0.42902374267578125, 0.4450225830078125, 0.46102142333984375, 0.477020263671875, 0.49301910400390625, 0.5090179443359375, 0.5250167846679688, 0.541015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 3.0, 12.0, 13.0, 19.0, 26.0, 38.0, 55.0, 80.0, 112.0, 179.0, 264.0, 341.0, 437.0, 520.0, 464.0, 408.0, 336.0, 231.0, 137.0, 101.0, 78.0, 56.0, 54.0, 47.0, 16.0, 10.0, 19.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7880859375, -0.7640838623046875, -0.740081787109375, -0.7160797119140625, -0.69207763671875, -0.6680755615234375, -0.644073486328125, -0.6200714111328125, -0.5960693359375, -0.5720672607421875, -0.548065185546875, -0.5240631103515625, -0.50006103515625, -0.4760589599609375, -0.452056884765625, -0.4280548095703125, -0.404052734375, -0.3800506591796875, -0.356048583984375, -0.3320465087890625, -0.30804443359375, -0.2840423583984375, -0.260040283203125, -0.2360382080078125, -0.2120361328125, -0.1880340576171875, -0.164031982421875, -0.1400299072265625, -0.11602783203125, -0.0920257568359375, -0.068023681640625, -0.0440216064453125, -0.02001953125, 0.0039825439453125, 0.027984619140625, 0.0519866943359375, 0.07598876953125, 0.0999908447265625, 0.123992919921875, 0.1479949951171875, 0.1719970703125, 0.1959991455078125, 0.220001220703125, 0.2440032958984375, 0.26800537109375, 0.2920074462890625, 0.316009521484375, 0.3400115966796875, 0.364013671875, 0.3880157470703125, 0.412017822265625, 0.4360198974609375, 0.46002197265625, 0.4840240478515625, 0.508026123046875, 0.5320281982421875, 0.5560302734375, 0.5800323486328125, 0.604034423828125, 0.6280364990234375, 0.65203857421875, 0.6760406494140625, 0.700042724609375, 0.7240447998046875, 0.748046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 8.0, 14.0, 23.0, 37.0, 64.0, 84.0, 122.0, 134.0, 152.0, 103.0, 81.0, 59.0, 34.0, 17.0, 10.0, 18.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.480592727661133, -4.240296840667725, -4.000000476837158, -3.75970458984375, -3.519408702850342, -3.2791125774383545, -3.038816452026367, -2.798520565032959, -2.5582244396209717, -2.3179283142089844, -2.077632427215576, -1.8373363018035889, -1.5970402956008911, -1.3567442893981934, -1.116448163986206, -0.8761521577835083, -0.6358561515808105, -0.3955601155757904, -0.15526407957077026, 0.08503198623657227, 0.32532799243927, 0.5656239986419678, 0.8059201240539551, 1.0462161302566528, 1.2865121364593506, 1.5268081426620483, 1.767104148864746, 2.0074002742767334, 2.2476963996887207, 2.487992286682129, 2.728288412094116, 2.9685845375061035, 3.2088804244995117, 3.449176549911499, 3.6894724369049072, 3.9297685623168945, 4.170064449310303, 4.410360336303711, 4.650656700134277, 4.8909525871276855, 5.131248474121094, 5.371544361114502, 5.611840724945068, 5.852136611938477, 6.092432498931885, 6.332728385925293, 6.573024749755859, 6.813320636749268, 7.053617000579834, 7.293912887573242, 7.534209251403809, 7.774505138397217, 8.014801025390625, 8.255097389221191, 8.495393753051758, 8.735689163208008, 8.975985527038574, 9.21628189086914, 9.45657730102539, 9.696873664855957, 9.937170028686523, 10.177465438842773, 10.41776180267334, 10.658058166503906, 10.898353576660156]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 14.0, 11.0, 17.0, 22.0, 25.0, 28.0, 33.0, 32.0, 38.0, 48.0, 48.0, 45.0, 46.0, 57.0, 48.0, 49.0, 40.0, 57.0, 43.0, 49.0, 36.0, 44.0, 28.0, 22.0, 19.0, 19.0, 21.0, 13.0, 10.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.3806939125061035, -3.2845141887664795, -3.1883344650268555, -3.0921547412872314, -2.9959750175476074, -2.8997952938079834, -2.8036155700683594, -2.7074358463287354, -2.6112561225891113, -2.5150763988494873, -2.4188966751098633, -2.3227169513702393, -2.2265372276306152, -2.130357503890991, -2.034177780151367, -1.9379980564117432, -1.8418183326721191, -1.7456386089324951, -1.649458885192871, -1.553279161453247, -1.457099437713623, -1.360919713973999, -1.264739990234375, -1.168560266494751, -1.072380542755127, -0.9762008190155029, -0.8800210952758789, -0.7838413715362549, -0.6876616477966309, -0.5914819240570068, -0.4953022003173828, -0.3991224765777588, -0.30294275283813477, -0.20676302909851074, -0.11058330535888672, -0.014403581619262695, 0.08177614212036133, 0.17795586585998535, 0.2741355895996094, 0.3703153133392334, 0.4664950370788574, 0.5626747608184814, 0.6588544845581055, 0.7550342082977295, 0.8512139320373535, 0.9473936557769775, 1.0435733795166016, 1.1397531032562256, 1.2359328269958496, 1.3321125507354736, 1.4282922744750977, 1.5244719982147217, 1.6206517219543457, 1.7168314456939697, 1.8130111694335938, 1.9091908931732178, 2.005370616912842, 2.101550340652466, 2.19773006439209, 2.293909788131714, 2.390089511871338, 2.486269235610962, 2.582448959350586, 2.67862868309021, 2.774808406829834]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 8.0, 10.0, 19.0, 20.0, 28.0, 42.0, 47.0, 59.0, 77.0, 139.0, 209.0, 255.0, 421.0, 610.0, 918.0, 1472.0, 2348.0, 4094.0, 7971.0, 16673.0, 39611.0, 109596.0, 300710.0, 340174.0, 134493.0, 47882.0, 19640.0, 8987.0, 4846.0, 2638.0, 1548.0, 947.0, 628.0, 461.0, 278.0, 220.0, 144.0, 110.0, 56.0, 44.0, 35.0, 22.0, 20.0, 11.0, 12.0, 9.0, 5.0, 3.0, 2.0, 0.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.29541015625, -0.2862052917480469, -0.27700042724609375, -0.2677955627441406, -0.2585906982421875, -0.24938583374023438, -0.24018096923828125, -0.23097610473632812, -0.221771240234375, -0.21256637573242188, -0.20336151123046875, -0.19415664672851562, -0.1849517822265625, -0.17574691772460938, -0.16654205322265625, -0.15733718872070312, -0.14813232421875, -0.13892745971679688, -0.12972259521484375, -0.12051773071289062, -0.1113128662109375, -0.10210800170898438, -0.09290313720703125, -0.08369827270507812, -0.074493408203125, -0.06528854370117188, -0.05608367919921875, -0.046878814697265625, -0.0376739501953125, -0.028469085693359375, -0.01926422119140625, -0.010059356689453125, -0.0008544921875, 0.008350372314453125, 0.01755523681640625, 0.026760101318359375, 0.0359649658203125, 0.045169830322265625, 0.05437469482421875, 0.06357955932617188, 0.072784423828125, 0.08198928833007812, 0.09119415283203125, 0.10039901733398438, 0.1096038818359375, 0.11880874633789062, 0.12801361083984375, 0.13721847534179688, 0.14642333984375, 0.15562820434570312, 0.16483306884765625, 0.17403793334960938, 0.1832427978515625, 0.19244766235351562, 0.20165252685546875, 0.21085739135742188, 0.220062255859375, 0.22926712036132812, 0.23847198486328125, 0.24767684936523438, 0.2568817138671875, 0.2660865783691406, 0.27529144287109375, 0.2844963073730469, 0.293701171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 1.0, 6.0, 5.0, 8.0, 8.0, 9.0, 11.0, 21.0, 22.0, 19.0, 24.0, 35.0, 35.0, 32.0, 36.0, 37.0, 53.0, 36.0, 56.0, 45.0, 38.0, 45.0, 47.0, 42.0, 46.0, 43.0, 23.0, 28.0, 31.0, 26.0, 29.0, 16.0, 14.0, 16.0, 13.0, 12.0, 8.0, 8.0, 3.0, 7.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.444580078125, -0.43247222900390625, -0.4203643798828125, -0.40825653076171875, -0.396148681640625, -0.38404083251953125, -0.3719329833984375, -0.35982513427734375, -0.34771728515625, -0.33560943603515625, -0.3235015869140625, -0.31139373779296875, -0.299285888671875, -0.28717803955078125, -0.2750701904296875, -0.26296234130859375, -0.2508544921875, -0.23874664306640625, -0.2266387939453125, -0.21453094482421875, -0.202423095703125, -0.19031524658203125, -0.1782073974609375, -0.16609954833984375, -0.15399169921875, -0.14188385009765625, -0.1297760009765625, -0.11766815185546875, -0.105560302734375, -0.09345245361328125, -0.0813446044921875, -0.06923675537109375, -0.05712890625, -0.04502105712890625, -0.0329132080078125, -0.02080535888671875, -0.008697509765625, 0.00341033935546875, 0.0155181884765625, 0.02762603759765625, 0.03973388671875, 0.05184173583984375, 0.0639495849609375, 0.07605743408203125, 0.088165283203125, 0.10027313232421875, 0.1123809814453125, 0.12448883056640625, 0.1365966796875, 0.14870452880859375, 0.1608123779296875, 0.17292022705078125, 0.185028076171875, 0.19713592529296875, 0.2092437744140625, 0.22135162353515625, 0.23345947265625, 0.24556732177734375, 0.2576751708984375, 0.26978302001953125, 0.281890869140625, 0.29399871826171875, 0.3061065673828125, 0.31821441650390625, 0.330322265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 11.0, 15.0, 9.0, 15.0, 27.0, 42.0, 43.0, 83.0, 128.0, 227.0, 425.0, 797.0, 1521.0, 3308.0, 7021.0, 18218.0, 52956.0, 202322.0, 556519.0, 140149.0, 39437.0, 14115.0, 5693.0, 2678.0, 1234.0, 636.0, 386.0, 191.0, 122.0, 70.0, 47.0, 27.0, 22.0, 16.0, 17.0, 10.0, 10.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.306640625, -0.2971687316894531, -0.28769683837890625, -0.2782249450683594, -0.2687530517578125, -0.2592811584472656, -0.24980926513671875, -0.24033737182617188, -0.230865478515625, -0.22139358520507812, -0.21192169189453125, -0.20244979858398438, -0.1929779052734375, -0.18350601196289062, -0.17403411865234375, -0.16456222534179688, -0.15509033203125, -0.14561843872070312, -0.13614654541015625, -0.12667465209960938, -0.1172027587890625, -0.10773086547851562, -0.09825897216796875, -0.08878707885742188, -0.079315185546875, -0.06984329223632812, -0.06037139892578125, -0.050899505615234375, -0.0414276123046875, -0.031955718994140625, -0.02248382568359375, -0.013011932373046875, -0.0035400390625, 0.005931854248046875, 0.01540374755859375, 0.024875640869140625, 0.0343475341796875, 0.043819427490234375, 0.05329132080078125, 0.06276321411132812, 0.072235107421875, 0.08170700073242188, 0.09117889404296875, 0.10065078735351562, 0.1101226806640625, 0.11959457397460938, 0.12906646728515625, 0.13853836059570312, 0.14801025390625, 0.15748214721679688, 0.16695404052734375, 0.17642593383789062, 0.1858978271484375, 0.19536972045898438, 0.20484161376953125, 0.21431350708007812, 0.223785400390625, 0.23325729370117188, 0.24272918701171875, 0.2522010803222656, 0.2616729736328125, 0.2711448669433594, 0.28061676025390625, 0.2900886535644531, 0.299560546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 8.0, 12.0, 9.0, 11.0, 16.0, 14.0, 17.0, 20.0, 23.0, 23.0, 29.0, 30.0, 29.0, 37.0, 45.0, 50.0, 52.0, 53.0, 39.0, 48.0, 44.0, 40.0, 37.0, 32.0, 35.0, 23.0, 33.0, 26.0, 27.0, 20.0, 23.0, 15.0, 7.0, 10.0, 10.0, 6.0, 4.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.72119140625, -0.6980514526367188, -0.6749114990234375, -0.6517715454101562, -0.628631591796875, -0.6054916381835938, -0.5823516845703125, -0.5592117309570312, -0.53607177734375, -0.5129318237304688, -0.4897918701171875, -0.46665191650390625, -0.443511962890625, -0.42037200927734375, -0.3972320556640625, -0.37409210205078125, -0.3509521484375, -0.32781219482421875, -0.3046722412109375, -0.28153228759765625, -0.258392333984375, -0.23525238037109375, -0.2121124267578125, -0.18897247314453125, -0.16583251953125, -0.14269256591796875, -0.1195526123046875, -0.09641265869140625, -0.073272705078125, -0.05013275146484375, -0.0269927978515625, -0.00385284423828125, 0.019287109375, 0.04242706298828125, 0.0655670166015625, 0.08870697021484375, 0.111846923828125, 0.13498687744140625, 0.1581268310546875, 0.18126678466796875, 0.20440673828125, 0.22754669189453125, 0.2506866455078125, 0.27382659912109375, 0.296966552734375, 0.32010650634765625, 0.3432464599609375, 0.36638641357421875, 0.3895263671875, 0.41266632080078125, 0.4358062744140625, 0.45894622802734375, 0.482086181640625, 0.5052261352539062, 0.5283660888671875, 0.5515060424804688, 0.57464599609375, 0.5977859497070312, 0.6209259033203125, 0.6440658569335938, 0.667205810546875, 0.6903457641601562, 0.7134857177734375, 0.7366256713867188, 0.759765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 9.0, 20.0, 33.0, 69.0, 98.0, 178.0, 351.0, 868.0, 3024.0, 22908.0, 542618.0, 452030.0, 21634.0, 2945.0, 916.0, 365.0, 202.0, 114.0, 52.0, 38.0, 17.0, 15.0, 7.0, 5.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1932373046875, -0.1873798370361328, -0.18152236938476562, -0.17566490173339844, -0.16980743408203125, -0.16394996643066406, -0.15809249877929688, -0.1522350311279297, -0.1463775634765625, -0.1405200958251953, -0.13466262817382812, -0.12880516052246094, -0.12294769287109375, -0.11709022521972656, -0.11123275756835938, -0.10537528991699219, -0.099517822265625, -0.09366035461425781, -0.08780288696289062, -0.08194541931152344, -0.07608795166015625, -0.07023048400878906, -0.06437301635742188, -0.05851554870605469, -0.0526580810546875, -0.04680061340332031, -0.040943145751953125, -0.03508567810058594, -0.02922821044921875, -0.023370742797851562, -0.017513275146484375, -0.011655807495117188, -0.00579833984375, 5.91278076171875e-05, 0.005916595458984375, 0.011774063110351562, 0.01763153076171875, 0.023488998413085938, 0.029346466064453125, 0.03520393371582031, 0.0410614013671875, 0.04691886901855469, 0.052776336669921875, 0.05863380432128906, 0.06449127197265625, 0.07034873962402344, 0.07620620727539062, 0.08206367492675781, 0.087921142578125, 0.09377861022949219, 0.09963607788085938, 0.10549354553222656, 0.11135101318359375, 0.11720848083496094, 0.12306594848632812, 0.1289234161376953, 0.1347808837890625, 0.1406383514404297, 0.14649581909179688, 0.15235328674316406, 0.15821075439453125, 0.16406822204589844, 0.16992568969726562, 0.1757831573486328, 0.181640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 4.0, 8.0, 4.0, 5.0, 18.0, 9.0, 9.0, 13.0, 20.0, 20.0, 52.0, 44.0, 47.0, 55.0, 66.0, 60.0, 75.0, 72.0, 55.0, 82.0, 55.0, 42.0, 40.0, 32.0, 19.0, 28.0, 15.0, 16.0, 12.0, 5.0, 10.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8656253814697266e-05, -1.803971827030182e-05, -1.7423182725906372e-05, -1.6806647181510925e-05, -1.619011163711548e-05, -1.5573576092720032e-05, -1.4957040548324585e-05, -1.4340505003929138e-05, -1.3723969459533691e-05, -1.3107433915138245e-05, -1.2490898370742798e-05, -1.1874362826347351e-05, -1.1257827281951904e-05, -1.0641291737556458e-05, -1.002475619316101e-05, -9.408220648765564e-06, -8.791685104370117e-06, -8.17514955997467e-06, -7.558614015579224e-06, -6.942078471183777e-06, -6.32554292678833e-06, -5.709007382392883e-06, -5.0924718379974365e-06, -4.47593629360199e-06, -3.859400749206543e-06, -3.242865204811096e-06, -2.6263296604156494e-06, -2.0097941160202026e-06, -1.3932585716247559e-06, -7.767230272293091e-07, -1.601874828338623e-07, 4.5634806156158447e-07, 1.0728836059570312e-06, 1.689419150352478e-06, 2.305954694747925e-06, 2.9224902391433716e-06, 3.5390257835388184e-06, 4.155561327934265e-06, 4.772096872329712e-06, 5.388632416725159e-06, 6.0051679611206055e-06, 6.621703505516052e-06, 7.238239049911499e-06, 7.854774594306946e-06, 8.471310138702393e-06, 9.08784568309784e-06, 9.704381227493286e-06, 1.0320916771888733e-05, 1.093745231628418e-05, 1.1553987860679626e-05, 1.2170523405075073e-05, 1.278705894947052e-05, 1.3403594493865967e-05, 1.4020130038261414e-05, 1.463666558265686e-05, 1.5253201127052307e-05, 1.5869736671447754e-05, 1.64862722158432e-05, 1.7102807760238647e-05, 1.7719343304634094e-05, 1.833587884902954e-05, 1.8952414393424988e-05, 1.9568949937820435e-05, 2.018548548221588e-05, 2.0802021026611328e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 11.0, 5.0, 5.0, 17.0, 21.0, 19.0, 19.0, 42.0, 51.0, 72.0, 135.0, 195.0, 336.0, 761.0, 1849.0, 6169.0, 27898.0, 192569.0, 691087.0, 102717.0, 17328.0, 4244.0, 1580.0, 654.0, 316.0, 179.0, 98.0, 54.0, 38.0, 15.0, 19.0, 15.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22216796875, -0.216522216796875, -0.21087646484375, -0.205230712890625, -0.1995849609375, -0.193939208984375, -0.18829345703125, -0.182647705078125, -0.177001953125, -0.171356201171875, -0.16571044921875, -0.160064697265625, -0.1544189453125, -0.148773193359375, -0.14312744140625, -0.137481689453125, -0.1318359375, -0.126190185546875, -0.12054443359375, -0.114898681640625, -0.1092529296875, -0.103607177734375, -0.09796142578125, -0.092315673828125, -0.086669921875, -0.081024169921875, -0.07537841796875, -0.069732666015625, -0.0640869140625, -0.058441162109375, -0.05279541015625, -0.047149658203125, -0.04150390625, -0.035858154296875, -0.03021240234375, -0.024566650390625, -0.0189208984375, -0.013275146484375, -0.00762939453125, -0.001983642578125, 0.003662109375, 0.009307861328125, 0.01495361328125, 0.020599365234375, 0.0262451171875, 0.031890869140625, 0.03753662109375, 0.043182373046875, 0.048828125, 0.054473876953125, 0.06011962890625, 0.065765380859375, 0.0714111328125, 0.077056884765625, 0.08270263671875, 0.088348388671875, 0.093994140625, 0.099639892578125, 0.10528564453125, 0.110931396484375, 0.1165771484375, 0.122222900390625, 0.12786865234375, 0.133514404296875, 0.13916015625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 6.0, 11.0, 11.0, 32.0, 40.0, 64.0, 82.0, 149.0, 159.0, 169.0, 109.0, 53.0, 30.0, 38.0, 17.0, 9.0, 9.0, 6.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2484130859375, -0.24054527282714844, -0.23267745971679688, -0.2248096466064453, -0.21694183349609375, -0.2090740203857422, -0.20120620727539062, -0.19333839416503906, -0.1854705810546875, -0.17760276794433594, -0.16973495483398438, -0.1618671417236328, -0.15399932861328125, -0.1461315155029297, -0.13826370239257812, -0.13039588928222656, -0.122528076171875, -0.11466026306152344, -0.10679244995117188, -0.09892463684082031, -0.09105682373046875, -0.08318901062011719, -0.07532119750976562, -0.06745338439941406, -0.0595855712890625, -0.05171775817871094, -0.043849945068359375, -0.03598213195800781, -0.02811431884765625, -0.020246505737304688, -0.012378692626953125, -0.0045108795166015625, 0.00335693359375, 0.011224746704101562, 0.019092559814453125, 0.026960372924804688, 0.03482818603515625, 0.04269599914550781, 0.050563812255859375, 0.05843162536621094, 0.0662994384765625, 0.07416725158691406, 0.08203506469726562, 0.08990287780761719, 0.09777069091796875, 0.10563850402832031, 0.11350631713867188, 0.12137413024902344, 0.129241943359375, 0.13710975646972656, 0.14497756958007812, 0.1528453826904297, 0.16071319580078125, 0.1685810089111328, 0.17644882202148438, 0.18431663513183594, 0.1921844482421875, 0.20005226135253906, 0.20792007446289062, 0.2157878875732422, 0.22365570068359375, 0.2315235137939453, 0.23939132690429688, 0.24725914001464844, 0.255126953125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 3.0, 4.0, 8.0, 2.0, 11.0, 23.0, 51.0, 101.0, 156.0, 196.0, 201.0, 111.0, 66.0, 33.0, 22.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.291089057922363, -6.1569504737854, -6.022811412811279, -5.888672828674316, -5.754533767700195, -5.620395183563232, -5.486256122589111, -5.352117538452148, -5.217978477478027, -5.0838398933410645, -4.949700832366943, -4.8155622482299805, -4.681423187255859, -4.5472846031188965, -4.413145542144775, -4.2790069580078125, -4.14486837387085, -4.010729789733887, -3.8765907287597656, -3.7424519062042236, -3.6083130836486816, -3.4741744995117188, -3.3400356769561768, -3.2058968544006348, -3.0717580318450928, -2.937619209289551, -2.803480386734009, -2.669341564178467, -2.535202980041504, -2.401063919067383, -2.26692533493042, -2.132786512374878, -1.9986474514007568, -1.8645086288452148, -1.7303698062896729, -1.5962311029434204, -1.4620922803878784, -1.3279534578323364, -1.193814754486084, -1.059675931930542, -0.925537109375, -0.791398286819458, -0.6572595238685608, -0.5231207609176636, -0.3889819383621216, -0.2548431158065796, -0.12070435285568237, 0.013434410095214844, 0.14757323265075684, 0.28171202540397644, 0.41585081815719604, 0.5499895811080933, 0.6841284036636353, 0.8182672262191772, 0.9524059891700745, 1.0865447521209717, 1.2206835746765137, 1.3548223972320557, 1.4889612197875977, 1.62309992313385, 1.757238745689392, 1.891377568244934, 2.0255162715911865, 2.1596550941467285, 2.2937939167022705]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 6.0, 6.0, 10.0, 9.0, 16.0, 11.0, 12.0, 20.0, 19.0, 15.0, 25.0, 38.0, 30.0, 32.0, 40.0, 55.0, 61.0, 53.0, 73.0, 61.0, 45.0, 40.0, 40.0, 41.0, 34.0, 29.0, 27.0, 14.0, 20.0, 17.0, 20.0, 18.0, 9.0, 6.0, 7.0, 12.0, 7.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-2.58965802192688, -2.516345977783203, -2.4430336952209473, -2.3697216510772705, -2.2964093685150146, -2.223097324371338, -2.149785041809082, -2.0764729976654053, -2.0031609535217285, -1.9298487901687622, -1.856536626815796, -1.7832244634628296, -1.7099123001098633, -1.6366002559661865, -1.5632880926132202, -1.489975929260254, -1.416663646697998, -1.3433514833450317, -1.2700393199920654, -1.1967271566390991, -1.1234149932861328, -1.050102949142456, -0.9767907857894897, -0.9034786224365234, -0.8301664590835571, -0.7568542957305908, -0.6835421323776245, -0.610230028629303, -0.5369178652763367, -0.46360570192337036, -0.39029356837272644, -0.3169814348220825, -0.2436692714691162, -0.1703571230173111, -0.09704497456550598, -0.023732826113700867, 0.04957932233810425, 0.12289148569107056, 0.19620361924171448, 0.2695157527923584, 0.3428279161453247, 0.416140079498291, 0.48945221304893494, 0.5627643465995789, 0.6360765099525452, 0.7093886733055115, 0.782700777053833, 0.8560129404067993, 0.9293251037597656, 1.002637267112732, 1.0759494304656982, 1.1492615938186646, 1.2225737571716309, 1.2958858013153076, 1.369197964668274, 1.4425101280212402, 1.5158222913742065, 1.5891344547271729, 1.6624466180801392, 1.7357587814331055, 1.8090708255767822, 1.882383108139038, 1.9556951522827148, 2.0290074348449707, 2.1023194789886475]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 4.0, 6.0, 11.0, 8.0, 7.0, 13.0, 9.0, 18.0, 21.0, 28.0, 26.0, 26.0, 46.0, 86.0, 227.0, 157.0, 63.0, 37.0, 22.0, 22.0, 25.0, 15.0, 17.0, 18.0, 17.0, 13.0, 8.0, 8.0, 10.0, 8.0, 3.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.467041015625, -0.4528350830078125, -0.438629150390625, -0.4244232177734375, -0.41021728515625, -0.3960113525390625, -0.381805419921875, -0.3675994873046875, -0.3533935546875, -0.3391876220703125, -0.324981689453125, -0.3107757568359375, -0.29656982421875, -0.2823638916015625, -0.268157958984375, -0.2539520263671875, -0.23974609375, -0.2255401611328125, -0.211334228515625, -0.1971282958984375, -0.18292236328125, -0.1687164306640625, -0.154510498046875, -0.1403045654296875, -0.1260986328125, -0.1118927001953125, -0.097686767578125, -0.0834808349609375, -0.06927490234375, -0.0550689697265625, -0.040863037109375, -0.0266571044921875, -0.012451171875, 0.0017547607421875, 0.015960693359375, 0.0301666259765625, 0.04437255859375, 0.0585784912109375, 0.072784423828125, 0.0869903564453125, 0.1011962890625, 0.1154022216796875, 0.129608154296875, 0.1438140869140625, 0.15802001953125, 0.1722259521484375, 0.186431884765625, 0.2006378173828125, 0.21484375, 0.2290496826171875, 0.243255615234375, 0.2574615478515625, 0.27166748046875, 0.2858734130859375, 0.300079345703125, 0.3142852783203125, 0.3284912109375, 0.3426971435546875, 0.356903076171875, 0.3711090087890625, 0.38531494140625, 0.3995208740234375, 0.413726806640625, 0.4279327392578125, 0.442138671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 8.0, 10.0, 4.0, 7.0, 9.0, 13.0, 20.0, 25.0, 33.0, 38.0, 82.0, 102.0, 192.0, 351.0, 515.0, 889.0, 1848.0, 4271.0, 12277.0, 80936.0, 8233709.0, 37565.0, 8900.0, 3390.0, 1497.0, 779.0, 430.0, 249.0, 145.0, 94.0, 53.0, 39.0, 32.0, 17.0, 14.0, 17.0, 9.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5548295974731445, -1.5095940828323364, -1.4643585681915283, -1.4191230535507202, -1.373887538909912, -1.3286519050598145, -1.283416509628296, -1.2381808757781982, -1.1929453611373901, -1.147709846496582, -1.102474331855774, -1.0572388172149658, -1.0120033025741577, -0.9667677283287048, -0.9215322136878967, -0.8762966394424438, -0.8310611844062805, -0.7858256697654724, -0.7405901551246643, -0.6953545808792114, -0.6501190662384033, -0.6048835515975952, -0.5596480369567871, -0.514412522315979, -0.4691769778728485, -0.4239414632320404, -0.3787059187889099, -0.3334704041481018, -0.2882348895072937, -0.2429993450641632, -0.1977638304233551, -0.1525282859802246, -0.1072927713394165, -0.0620572455227375, -0.016821719706058502, 0.0284138023853302, 0.0736493319272995, 0.1188848614692688, 0.1641203761100769, 0.2093559205532074, 0.2545914351940155, 0.2998269498348236, 0.3450624942779541, 0.3902980089187622, 0.4355335235595703, 0.4807690680027008, 0.5260045528411865, 0.5712401270866394, 0.6164756417274475, 0.6617111563682556, 0.7069466710090637, 0.7521822452545166, 0.7974177598953247, 0.8426532745361328, 0.8878887891769409, 0.933124303817749, 0.9783598184585571, 1.0235953330993652, 1.0688308477401733, 1.1140663623809814, 1.1593018770217896, 1.2045373916625977, 1.2497730255126953, 1.2950085401535034, 1.3402440547943115]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 4.0, 8.0, 5.0, 6.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 5.0, 1.0, 3.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5159432888031006, -1.45436429977417, -1.3927853107452393, -1.3312063217163086, -1.269627332687378, -1.2080483436584473, -1.1464693546295166, -1.084890365600586, -1.0233113765716553, -0.9617323875427246, -0.900153398513794, -0.8385744094848633, -0.7769954204559326, -0.715416431427002, -0.6538373827934265, -0.5922583937644958, -0.5306793451309204, -0.46910035610198975, -0.4075213670730591, -0.34594234824180603, -0.28436335921287537, -0.2227843701839447, -0.16120535135269165, -0.09962636232376099, -0.03804737329483032, 0.02353162318468094, 0.0851106196641922, 0.14668962359428406, 0.20826861262321472, 0.2698476016521454, 0.33142662048339844, 0.3930056095123291, 0.45458459854125977, 0.5161635875701904, 0.5777425765991211, 0.6393215656280518, 0.7009005546569824, 0.7624795436859131, 0.8240585923194885, 0.8856375813484192, 0.9472165703773499, 1.0087956190109253, 1.070374608039856, 1.1319535970687866, 1.1935325860977173, 1.255111575126648, 1.3166905641555786, 1.3782695531845093, 1.43984854221344, 1.5014275312423706, 1.5630065202713013, 1.624585509300232, 1.6861644983291626, 1.7477434873580933, 1.8093225955963135, 1.8709015846252441, 1.9324805736541748, 1.9940595626831055, 2.055638551712036, 2.117217540740967, 2.1787965297698975, 2.240375518798828, 2.301954507827759, 2.3635334968566895, 2.42511248588562]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 6.0, 8.0, 9.0, 10.0, 14.0, 14.0, 27.0, 18.0, 26.0, 28.0, 35.0, 47.0, 40.0, 55.0, 42.0, 77.0, 62.0, 54.0, 49.0, 58.0, 47.0, 45.0, 36.0, 36.0, 39.0, 22.0, 26.0, 16.0, 9.0, 13.0, 7.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19189453125, -0.18624114990234375, -0.1805877685546875, -0.17493438720703125, -0.169281005859375, -0.16362762451171875, -0.1579742431640625, -0.15232086181640625, -0.14666748046875, -0.14101409912109375, -0.1353607177734375, -0.12970733642578125, -0.124053955078125, -0.11840057373046875, -0.1127471923828125, -0.10709381103515625, -0.1014404296875, -0.09578704833984375, -0.0901336669921875, -0.08448028564453125, -0.078826904296875, -0.07317352294921875, -0.0675201416015625, -0.06186676025390625, -0.05621337890625, -0.05055999755859375, -0.0449066162109375, -0.03925323486328125, -0.033599853515625, -0.02794647216796875, -0.0222930908203125, -0.01663970947265625, -0.010986328125, -0.00533294677734375, 0.0003204345703125, 0.00597381591796875, 0.011627197265625, 0.01728057861328125, 0.0229339599609375, 0.02858734130859375, 0.03424072265625, 0.03989410400390625, 0.0455474853515625, 0.05120086669921875, 0.056854248046875, 0.06250762939453125, 0.0681610107421875, 0.07381439208984375, 0.0794677734375, 0.08512115478515625, 0.0907745361328125, 0.09642791748046875, 0.102081298828125, 0.10773468017578125, 0.1133880615234375, 0.11904144287109375, 0.12469482421875, 0.13034820556640625, 0.1360015869140625, 0.14165496826171875, 0.147308349609375, 0.15296173095703125, 0.1586151123046875, 0.16426849365234375, 0.169921875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 4.0, 5.0, 11.0, 14.0, 8.0, 27.0, 24.0, 38.0, 53.0, 73.0, 105.0, 183.0, 302.0, 523.0, 917.0, 1619.0, 3259.0, 7113.0, 19453.0, 74186.0, 258972.0, 113656.0, 26010.0, 9030.0, 3943.0, 2053.0, 1089.0, 613.0, 386.0, 209.0, 131.0, 72.0, 57.0, 34.0, 22.0, 22.0, 11.0, 4.0, 5.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-6.4140625, -6.23895263671875, -6.0638427734375, -5.88873291015625, -5.713623046875, -5.53851318359375, -5.3634033203125, -5.18829345703125, -5.01318359375, -4.83807373046875, -4.6629638671875, -4.48785400390625, -4.312744140625, -4.13763427734375, -3.9625244140625, -3.78741455078125, -3.6123046875, -3.43719482421875, -3.2620849609375, -3.08697509765625, -2.911865234375, -2.73675537109375, -2.5616455078125, -2.38653564453125, -2.21142578125, -2.03631591796875, -1.8612060546875, -1.68609619140625, -1.510986328125, -1.33587646484375, -1.1607666015625, -0.98565673828125, -0.810546875, -0.63543701171875, -0.4603271484375, -0.28521728515625, -0.110107421875, 0.06500244140625, 0.2401123046875, 0.41522216796875, 0.59033203125, 0.76544189453125, 0.9405517578125, 1.11566162109375, 1.290771484375, 1.46588134765625, 1.6409912109375, 1.81610107421875, 1.9912109375, 2.16632080078125, 2.3414306640625, 2.51654052734375, 2.691650390625, 2.86676025390625, 3.0418701171875, 3.21697998046875, 3.39208984375, 3.56719970703125, 3.7423095703125, 3.91741943359375, 4.092529296875, 4.26763916015625, 4.4427490234375, 4.61785888671875, 4.79296875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 8.0, 10.0, 13.0, 11.0, 15.0, 27.0, 37.0, 46.0, 42.0, 41.0, 54.0, 71.0, 73.0, 63.0, 58.0, 48.0, 62.0, 43.0, 41.0, 37.0, 35.0, 33.0, 34.0, 20.0, 12.0, 14.0, 16.0, 13.0, 7.0, 9.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-0.62158203125, -0.6067695617675781, -0.5919570922851562, -0.5771446228027344, -0.5623321533203125, -0.5475196838378906, -0.5327072143554688, -0.5178947448730469, -0.503082275390625, -0.4882698059082031, -0.47345733642578125, -0.4586448669433594, -0.4438323974609375, -0.4290199279785156, -0.41420745849609375, -0.3993949890136719, -0.38458251953125, -0.3697700500488281, -0.35495758056640625, -0.3401451110839844, -0.3253326416015625, -0.3105201721191406, -0.29570770263671875, -0.2808952331542969, -0.266082763671875, -0.2512702941894531, -0.23645782470703125, -0.22164535522460938, -0.2068328857421875, -0.19202041625976562, -0.17720794677734375, -0.16239547729492188, -0.1475830078125, -0.13277053833007812, -0.11795806884765625, -0.10314559936523438, -0.0883331298828125, -0.07352066040039062, -0.05870819091796875, -0.043895721435546875, -0.029083251953125, -0.014270782470703125, 0.00054168701171875, 0.015354156494140625, 0.0301666259765625, 0.044979095458984375, 0.05979156494140625, 0.07460403442382812, 0.08941650390625, 0.10422897338867188, 0.11904144287109375, 0.13385391235351562, 0.1486663818359375, 0.16347885131835938, 0.17829132080078125, 0.19310379028320312, 0.207916259765625, 0.22272872924804688, 0.23754119873046875, 0.2523536682128906, 0.2671661376953125, 0.2819786071777344, 0.29679107666015625, 0.3116035461425781, 0.326416015625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 2.0, 2.0, 11.0, 5.0, 8.0, 15.0, 20.0, 23.0, 20.0, 43.0, 48.0, 43.0, 50.0, 48.0, 37.0, 28.0, 20.0, 12.0, 2.0, 11.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5814498662948608, -1.5361655950546265, -1.490881323814392, -1.4455970525741577, -1.4003127813339233, -1.3550283908843994, -1.309744119644165, -1.2644598484039307, -1.2191755771636963, -1.173891305923462, -1.1286070346832275, -1.0833227634429932, -1.0380384922027588, -0.9927541613578796, -0.9474698901176453, -0.9021855592727661, -0.8569013476371765, -0.8116170763969421, -0.7663328051567078, -0.7210484743118286, -0.6757642030715942, -0.6304799318313599, -0.5851956605911255, -0.5399113893508911, -0.49462708830833435, -0.4493428170681, -0.4040585160255432, -0.35877424478530884, -0.31348997354507446, -0.2682056725025177, -0.22292140126228333, -0.17763710021972656, -0.1323528289794922, -0.08706854283809662, -0.04178426414728165, 0.003500014543533325, 0.048784300684928894, 0.09406858682632446, 0.13935285806655884, 0.1846371591091156, 0.22992143034934998, 0.27520570158958435, 0.3204900026321411, 0.3657742738723755, 0.41105854511260986, 0.4563428461551666, 0.5016270875930786, 0.5469114184379578, 0.5921956896781921, 0.6374799609184265, 0.6827642321586609, 0.72804856300354, 0.7733328342437744, 0.8186171054840088, 0.8639013767242432, 0.9091856479644775, 0.9544699192047119, 0.9997541904449463, 1.0450384616851807, 1.090322732925415, 1.1356070041656494, 1.1808912754058838, 1.2261755466461182, 1.271459937095642, 1.3167442083358765]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 4.0, 7.0, 6.0, 3.0, 11.0, 14.0, 24.0, 32.0, 100.0, 128.0, 63.0, 15.0, 17.0, 5.0, 8.0, 7.0, 7.0, 8.0, 4.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9290261268615723, -1.8523635864257812, -1.7757010459899902, -1.6990385055541992, -1.6223760843276978, -1.5457135438919067, -1.4690510034561157, -1.3923885822296143, -1.3157260417938232, -1.2390635013580322, -1.1624009609222412, -1.0857384204864502, -1.0090759992599487, -0.9324134588241577, -0.8557509183883667, -0.7790884375572205, -0.7024258375167847, -0.6257632970809937, -0.5491008162498474, -0.4724382758140564, -0.39577576518058777, -0.31911325454711914, -0.24245071411132812, -0.16578823328018188, -0.08912569284439087, -0.012463174760341644, 0.06419934332370758, 0.1408618688583374, 0.21752437949180603, 0.29418689012527466, 0.3708494305610657, 0.4475119113922119, 0.5241744518280029, 0.600836992263794, 0.6774994730949402, 0.7541620135307312, 0.8308244943618774, 0.9074870347976685, 0.9841495752334595, 1.060811996459961, 1.137474536895752, 1.214137077331543, 1.290799617767334, 1.367462158203125, 1.4441245794296265, 1.5207871198654175, 1.5974496603012085, 1.67411208152771, 1.7507747411727905, 1.8274372816085815, 1.9040998220443726, 1.980762243270874, 2.057424783706665, 2.134087324142456, 2.210749864578247, 2.287412405014038, 2.364074945449829, 2.44073748588562, 2.517400026321411, 2.594062566757202, 2.670725107192993, 2.747387409210205, 2.824049949645996, 2.900712490081787, 2.977375030517578]}, "eval/loss": 1.8705445528030396, "eval/bleu": 4.138692653029469e-15, "eval/runtime": 2629.971, "eval/samples_per_second": 5.612, "eval/steps_per_second": 0.702} \ No newline at end of file +{"train/loss": 1.2244, "train/learning_rate": 5.965596330275229e-05, "train/epoch": 2.47, "train/global_step": 4000, "_runtime": 57477, "_timestamp": 1651829775, "_step": 4007, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 24.0, 94.0, 252.0, 347.0, 198.0, 79.0, 16.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6888464093208313, -0.5959274172782898, -0.5030084252357483, -0.4100894629955292, -0.31717047095298767, -0.22425147891044617, -0.13133251667022705, -0.03841352462768555, 0.05450546741485596, 0.14742445945739746, 0.24034343659877777, 0.3332624137401581, 0.4261814057826996, 0.5191004276275635, 0.6120193600654602, 0.7049383521080017, 0.7978573441505432, 0.8907763361930847, 0.9836953282356262, 1.076614260673523, 1.1695332527160645, 1.262452244758606, 1.3553712368011475, 1.448290228843689, 1.5412092208862305, 1.634128212928772, 1.7270472049713135, 1.819966197013855, 1.9128851890563965, 2.0058040618896484, 2.0987231731414795, 2.1916420459747314, 2.2845609188079834, 2.3774797916412354, 2.4703989028930664, 2.5633177757263184, 2.6562368869781494, 2.7491557598114014, 2.8420748710632324, 2.9349937438964844, 3.0279128551483154, 3.1208317279815674, 3.2137508392333984, 3.3066697120666504, 3.3995888233184814, 3.4925076961517334, 3.5854268074035645, 3.6783456802368164, 3.7712645530700684, 3.8641834259033203, 3.9571025371551514, 4.050021648406982, 4.142940521240234, 4.235859394073486, 4.328778266906738, 4.421697616577148, 4.5146164894104, 4.607535362243652, 4.700454235076904, 4.7933735847473145, 4.886292457580566, 4.979211330413818, 5.07213020324707, 5.1650495529174805, 5.257968425750732]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 6.0, 6.0, 9.0, 12.0, 11.0, 13.0, 11.0, 25.0, 22.0, 17.0, 23.0, 23.0, 23.0, 26.0, 27.0, 37.0, 42.0, 36.0, 51.0, 45.0, 38.0, 33.0, 44.0, 50.0, 36.0, 36.0, 23.0, 35.0, 36.0, 31.0, 23.0, 17.0, 26.0, 18.0, 17.0, 13.0, 11.0, 8.0, 6.0, 6.0, 9.0, 5.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.7953662872314453, -0.772705614566803, -0.7500450015068054, -0.7273843288421631, -0.7047237157821655, -0.6820630431175232, -0.6594023704528809, -0.6367417573928833, -0.614081084728241, -0.5914204120635986, -0.5687597990036011, -0.5460991263389587, -0.5234384536743164, -0.5007778406143188, -0.4781171679496765, -0.45545652508735657, -0.4327958822250366, -0.4101352393627167, -0.38747459650039673, -0.3648139238357544, -0.34215328097343445, -0.3194926381111145, -0.29683196544647217, -0.2741713225841522, -0.2515106797218323, -0.22885003685951233, -0.2061893790960312, -0.18352872133255005, -0.1608680784702301, -0.13820743560791016, -0.11554677784442902, -0.09288612008094788, -0.07022547721862793, -0.047564826905727386, -0.024904176592826843, -0.0022435262799263, 0.020417124032974243, 0.043077774345874786, 0.06573842465877533, 0.08839908242225647, 0.11105972528457642, 0.13372036814689636, 0.1563810259103775, 0.17904168367385864, 0.2017023265361786, 0.22436296939849854, 0.24702362716197968, 0.2696842849254608, 0.29234492778778076, 0.3150055706501007, 0.33766621351242065, 0.360326886177063, 0.38298752903938293, 0.4056481719017029, 0.4283088445663452, 0.45096948742866516, 0.4736301302909851, 0.49629077315330505, 0.518951416015625, 0.5416120886802673, 0.5642727613449097, 0.5869333744049072, 0.6095940470695496, 0.6322547197341919, 0.6549153327941895]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 10.0, 8.0, 14.0, 14.0, 25.0, 39.0, 37.0, 77.0, 105.0, 159.0, 244.0, 403.0, 669.0, 1081.0, 2132.0, 3971.0, 7942.0, 17470.0, 41716.0, 111242.0, 332688.0, 1182498.0, 1739453.0, 494708.0, 155448.0, 57553.0, 23646.0, 10307.0, 4883.0, 2474.0, 1294.0, 731.0, 463.0, 269.0, 154.0, 108.0, 70.0, 58.0, 31.0, 27.0, 18.0, 14.0, 10.0, 8.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.892578125, -0.8639373779296875, -0.835296630859375, -0.8066558837890625, -0.77801513671875, -0.7493743896484375, -0.720733642578125, -0.6920928955078125, -0.6634521484375, -0.6348114013671875, -0.606170654296875, -0.5775299072265625, -0.54888916015625, -0.5202484130859375, -0.491607666015625, -0.4629669189453125, -0.434326171875, -0.4056854248046875, -0.377044677734375, -0.3484039306640625, -0.31976318359375, -0.2911224365234375, -0.262481689453125, -0.2338409423828125, -0.2052001953125, -0.1765594482421875, -0.147918701171875, -0.1192779541015625, -0.09063720703125, -0.0619964599609375, -0.033355712890625, -0.0047149658203125, 0.02392578125, 0.0525665283203125, 0.081207275390625, 0.1098480224609375, 0.13848876953125, 0.1671295166015625, 0.195770263671875, 0.2244110107421875, 0.2530517578125, 0.2816925048828125, 0.310333251953125, 0.3389739990234375, 0.36761474609375, 0.3962554931640625, 0.424896240234375, 0.4535369873046875, 0.482177734375, 0.5108184814453125, 0.539459228515625, 0.5680999755859375, 0.59674072265625, 0.6253814697265625, 0.654022216796875, 0.6826629638671875, 0.7113037109375, 0.7399444580078125, 0.768585205078125, 0.7972259521484375, 0.82586669921875, 0.8545074462890625, 0.883148193359375, 0.9117889404296875, 0.9404296875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 6.0, 5.0, 5.0, 4.0, 4.0, 10.0, 5.0, 14.0, 10.0, 18.0, 13.0, 14.0, 21.0, 23.0, 26.0, 27.0, 19.0, 36.0, 29.0, 52.0, 46.0, 31.0, 47.0, 37.0, 34.0, 31.0, 46.0, 39.0, 40.0, 37.0, 34.0, 33.0, 26.0, 23.0, 24.0, 19.0, 21.0, 18.0, 9.0, 13.0, 8.0, 11.0, 9.0, 8.0, 5.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-1.1201171875, -1.0888519287109375, -1.057586669921875, -1.0263214111328125, -0.99505615234375, -0.9637908935546875, -0.932525634765625, -0.9012603759765625, -0.8699951171875, -0.8387298583984375, -0.807464599609375, -0.7761993408203125, -0.74493408203125, -0.7136688232421875, -0.682403564453125, -0.6511383056640625, -0.619873046875, -0.5886077880859375, -0.557342529296875, -0.5260772705078125, -0.49481201171875, -0.4635467529296875, -0.432281494140625, -0.4010162353515625, -0.3697509765625, -0.3384857177734375, -0.307220458984375, -0.2759552001953125, -0.24468994140625, -0.2134246826171875, -0.182159423828125, -0.1508941650390625, -0.11962890625, -0.0883636474609375, -0.057098388671875, -0.0258331298828125, 0.00543212890625, 0.0366973876953125, 0.067962646484375, 0.0992279052734375, 0.1304931640625, 0.1617584228515625, 0.193023681640625, 0.2242889404296875, 0.25555419921875, 0.2868194580078125, 0.318084716796875, 0.3493499755859375, 0.380615234375, 0.4118804931640625, 0.443145751953125, 0.4744110107421875, 0.50567626953125, 0.5369415283203125, 0.568206787109375, 0.5994720458984375, 0.6307373046875, 0.6620025634765625, 0.693267822265625, 0.7245330810546875, 0.75579833984375, 0.7870635986328125, 0.818328857421875, 0.8495941162109375, 0.880859375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 13.0, 13.0, 27.0, 30.0, 78.0, 135.0, 309.0, 2570.0, 4189098.0, 1456.0, 276.0, 119.0, 64.0, 39.0, 24.0, 11.0, 5.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.96875, -33.2041015625, -32.439453125, -31.6748046875, -30.91015625, -30.1455078125, -29.380859375, -28.6162109375, -27.8515625, -27.0869140625, -26.322265625, -25.5576171875, -24.79296875, -24.0283203125, -23.263671875, -22.4990234375, -21.734375, -20.9697265625, -20.205078125, -19.4404296875, -18.67578125, -17.9111328125, -17.146484375, -16.3818359375, -15.6171875, -14.8525390625, -14.087890625, -13.3232421875, -12.55859375, -11.7939453125, -11.029296875, -10.2646484375, -9.5, -8.7353515625, -7.970703125, -7.2060546875, -6.44140625, -5.6767578125, -4.912109375, -4.1474609375, -3.3828125, -2.6181640625, -1.853515625, -1.0888671875, -0.32421875, 0.4404296875, 1.205078125, 1.9697265625, 2.734375, 3.4990234375, 4.263671875, 5.0283203125, 5.79296875, 6.5576171875, 7.322265625, 8.0869140625, 8.8515625, 9.6162109375, 10.380859375, 11.1455078125, 11.91015625, 12.6748046875, 13.439453125, 14.2041015625, 14.96875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 0.0, 0.0, 5.0, 2.0, 11.0, 20.0, 22.0, 29.0, 72.0, 104.0, 222.0, 683.0, 1707.0, 694.0, 246.0, 102.0, 70.0, 46.0, 19.0, 12.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.251953125, -1.2250328063964844, -1.1981124877929688, -1.1711921691894531, -1.1442718505859375, -1.1173515319824219, -1.0904312133789062, -1.0635108947753906, -1.036590576171875, -1.0096702575683594, -0.9827499389648438, -0.9558296203613281, -0.9289093017578125, -0.9019889831542969, -0.8750686645507812, -0.8481483459472656, -0.82122802734375, -0.7943077087402344, -0.7673873901367188, -0.7404670715332031, -0.7135467529296875, -0.6866264343261719, -0.6597061157226562, -0.6327857971191406, -0.605865478515625, -0.5789451599121094, -0.5520248413085938, -0.5251045227050781, -0.4981842041015625, -0.4712638854980469, -0.44434356689453125, -0.4174232482910156, -0.3905029296875, -0.3635826110839844, -0.33666229248046875, -0.3097419738769531, -0.2828216552734375, -0.2559013366699219, -0.22898101806640625, -0.20206069946289062, -0.175140380859375, -0.14822006225585938, -0.12129974365234375, -0.09437942504882812, -0.0674591064453125, -0.040538787841796875, -0.01361846923828125, 0.013301849365234375, 0.04022216796875, 0.06714248657226562, 0.09406280517578125, 0.12098312377929688, 0.1479034423828125, 0.17482376098632812, 0.20174407958984375, 0.22866439819335938, 0.255584716796875, 0.2825050354003906, 0.30942535400390625, 0.3363456726074219, 0.3632659912109375, 0.3901863098144531, 0.41710662841796875, 0.4440269470214844, 0.470947265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 10.0, 7.0, 10.0, 30.0, 26.0, 27.0, 38.0, 48.0, 65.0, 57.0, 71.0, 54.0, 63.0, 72.0, 83.0, 60.0, 58.0, 38.0, 34.0, 30.0, 17.0, 27.0, 19.0, 13.0, 16.0, 5.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.71454656124115, -1.6693570613861084, -1.624167561531067, -1.5789780616760254, -1.5337885618209839, -1.4885990619659424, -1.4434094429016113, -1.3982200622558594, -1.3530304431915283, -1.3078409433364868, -1.2626514434814453, -1.2174619436264038, -1.1722724437713623, -1.1270829439163208, -1.0818934440612793, -1.0367038249969482, -0.9915144443511963, -0.9463249444961548, -0.9011354446411133, -0.8559459447860718, -0.8107564449310303, -0.7655669450759888, -0.7203773856163025, -0.675187885761261, -0.6299983859062195, -0.584808886051178, -0.5396193861961365, -0.4944298565387726, -0.4492403566837311, -0.4040508568286896, -0.3588613271713257, -0.3136718273162842, -0.2684823274612427, -0.22329282760620117, -0.17810331284999847, -0.13291379809379578, -0.08772429823875427, -0.04253479838371277, 0.002654731273651123, 0.04784423112869263, 0.09303373098373413, 0.13822323083877563, 0.18341274559497833, 0.22860226035118103, 0.27379176020622253, 0.31898126006126404, 0.36417078971862793, 0.40936028957366943, 0.45454978942871094, 0.49973928928375244, 0.544928789138794, 0.5901182889938354, 0.635307788848877, 0.6804972887039185, 0.7256868481636047, 0.7708763480186462, 0.8160658478736877, 0.8612553477287292, 0.9064448475837708, 0.951634407043457, 0.9968239068984985, 1.04201340675354, 1.0872029066085815, 1.132392406463623, 1.1775819063186646]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 11.0, 7.0, 9.0, 7.0, 9.0, 18.0, 16.0, 7.0, 19.0, 19.0, 22.0, 18.0, 29.0, 24.0, 43.0, 29.0, 27.0, 36.0, 41.0, 36.0, 39.0, 46.0, 38.0, 32.0, 38.0, 43.0, 26.0, 39.0, 21.0, 25.0, 19.0, 24.0, 27.0, 24.0, 19.0, 16.0, 19.0, 11.0, 8.0, 8.0, 9.0, 4.0, 5.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 4.0], "bins": [-0.9740117788314819, -0.9452316761016846, -0.9164515733718872, -0.8876714706420898, -0.8588913679122925, -0.8301112651824951, -0.8013312220573425, -0.7725511193275452, -0.7437710165977478, -0.7149909138679504, -0.6862108111381531, -0.6574307084083557, -0.6286506652832031, -0.5998705625534058, -0.5710904598236084, -0.542310357093811, -0.5135302543640137, -0.4847501516342163, -0.45597004890441895, -0.42718997597694397, -0.3984098732471466, -0.36962977051734924, -0.34084969758987427, -0.3120695948600769, -0.28328949213027954, -0.2545093894004822, -0.225729301571846, -0.19694921374320984, -0.16816911101341248, -0.1393890082836151, -0.11060892045497894, -0.08182883262634277, -0.053048670291900635, -0.02426857501268387, 0.004511520266532898, 0.033291615545749664, 0.06207171082496643, 0.0908518135547638, 0.11963190138339996, 0.14841198921203613, 0.1771920919418335, 0.20597219467163086, 0.23475228250026703, 0.2635323703289032, 0.29231247305870056, 0.3210925757884979, 0.3498726487159729, 0.37865275144577026, 0.4074328541755676, 0.436212956905365, 0.46499305963516235, 0.49377313256263733, 0.5225532054901123, 0.5513333082199097, 0.580113410949707, 0.6088935136795044, 0.6376736164093018, 0.6664537191390991, 0.6952338218688965, 0.7240139245986938, 0.7527940273284912, 0.7815741300582886, 0.8103541731834412, 0.8391342759132385, 0.8679143786430359]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 17.0, 25.0, 45.0, 72.0, 138.0, 159.0, 304.0, 565.0, 862.0, 1481.0, 2527.0, 4569.0, 8251.0, 15390.0, 29799.0, 58352.0, 116939.0, 214371.0, 252580.0, 166948.0, 85006.0, 42379.0, 21701.0, 11490.0, 6209.0, 3422.0, 1952.0, 1215.0, 687.0, 438.0, 267.0, 143.0, 91.0, 63.0, 36.0, 20.0, 14.0, 8.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.314208984375, -0.30309295654296875, -0.2919769287109375, -0.28086090087890625, -0.269744873046875, -0.25862884521484375, -0.2475128173828125, -0.23639678955078125, -0.22528076171875, -0.21416473388671875, -0.2030487060546875, -0.19193267822265625, -0.180816650390625, -0.16970062255859375, -0.1585845947265625, -0.14746856689453125, -0.1363525390625, -0.12523651123046875, -0.1141204833984375, -0.10300445556640625, -0.091888427734375, -0.08077239990234375, -0.0696563720703125, -0.05854034423828125, -0.04742431640625, -0.03630828857421875, -0.0251922607421875, -0.01407623291015625, -0.002960205078125, 0.00815582275390625, 0.0192718505859375, 0.03038787841796875, 0.04150390625, 0.05261993408203125, 0.0637359619140625, 0.07485198974609375, 0.085968017578125, 0.09708404541015625, 0.1082000732421875, 0.11931610107421875, 0.13043212890625, 0.14154815673828125, 0.1526641845703125, 0.16378021240234375, 0.174896240234375, 0.18601226806640625, 0.1971282958984375, 0.20824432373046875, 0.2193603515625, 0.23047637939453125, 0.2415924072265625, 0.25270843505859375, 0.263824462890625, 0.27494049072265625, 0.2860565185546875, 0.29717254638671875, 0.30828857421875, 0.31940460205078125, 0.3305206298828125, 0.34163665771484375, 0.352752685546875, 0.36386871337890625, 0.3749847412109375, 0.38610076904296875, 0.397216796875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 8.0, 2.0, 4.0, 7.0, 8.0, 3.0, 6.0, 12.0, 6.0, 9.0, 17.0, 19.0, 18.0, 22.0, 27.0, 32.0, 31.0, 40.0, 35.0, 24.0, 34.0, 47.0, 45.0, 54.0, 40.0, 50.0, 56.0, 35.0, 39.0, 31.0, 30.0, 37.0, 32.0, 24.0, 20.0, 21.0, 16.0, 13.0, 13.0, 10.0, 9.0, 5.0, 7.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8203125, -0.7945022583007812, -0.7686920166015625, -0.7428817749023438, -0.717071533203125, -0.6912612915039062, -0.6654510498046875, -0.6396408081054688, -0.61383056640625, -0.5880203247070312, -0.5622100830078125, -0.5363998413085938, -0.510589599609375, -0.48477935791015625, -0.4589691162109375, -0.43315887451171875, -0.4073486328125, -0.38153839111328125, -0.3557281494140625, -0.32991790771484375, -0.304107666015625, -0.27829742431640625, -0.2524871826171875, -0.22667694091796875, -0.20086669921875, -0.17505645751953125, -0.1492462158203125, -0.12343597412109375, -0.097625732421875, -0.07181549072265625, -0.0460052490234375, -0.02019500732421875, 0.005615234375, 0.03142547607421875, 0.0572357177734375, 0.08304595947265625, 0.108856201171875, 0.13466644287109375, 0.1604766845703125, 0.18628692626953125, 0.21209716796875, 0.23790740966796875, 0.2637176513671875, 0.28952789306640625, 0.315338134765625, 0.34114837646484375, 0.3669586181640625, 0.39276885986328125, 0.4185791015625, 0.44438934326171875, 0.4701995849609375, 0.49600982666015625, 0.521820068359375, 0.5476303100585938, 0.5734405517578125, 0.5992507934570312, 0.62506103515625, 0.6508712768554688, 0.6766815185546875, 0.7024917602539062, 0.728302001953125, 0.7541122436523438, 0.7799224853515625, 0.8057327270507812, 0.83154296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 8.0, 13.0, 14.0, 24.0, 26.0, 39.0, 44.0, 63.0, 66.0, 136.0, 156.0, 232.0, 420.0, 790.0, 1515.0, 3516.0, 10149.0, 36092.0, 165408.0, 520174.0, 237856.0, 49998.0, 13159.0, 4482.0, 1841.0, 880.0, 495.0, 305.0, 180.0, 130.0, 92.0, 48.0, 52.0, 38.0, 35.0, 18.0, 18.0, 9.0, 10.0, 5.0, 8.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.62353515625, -0.6055221557617188, -0.5875091552734375, -0.5694961547851562, -0.551483154296875, -0.5334701538085938, -0.5154571533203125, -0.49744415283203125, -0.47943115234375, -0.46141815185546875, -0.4434051513671875, -0.42539215087890625, -0.407379150390625, -0.38936614990234375, -0.3713531494140625, -0.35334014892578125, -0.3353271484375, -0.31731414794921875, -0.2993011474609375, -0.28128814697265625, -0.263275146484375, -0.24526214599609375, -0.2272491455078125, -0.20923614501953125, -0.19122314453125, -0.17321014404296875, -0.1551971435546875, -0.13718414306640625, -0.119171142578125, -0.10115814208984375, -0.0831451416015625, -0.06513214111328125, -0.047119140625, -0.02910614013671875, -0.0110931396484375, 0.00691986083984375, 0.024932861328125, 0.04294586181640625, 0.0609588623046875, 0.07897186279296875, 0.09698486328125, 0.11499786376953125, 0.1330108642578125, 0.15102386474609375, 0.169036865234375, 0.18704986572265625, 0.2050628662109375, 0.22307586669921875, 0.2410888671875, 0.25910186767578125, 0.2771148681640625, 0.29512786865234375, 0.313140869140625, 0.33115386962890625, 0.3491668701171875, 0.36717987060546875, 0.38519287109375, 0.40320587158203125, 0.4212188720703125, 0.43923187255859375, 0.457244873046875, 0.47525787353515625, 0.4932708740234375, 0.5112838745117188, 0.529296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 9.0, 4.0, 9.0, 9.0, 11.0, 16.0, 17.0, 17.0, 24.0, 19.0, 20.0, 21.0, 21.0, 27.0, 27.0, 33.0, 45.0, 41.0, 35.0, 41.0, 47.0, 29.0, 30.0, 48.0, 35.0, 35.0, 39.0, 33.0, 36.0, 33.0, 30.0, 14.0, 16.0, 23.0, 16.0, 17.0, 9.0, 14.0, 8.0, 5.0, 14.0, 4.0, 5.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-1.7236328125, -1.6746368408203125, -1.625640869140625, -1.5766448974609375, -1.52764892578125, -1.4786529541015625, -1.429656982421875, -1.3806610107421875, -1.3316650390625, -1.2826690673828125, -1.233673095703125, -1.1846771240234375, -1.13568115234375, -1.0866851806640625, -1.037689208984375, -0.9886932373046875, -0.939697265625, -0.8907012939453125, -0.841705322265625, -0.7927093505859375, -0.74371337890625, -0.6947174072265625, -0.645721435546875, -0.5967254638671875, -0.5477294921875, -0.4987335205078125, -0.449737548828125, -0.4007415771484375, -0.35174560546875, -0.3027496337890625, -0.253753662109375, -0.2047576904296875, -0.15576171875, -0.1067657470703125, -0.057769775390625, -0.0087738037109375, 0.04022216796875, 0.0892181396484375, 0.138214111328125, 0.1872100830078125, 0.2362060546875, 0.2852020263671875, 0.334197998046875, 0.3831939697265625, 0.43218994140625, 0.4811859130859375, 0.530181884765625, 0.5791778564453125, 0.628173828125, 0.6771697998046875, 0.726165771484375, 0.7751617431640625, 0.82415771484375, 0.8731536865234375, 0.922149658203125, 0.9711456298828125, 1.0201416015625, 1.0691375732421875, 1.118133544921875, 1.1671295166015625, 1.21612548828125, 1.2651214599609375, 1.314117431640625, 1.3631134033203125, 1.412109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 10.0, 9.0, 12.0, 12.0, 11.0, 25.0, 35.0, 55.0, 64.0, 98.0, 158.0, 198.0, 261.0, 559.0, 879.0, 1499.0, 2693.0, 5330.0, 11860.0, 31066.0, 98851.0, 402956.0, 355242.0, 86886.0, 27496.0, 10896.0, 5066.0, 2541.0, 1398.0, 810.0, 506.0, 333.0, 223.0, 157.0, 93.0, 65.0, 46.0, 39.0, 28.0, 24.0, 19.0, 9.0, 7.0, 9.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.20751953125, -0.20035171508789062, -0.19318389892578125, -0.18601608276367188, -0.1788482666015625, -0.17168045043945312, -0.16451263427734375, -0.15734481811523438, -0.150177001953125, -0.14300918579101562, -0.13584136962890625, -0.12867355346679688, -0.1215057373046875, -0.11433792114257812, -0.10717010498046875, -0.10000228881835938, -0.09283447265625, -0.08566665649414062, -0.07849884033203125, -0.07133102416992188, -0.0641632080078125, -0.056995391845703125, -0.04982757568359375, -0.042659759521484375, -0.035491943359375, -0.028324127197265625, -0.02115631103515625, -0.013988494873046875, -0.0068206787109375, 0.000347137451171875, 0.00751495361328125, 0.014682769775390625, 0.0218505859375, 0.029018402099609375, 0.03618621826171875, 0.043354034423828125, 0.0505218505859375, 0.057689666748046875, 0.06485748291015625, 0.07202529907226562, 0.079193115234375, 0.08636093139648438, 0.09352874755859375, 0.10069656372070312, 0.1078643798828125, 0.11503219604492188, 0.12220001220703125, 0.12936782836914062, 0.13653564453125, 0.14370346069335938, 0.15087127685546875, 0.15803909301757812, 0.1652069091796875, 0.17237472534179688, 0.17954254150390625, 0.18671035766601562, 0.193878173828125, 0.20104598999023438, 0.20821380615234375, 0.21538162231445312, 0.2225494384765625, 0.22971725463867188, 0.23688507080078125, 0.24405288696289062, 0.251220703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 13.0, 15.0, 25.0, 28.0, 53.0, 62.0, 84.0, 117.0, 132.0, 120.0, 104.0, 68.0, 44.0, 32.0, 31.0, 17.0, 13.0, 9.0, 10.0, 4.0, 5.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.000247955322265625, -0.0002418775111436844, -0.00023579970002174377, -0.00022972188889980316, -0.00022364407777786255, -0.00021756626665592194, -0.00021148845553398132, -0.0002054106444120407, -0.0001993328332901001, -0.00019325502216815948, -0.00018717721104621887, -0.00018109939992427826, -0.00017502158880233765, -0.00016894377768039703, -0.00016286596655845642, -0.0001567881554365158, -0.0001507103443145752, -0.00014463253319263458, -0.00013855472207069397, -0.00013247691094875336, -0.00012639909982681274, -0.00012032128870487213, -0.00011424347758293152, -0.0001081656664609909, -0.00010208785533905029, -9.601004421710968e-05, -8.993223309516907e-05, -8.385442197322845e-05, -7.777661085128784e-05, -7.169879972934723e-05, -6.562098860740662e-05, -5.9543177485466003e-05, -5.346536636352539e-05, -4.738755524158478e-05, -4.1309744119644165e-05, -3.523193299770355e-05, -2.915412187576294e-05, -2.3076310753822327e-05, -1.6998499631881714e-05, -1.0920688509941101e-05, -4.842877388000488e-06, 1.2349337339401245e-06, 7.312744855880737e-06, 1.339055597782135e-05, 1.9468367099761963e-05, 2.5546178221702576e-05, 3.162398934364319e-05, 3.77018004655838e-05, 4.3779611587524414e-05, 4.985742270946503e-05, 5.593523383140564e-05, 6.201304495334625e-05, 6.809085607528687e-05, 7.416866719722748e-05, 8.024647831916809e-05, 8.63242894411087e-05, 9.240210056304932e-05, 9.847991168498993e-05, 0.00010455772280693054, 0.00011063553392887115, 0.00011671334505081177, 0.00012279115617275238, 0.000128868967294693, 0.0001349467784166336, 0.00014102458953857422]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 9.0, 6.0, 11.0, 11.0, 18.0, 18.0, 29.0, 33.0, 48.0, 64.0, 151.0, 413.0, 2131.0, 21239.0, 440240.0, 554175.0, 26528.0, 2519.0, 435.0, 155.0, 79.0, 44.0, 38.0, 22.0, 22.0, 21.0, 9.0, 23.0, 18.0, 7.0, 6.0, 6.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74462890625, -0.7220916748046875, -0.699554443359375, -0.6770172119140625, -0.65447998046875, -0.6319427490234375, -0.609405517578125, -0.5868682861328125, -0.5643310546875, -0.5417938232421875, -0.519256591796875, -0.4967193603515625, -0.47418212890625, -0.4516448974609375, -0.429107666015625, -0.4065704345703125, -0.384033203125, -0.3614959716796875, -0.338958740234375, -0.3164215087890625, -0.29388427734375, -0.2713470458984375, -0.248809814453125, -0.2262725830078125, -0.2037353515625, -0.1811981201171875, -0.158660888671875, -0.1361236572265625, -0.11358642578125, -0.0910491943359375, -0.068511962890625, -0.0459747314453125, -0.0234375, -0.0009002685546875, 0.021636962890625, 0.0441741943359375, 0.06671142578125, 0.0892486572265625, 0.111785888671875, 0.1343231201171875, 0.1568603515625, 0.1793975830078125, 0.201934814453125, 0.2244720458984375, 0.24700927734375, 0.2695465087890625, 0.292083740234375, 0.3146209716796875, 0.337158203125, 0.3596954345703125, 0.382232666015625, 0.4047698974609375, 0.42730712890625, 0.4498443603515625, 0.472381591796875, 0.4949188232421875, 0.5174560546875, 0.5399932861328125, 0.562530517578125, 0.5850677490234375, 0.60760498046875, 0.6301422119140625, 0.652679443359375, 0.6752166748046875, 0.69775390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 8.0, 5.0, 12.0, 13.0, 5.0, 19.0, 25.0, 23.0, 31.0, 32.0, 41.0, 45.0, 59.0, 83.0, 77.0, 87.0, 66.0, 60.0, 33.0, 48.0, 37.0, 22.0, 29.0, 26.0, 18.0, 20.0, 9.0, 15.0, 12.0, 9.0, 4.0, 7.0, 4.0, 1.0, 4.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0841064453125, -0.08164024353027344, -0.07917404174804688, -0.07670783996582031, -0.07424163818359375, -0.07177543640136719, -0.06930923461914062, -0.06684303283691406, -0.0643768310546875, -0.06191062927246094, -0.059444427490234375, -0.05697822570800781, -0.05451202392578125, -0.05204582214355469, -0.049579620361328125, -0.04711341857910156, -0.044647216796875, -0.04218101501464844, -0.039714813232421875, -0.03724861145019531, -0.03478240966796875, -0.03231620788574219, -0.029850006103515625, -0.027383804321289062, -0.0249176025390625, -0.022451400756835938, -0.019985198974609375, -0.017518997192382812, -0.01505279541015625, -0.012586593627929688, -0.010120391845703125, -0.0076541900634765625, -0.00518798828125, -0.0027217864990234375, -0.000255584716796875, 0.0022106170654296875, 0.00467681884765625, 0.0071430206298828125, 0.009609222412109375, 0.012075424194335938, 0.0145416259765625, 0.017007827758789062, 0.019474029541015625, 0.021940231323242188, 0.02440643310546875, 0.026872634887695312, 0.029338836669921875, 0.03180503845214844, 0.034271240234375, 0.03673744201660156, 0.039203643798828125, 0.04166984558105469, 0.04413604736328125, 0.04660224914550781, 0.049068450927734375, 0.05153465270996094, 0.0540008544921875, 0.05646705627441406, 0.058933258056640625, 0.06139945983886719, 0.06386566162109375, 0.06633186340332031, 0.06879806518554688, 0.07126426696777344, 0.07373046875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 4.0, 10.0, 12.0, 14.0, 28.0, 48.0, 46.0, 81.0, 76.0, 107.0, 99.0, 94.0, 95.0, 84.0, 50.0, 37.0, 35.0, 23.0, 16.0, 13.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.699026346206665, -1.6501072645187378, -1.6011881828308105, -1.5522691011428833, -1.503350019454956, -1.4544309377670288, -1.4055118560791016, -1.3565926551818848, -1.307673692703247, -1.2587546110153198, -1.2098355293273926, -1.1609164476394653, -1.111997365951538, -1.0630782842636108, -1.0141592025756836, -0.9652400612831116, -0.9163209199905396, -0.8674018383026123, -0.8184827566146851, -0.7695636749267578, -0.7206445932388306, -0.6717255115509033, -0.6228063702583313, -0.573887288570404, -0.5249682068824768, -0.47604912519454956, -0.4271300435066223, -0.3782109320163727, -0.32929185032844543, -0.2803727686405182, -0.23145365715026855, -0.1825345754623413, -0.1336156129837036, -0.08469652384519577, -0.03577743470668793, 0.013141661882400513, 0.06206074357032776, 0.110979825258255, 0.15989893674850464, 0.20881801843643188, 0.25773710012435913, 0.3066561818122864, 0.3555752635002136, 0.40449437499046326, 0.4534134566783905, 0.5023325681686401, 0.5512516498565674, 0.6001707315444946, 0.6490898132324219, 0.6980088949203491, 0.7469279766082764, 0.7958470582962036, 0.8447661399841309, 0.8936852216720581, 0.9426043629646301, 0.9915234446525574, 1.0404424667358398, 1.089361548423767, 1.1382806301116943, 1.1871997117996216, 1.2361187934875488, 1.285037875175476, 1.3339569568634033, 1.3828761577606201, 1.4317952394485474]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 4.0, 7.0, 8.0, 7.0, 8.0, 13.0, 14.0, 9.0, 21.0, 18.0, 20.0, 26.0, 29.0, 26.0, 32.0, 35.0, 31.0, 40.0, 34.0, 51.0, 40.0, 44.0, 38.0, 47.0, 54.0, 34.0, 36.0, 27.0, 34.0, 29.0, 31.0, 17.0, 16.0, 22.0, 15.0, 11.0, 11.0, 16.0, 8.0, 13.0, 4.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.7725748419761658, -0.7486474514007568, -0.7247201204299927, -0.7007927298545837, -0.6768653988838196, -0.6529380083084106, -0.6290106773376465, -0.6050832867622375, -0.5811558961868286, -0.5572285056114197, -0.5333011746406555, -0.5093737840652466, -0.48544642329216003, -0.4615190625190735, -0.43759170174598694, -0.4136643409729004, -0.38973698019981384, -0.3658096194267273, -0.34188225865364075, -0.3179548978805542, -0.29402750730514526, -0.2701001465320587, -0.24617278575897217, -0.22224541008472443, -0.19831804931163788, -0.17439068853855133, -0.1504633128643036, -0.12653595209121704, -0.1026085838675499, -0.07868121564388275, -0.054753854870796204, -0.030826479196548462, -0.006899118423461914, 0.01702824793756008, 0.04095561429858208, 0.06488297879695892, 0.08881034702062607, 0.11273771524429321, 0.13666507601737976, 0.1605924516916275, 0.18451981246471405, 0.2084471732378006, 0.23237454891204834, 0.2563019096851349, 0.28022927045822144, 0.30415666103363037, 0.32808399200439453, 0.35201138257980347, 0.37593874335289, 0.39986610412597656, 0.4237934648990631, 0.44772082567214966, 0.4716482162475586, 0.49557557702064514, 0.5195029377937317, 0.5434303283691406, 0.5673576593399048, 0.5912850499153137, 0.6152123808860779, 0.6391397714614868, 0.663067102432251, 0.6869944930076599, 0.7109218835830688, 0.734849214553833, 0.7587766051292419]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 8.0, 7.0, 9.0, 21.0, 34.0, 39.0, 53.0, 96.0, 148.0, 208.0, 337.0, 528.0, 934.0, 1639.0, 2763.0, 5082.0, 9939.0, 21263.0, 49998.0, 135916.0, 335861.0, 293712.0, 110593.0, 41853.0, 18085.0, 8736.0, 4540.0, 2555.0, 1453.0, 817.0, 461.0, 295.0, 196.0, 122.0, 71.0, 50.0, 33.0, 22.0, 12.0, 10.0, 5.0, 9.0, 5.0, 7.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.470947265625, -0.45618438720703125, -0.4414215087890625, -0.42665863037109375, -0.411895751953125, -0.39713287353515625, -0.3823699951171875, -0.36760711669921875, -0.35284423828125, -0.33808135986328125, -0.3233184814453125, -0.30855560302734375, -0.293792724609375, -0.27902984619140625, -0.2642669677734375, -0.24950408935546875, -0.2347412109375, -0.21997833251953125, -0.2052154541015625, -0.19045257568359375, -0.175689697265625, -0.16092681884765625, -0.1461639404296875, -0.13140106201171875, -0.11663818359375, -0.10187530517578125, -0.0871124267578125, -0.07234954833984375, -0.057586669921875, -0.04282379150390625, -0.0280609130859375, -0.01329803466796875, 0.00146484375, 0.01622772216796875, 0.0309906005859375, 0.04575347900390625, 0.060516357421875, 0.07527923583984375, 0.0900421142578125, 0.10480499267578125, 0.11956787109375, 0.13433074951171875, 0.1490936279296875, 0.16385650634765625, 0.178619384765625, 0.19338226318359375, 0.2081451416015625, 0.22290802001953125, 0.2376708984375, 0.25243377685546875, 0.2671966552734375, 0.28195953369140625, 0.296722412109375, 0.31148529052734375, 0.3262481689453125, 0.34101104736328125, 0.35577392578125, 0.37053680419921875, 0.3852996826171875, 0.40006256103515625, 0.414825439453125, 0.42958831787109375, 0.4443511962890625, 0.45911407470703125, 0.473876953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 5.0, 7.0, 5.0, 4.0, 8.0, 6.0, 7.0, 11.0, 16.0, 17.0, 13.0, 20.0, 25.0, 27.0, 31.0, 38.0, 37.0, 29.0, 40.0, 43.0, 37.0, 42.0, 42.0, 55.0, 43.0, 38.0, 38.0, 43.0, 25.0, 25.0, 38.0, 34.0, 20.0, 26.0, 9.0, 14.0, 17.0, 19.0, 7.0, 4.0, 10.0, 5.0, 5.0, 2.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.037109375, -1.970489501953125, -1.90386962890625, -1.837249755859375, -1.7706298828125, -1.704010009765625, -1.63739013671875, -1.570770263671875, -1.504150390625, -1.437530517578125, -1.37091064453125, -1.304290771484375, -1.2376708984375, -1.171051025390625, -1.10443115234375, -1.037811279296875, -0.97119140625, -0.904571533203125, -0.83795166015625, -0.771331787109375, -0.7047119140625, -0.638092041015625, -0.57147216796875, -0.504852294921875, -0.438232421875, -0.371612548828125, -0.30499267578125, -0.238372802734375, -0.1717529296875, -0.105133056640625, -0.03851318359375, 0.028106689453125, 0.0947265625, 0.161346435546875, 0.22796630859375, 0.294586181640625, 0.3612060546875, 0.427825927734375, 0.49444580078125, 0.561065673828125, 0.627685546875, 0.694305419921875, 0.76092529296875, 0.827545166015625, 0.8941650390625, 0.960784912109375, 1.02740478515625, 1.094024658203125, 1.16064453125, 1.227264404296875, 1.29388427734375, 1.360504150390625, 1.4271240234375, 1.493743896484375, 1.56036376953125, 1.626983642578125, 1.693603515625, 1.760223388671875, 1.82684326171875, 1.893463134765625, 1.9600830078125, 2.026702880859375, 2.09332275390625, 2.159942626953125, 2.2265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 6.0, 4.0, 5.0, 8.0, 10.0, 12.0, 12.0, 21.0, 23.0, 31.0, 51.0, 82.0, 132.0, 193.0, 319.0, 688.0, 3589.0, 85060.0, 921156.0, 33604.0, 2136.0, 596.0, 279.0, 151.0, 100.0, 74.0, 57.0, 30.0, 32.0, 24.0, 24.0, 12.0, 9.0, 8.0, 8.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.115234375, -2.0537109375, -1.9921875, -1.9306640625, -1.869140625, -1.8076171875, -1.74609375, -1.6845703125, -1.623046875, -1.5615234375, -1.5, -1.4384765625, -1.376953125, -1.3154296875, -1.25390625, -1.1923828125, -1.130859375, -1.0693359375, -1.0078125, -0.9462890625, -0.884765625, -0.8232421875, -0.76171875, -0.7001953125, -0.638671875, -0.5771484375, -0.515625, -0.4541015625, -0.392578125, -0.3310546875, -0.26953125, -0.2080078125, -0.146484375, -0.0849609375, -0.0234375, 0.0380859375, 0.099609375, 0.1611328125, 0.22265625, 0.2841796875, 0.345703125, 0.4072265625, 0.46875, 0.5302734375, 0.591796875, 0.6533203125, 0.71484375, 0.7763671875, 0.837890625, 0.8994140625, 0.9609375, 1.0224609375, 1.083984375, 1.1455078125, 1.20703125, 1.2685546875, 1.330078125, 1.3916015625, 1.453125, 1.5146484375, 1.576171875, 1.6376953125, 1.69921875, 1.7607421875, 1.822265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 6.0, 7.0, 8.0, 5.0, 17.0, 6.0, 17.0, 14.0, 17.0, 26.0, 22.0, 14.0, 26.0, 28.0, 44.0, 40.0, 41.0, 45.0, 40.0, 52.0, 51.0, 50.0, 59.0, 42.0, 38.0, 51.0, 39.0, 26.0, 28.0, 20.0, 28.0, 17.0, 12.0, 14.0, 14.0, 11.0, 1.0, 10.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0], "bins": [-2.609375, -2.537872314453125, -2.46636962890625, -2.394866943359375, -2.3233642578125, -2.251861572265625, -2.18035888671875, -2.108856201171875, -2.037353515625, -1.965850830078125, -1.89434814453125, -1.822845458984375, -1.7513427734375, -1.679840087890625, -1.60833740234375, -1.536834716796875, -1.46533203125, -1.393829345703125, -1.32232666015625, -1.250823974609375, -1.1793212890625, -1.107818603515625, -1.03631591796875, -0.964813232421875, -0.893310546875, -0.821807861328125, -0.75030517578125, -0.678802490234375, -0.6072998046875, -0.535797119140625, -0.46429443359375, -0.392791748046875, -0.3212890625, -0.249786376953125, -0.17828369140625, -0.106781005859375, -0.0352783203125, 0.036224365234375, 0.10772705078125, 0.179229736328125, 0.250732421875, 0.322235107421875, 0.39373779296875, 0.465240478515625, 0.5367431640625, 0.608245849609375, 0.67974853515625, 0.751251220703125, 0.82275390625, 0.894256591796875, 0.96575927734375, 1.037261962890625, 1.1087646484375, 1.180267333984375, 1.25177001953125, 1.323272705078125, 1.394775390625, 1.466278076171875, 1.53778076171875, 1.609283447265625, 1.6807861328125, 1.752288818359375, 1.82379150390625, 1.895294189453125, 1.966796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 9.0, 4.0, 25.0, 41.0, 59.0, 122.0, 265.0, 718.0, 2552.0, 14221.0, 367360.0, 642811.0, 16245.0, 2785.0, 754.0, 305.0, 118.0, 72.0, 28.0, 16.0, 17.0, 9.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.390380859375, -0.3734321594238281, -0.35648345947265625, -0.3395347595214844, -0.3225860595703125, -0.3056373596191406, -0.28868865966796875, -0.2717399597167969, -0.254791259765625, -0.23784255981445312, -0.22089385986328125, -0.20394515991210938, -0.1869964599609375, -0.17004776000976562, -0.15309906005859375, -0.13615036010742188, -0.11920166015625, -0.10225296020507812, -0.08530426025390625, -0.06835556030273438, -0.0514068603515625, -0.034458160400390625, -0.01750946044921875, -0.000560760498046875, 0.016387939453125, 0.033336639404296875, 0.05028533935546875, 0.06723403930664062, 0.0841827392578125, 0.10113143920898438, 0.11808013916015625, 0.13502883911132812, 0.1519775390625, 0.16892623901367188, 0.18587493896484375, 0.20282363891601562, 0.2197723388671875, 0.23672103881835938, 0.25366973876953125, 0.2706184387207031, 0.287567138671875, 0.3045158386230469, 0.32146453857421875, 0.3384132385253906, 0.3553619384765625, 0.3723106384277344, 0.38925933837890625, 0.4062080383300781, 0.42315673828125, 0.4401054382324219, 0.45705413818359375, 0.4740028381347656, 0.4909515380859375, 0.5079002380371094, 0.5248489379882812, 0.5417976379394531, 0.558746337890625, 0.5756950378417969, 0.5926437377929688, 0.6095924377441406, 0.6265411376953125, 0.6434898376464844, 0.6604385375976562, 0.6773872375488281, 0.6943359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 8.0, 14.0, 23.0, 20.0, 37.0, 75.0, 105.0, 178.0, 211.0, 125.0, 60.0, 40.0, 20.0, 12.0, 16.0, 10.0, 6.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.431341171264648e-05, -6.261933594942093e-05, -6.0925260186195374e-05, -5.923118442296982e-05, -5.753710865974426e-05, -5.584303289651871e-05, -5.414895713329315e-05, -5.2454881370067596e-05, -5.076080560684204e-05, -4.9066729843616486e-05, -4.737265408039093e-05, -4.5678578317165375e-05, -4.398450255393982e-05, -4.2290426790714264e-05, -4.059635102748871e-05, -3.890227526426315e-05, -3.72081995010376e-05, -3.551412373781204e-05, -3.382004797458649e-05, -3.212597221136093e-05, -3.0431896448135376e-05, -2.873782068490982e-05, -2.7043744921684265e-05, -2.534966915845871e-05, -2.3655593395233154e-05, -2.19615176320076e-05, -2.0267441868782043e-05, -1.8573366105556488e-05, -1.6879290342330933e-05, -1.5185214579105377e-05, -1.3491138815879822e-05, -1.1797063052654266e-05, -1.0102987289428711e-05, -8.408911526203156e-06, -6.7148357629776e-06, -5.020759999752045e-06, -3.3266842365264893e-06, -1.6326084733009338e-06, 6.146728992462158e-08, 1.755543053150177e-06, 3.4496188163757324e-06, 5.143694579601288e-06, 6.837770342826843e-06, 8.531846106052399e-06, 1.0225921869277954e-05, 1.191999763250351e-05, 1.3614073395729065e-05, 1.530814915895462e-05, 1.7002224922180176e-05, 1.869630068540573e-05, 2.0390376448631287e-05, 2.2084452211856842e-05, 2.3778527975082397e-05, 2.5472603738307953e-05, 2.7166679501533508e-05, 2.8860755264759064e-05, 3.055483102798462e-05, 3.2248906791210175e-05, 3.394298255443573e-05, 3.5637058317661285e-05, 3.733113408088684e-05, 3.9025209844112396e-05, 4.071928560733795e-05, 4.241336137056351e-05, 4.410743713378906e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 7.0, 11.0, 18.0, 21.0, 26.0, 60.0, 127.0, 246.0, 549.0, 1503.0, 5356.0, 27228.0, 751422.0, 239050.0, 17011.0, 3786.0, 1190.0, 470.0, 186.0, 104.0, 63.0, 32.0, 14.0, 19.0, 9.0, 5.0, 3.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.495849609375, -0.4820289611816406, -0.46820831298828125, -0.4543876647949219, -0.4405670166015625, -0.4267463684082031, -0.41292572021484375, -0.3991050720214844, -0.385284423828125, -0.3714637756347656, -0.35764312744140625, -0.3438224792480469, -0.3300018310546875, -0.3161811828613281, -0.30236053466796875, -0.2885398864746094, -0.27471923828125, -0.2608985900878906, -0.24707794189453125, -0.23325729370117188, -0.2194366455078125, -0.20561599731445312, -0.19179534912109375, -0.17797470092773438, -0.164154052734375, -0.15033340454101562, -0.13651275634765625, -0.12269210815429688, -0.1088714599609375, -0.09505081176757812, -0.08123016357421875, -0.06740951538085938, -0.0535888671875, -0.039768218994140625, -0.02594757080078125, -0.012126922607421875, 0.0016937255859375, 0.015514373779296875, 0.02933502197265625, 0.043155670166015625, 0.056976318359375, 0.07079696655273438, 0.08461761474609375, 0.09843826293945312, 0.1122589111328125, 0.12607955932617188, 0.13990020751953125, 0.15372085571289062, 0.16754150390625, 0.18136215209960938, 0.19518280029296875, 0.20900344848632812, 0.2228240966796875, 0.23664474487304688, 0.25046539306640625, 0.2642860412597656, 0.278106689453125, 0.2919273376464844, 0.30574798583984375, 0.3195686340332031, 0.3333892822265625, 0.3472099304199219, 0.36103057861328125, 0.3748512268066406, 0.388671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 4.0, 9.0, 3.0, 15.0, 11.0, 22.0, 32.0, 32.0, 43.0, 77.0, 206.0, 241.0, 86.0, 56.0, 36.0, 29.0, 18.0, 15.0, 11.0, 5.0, 8.0, 9.0, 4.0, 2.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1397705078125, -0.1354198455810547, -0.13106918334960938, -0.12671852111816406, -0.12236785888671875, -0.11801719665527344, -0.11366653442382812, -0.10931587219238281, -0.1049652099609375, -0.10061454772949219, -0.09626388549804688, -0.09191322326660156, -0.08756256103515625, -0.08321189880371094, -0.07886123657226562, -0.07451057434082031, -0.070159912109375, -0.06580924987792969, -0.061458587646484375, -0.05710792541503906, -0.05275726318359375, -0.04840660095214844, -0.044055938720703125, -0.03970527648925781, -0.0353546142578125, -0.031003952026367188, -0.026653289794921875, -0.022302627563476562, -0.01795196533203125, -0.013601303100585938, -0.009250640869140625, -0.0048999786376953125, -0.00054931640625, 0.0038013458251953125, 0.008152008056640625, 0.012502670288085938, 0.01685333251953125, 0.021203994750976562, 0.025554656982421875, 0.029905319213867188, 0.0342559814453125, 0.03860664367675781, 0.042957305908203125, 0.04730796813964844, 0.05165863037109375, 0.05600929260253906, 0.060359954833984375, 0.06471061706542969, 0.069061279296875, 0.07341194152832031, 0.07776260375976562, 0.08211326599121094, 0.08646392822265625, 0.09081459045410156, 0.09516525268554688, 0.09951591491699219, 0.1038665771484375, 0.10821723937988281, 0.11256790161132812, 0.11691856384277344, 0.12126922607421875, 0.12561988830566406, 0.12997055053710938, 0.1343212127685547, 0.138671875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 31.0, 244.0, 527.0, 186.0, 25.0, 3.0], "bins": [-27.2632999420166, -26.81192970275879, -26.36056137084961, -25.909191131591797, -25.457820892333984, -25.006450653076172, -24.555082321166992, -24.10371208190918, -23.652341842651367, -23.200971603393555, -22.749603271484375, -22.298233032226562, -21.84686279296875, -21.395492553710938, -20.944124221801758, -20.492753982543945, -20.041383743286133, -19.59001350402832, -19.13864517211914, -18.687274932861328, -18.235904693603516, -17.784534454345703, -17.333166122436523, -16.88179588317871, -16.4304256439209, -15.979056358337402, -15.52768611907959, -15.076316833496094, -14.624946594238281, -14.173577308654785, -13.722207069396973, -13.270837783813477, -12.819467544555664, -12.368098258972168, -11.916728019714355, -11.46535873413086, -11.013988494873047, -10.56261920928955, -10.111248970031738, -9.659879684448242, -9.208510398864746, -8.75714111328125, -8.305770874023438, -7.854401111602783, -7.403031349182129, -6.951662063598633, -6.50029182434082, -6.048922538757324, -5.597552299499512, -5.146182537078857, -4.694812774658203, -4.243443012237549, -3.7920732498168945, -3.3407037258148193, -2.889333963394165, -2.4379642009735107, -1.986594319343567, -1.5352245569229126, -1.0838549137115479, -0.6324851512908936, -0.18111538887023926, 0.2702542543411255, 0.7216240167617798, 1.172993779182434, 1.6243635416030884]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 0.0, 7.0, 7.0, 2.0, 12.0, 9.0, 9.0, 20.0, 16.0, 20.0, 23.0, 26.0, 34.0, 28.0, 34.0, 47.0, 42.0, 38.0, 48.0, 53.0, 33.0, 41.0, 33.0, 48.0, 35.0, 30.0, 33.0, 35.0, 31.0, 25.0, 31.0, 25.0, 17.0, 19.0, 21.0, 8.0, 21.0, 9.0, 3.0, 9.0, 4.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.401885509490967, -3.2952685356140137, -3.1886515617370605, -3.0820345878601074, -2.9754176139831543, -2.868800640106201, -2.762183666229248, -2.655566930770874, -2.548949956893921, -2.4423329830169678, -2.3357160091400146, -2.2290990352630615, -2.1224820613861084, -2.0158653259277344, -1.9092482328414917, -1.8026313781738281, -1.6960142850875854, -1.5893973112106323, -1.4827803373336792, -1.3761634826660156, -1.2695465087890625, -1.1629295349121094, -1.0563125610351562, -0.9496956467628479, -0.8430786728858948, -0.7364616990089417, -0.6298447847366333, -0.5232278108596802, -0.41661086678504944, -0.3099939227104187, -0.20337694883346558, -0.09676003456115723, 0.009856939315795898, 0.11647389084100723, 0.22309084236621857, 0.3297078013420105, 0.43632474541664124, 0.542941689491272, 0.6495586633682251, 0.7561755776405334, 0.8627925515174866, 0.9694095253944397, 1.076026439666748, 1.1826434135437012, 1.2892603874206543, 1.3958773612976074, 1.5024943351745605, 1.6091111898422241, 1.7157281637191772, 1.8223451375961304, 1.9289621114730835, 2.035578966140747, 2.1421959400177, 2.2488129138946533, 2.3554298877716064, 2.4620468616485596, 2.5686638355255127, 2.675280809402466, 2.781897783279419, 2.888514757156372, 2.995131731033325, 3.101748466491699, 3.2083654403686523, 3.3149824142456055, 3.4215993881225586]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 6.0, 11.0, 13.0, 33.0, 40.0, 72.0, 116.0, 192.0, 333.0, 587.0, 1300.0, 3002.0, 8016.0, 27069.0, 151431.0, 1556061.0, 2187759.0, 209210.0, 33390.0, 9303.0, 3301.0, 1449.0, 746.0, 360.0, 233.0, 103.0, 62.0, 34.0, 21.0, 13.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.8642578125, -1.8152923583984375, -1.766326904296875, -1.7173614501953125, -1.66839599609375, -1.6194305419921875, -1.570465087890625, -1.5214996337890625, -1.4725341796875, -1.4235687255859375, -1.374603271484375, -1.3256378173828125, -1.27667236328125, -1.2277069091796875, -1.178741455078125, -1.1297760009765625, -1.080810546875, -1.0318450927734375, -0.982879638671875, -0.9339141845703125, -0.88494873046875, -0.8359832763671875, -0.787017822265625, -0.7380523681640625, -0.6890869140625, -0.6401214599609375, -0.591156005859375, -0.5421905517578125, -0.49322509765625, -0.4442596435546875, -0.395294189453125, -0.3463287353515625, -0.29736328125, -0.2483978271484375, -0.199432373046875, -0.1504669189453125, -0.10150146484375, -0.0525360107421875, -0.003570556640625, 0.0453948974609375, 0.0943603515625, 0.1433258056640625, 0.192291259765625, 0.2412567138671875, 0.29022216796875, 0.3391876220703125, 0.388153076171875, 0.4371185302734375, 0.486083984375, 0.5350494384765625, 0.584014892578125, 0.6329803466796875, 0.68194580078125, 0.7309112548828125, 0.779876708984375, 0.8288421630859375, 0.8778076171875, 0.9267730712890625, 0.975738525390625, 1.0247039794921875, 1.07366943359375, 1.1226348876953125, 1.171600341796875, 1.2205657958984375, 1.26953125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 5.0, 6.0, 9.0, 12.0, 12.0, 16.0, 16.0, 15.0, 16.0, 28.0, 18.0, 21.0, 50.0, 36.0, 59.0, 46.0, 55.0, 55.0, 58.0, 47.0, 64.0, 44.0, 47.0, 36.0, 36.0, 35.0, 32.0, 24.0, 17.0, 11.0, 20.0, 9.0, 11.0, 14.0, 6.0, 4.0, 4.0, 0.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9804840087890625, -0.948272705078125, -0.9160614013671875, -0.88385009765625, -0.8516387939453125, -0.819427490234375, -0.7872161865234375, -0.7550048828125, -0.7227935791015625, -0.690582275390625, -0.6583709716796875, -0.62615966796875, -0.5939483642578125, -0.561737060546875, -0.5295257568359375, -0.497314453125, -0.4651031494140625, -0.432891845703125, -0.4006805419921875, -0.36846923828125, -0.3362579345703125, -0.304046630859375, -0.2718353271484375, -0.2396240234375, -0.2074127197265625, -0.175201416015625, -0.1429901123046875, -0.11077880859375, -0.0785675048828125, -0.046356201171875, -0.0141448974609375, 0.01806640625, 0.0502777099609375, 0.082489013671875, 0.1147003173828125, 0.14691162109375, 0.1791229248046875, 0.211334228515625, 0.2435455322265625, 0.2757568359375, 0.3079681396484375, 0.340179443359375, 0.3723907470703125, 0.40460205078125, 0.4368133544921875, 0.469024658203125, 0.5012359619140625, 0.533447265625, 0.5656585693359375, 0.597869873046875, 0.6300811767578125, 0.66229248046875, 0.6945037841796875, 0.726715087890625, 0.7589263916015625, 0.7911376953125, 0.8233489990234375, 0.855560302734375, 0.8877716064453125, 0.91998291015625, 0.9521942138671875, 0.984405517578125, 1.0166168212890625, 1.048828125]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 7.0, 5.0, 6.0, 21.0, 32.0, 50.0, 141.0, 338.0, 9701.0, 4181941.0, 1593.0, 248.0, 109.0, 39.0, 18.0, 12.0, 5.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.09375, -15.6846923828125, -15.275634765625, -14.8665771484375, -14.45751953125, -14.0484619140625, -13.639404296875, -13.2303466796875, -12.8212890625, -12.4122314453125, -12.003173828125, -11.5941162109375, -11.18505859375, -10.7760009765625, -10.366943359375, -9.9578857421875, -9.548828125, -9.1397705078125, -8.730712890625, -8.3216552734375, -7.91259765625, -7.5035400390625, -7.094482421875, -6.6854248046875, -6.2763671875, -5.8673095703125, -5.458251953125, -5.0491943359375, -4.64013671875, -4.2310791015625, -3.822021484375, -3.4129638671875, -3.00390625, -2.5948486328125, -2.185791015625, -1.7767333984375, -1.36767578125, -0.9586181640625, -0.549560546875, -0.1405029296875, 0.2685546875, 0.6776123046875, 1.086669921875, 1.4957275390625, 1.90478515625, 2.3138427734375, 2.722900390625, 3.1319580078125, 3.541015625, 3.9500732421875, 4.359130859375, 4.7681884765625, 5.17724609375, 5.5863037109375, 5.995361328125, 6.4044189453125, 6.8134765625, 7.2225341796875, 7.631591796875, 8.0406494140625, 8.44970703125, 8.8587646484375, 9.267822265625, 9.6768798828125, 10.0859375]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 8.0, 9.0, 12.0, 14.0, 31.0, 50.0, 63.0, 86.0, 145.0, 278.0, 488.0, 1024.0, 771.0, 454.0, 249.0, 150.0, 79.0, 54.0, 45.0, 29.0, 14.0, 4.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.451416015625, -0.4346351623535156, -0.41785430908203125, -0.4010734558105469, -0.3842926025390625, -0.3675117492675781, -0.35073089599609375, -0.3339500427246094, -0.317169189453125, -0.3003883361816406, -0.28360748291015625, -0.2668266296386719, -0.2500457763671875, -0.23326492309570312, -0.21648406982421875, -0.19970321655273438, -0.18292236328125, -0.16614151000976562, -0.14936065673828125, -0.13257980346679688, -0.1157989501953125, -0.09901809692382812, -0.08223724365234375, -0.06545639038085938, -0.048675537109375, -0.031894683837890625, -0.01511383056640625, 0.001667022705078125, 0.0184478759765625, 0.035228729248046875, 0.05200958251953125, 0.06879043579101562, 0.0855712890625, 0.10235214233398438, 0.11913299560546875, 0.13591384887695312, 0.1526947021484375, 0.16947555541992188, 0.18625640869140625, 0.20303726196289062, 0.219818115234375, 0.23659896850585938, 0.25337982177734375, 0.2701606750488281, 0.2869415283203125, 0.3037223815917969, 0.32050323486328125, 0.3372840881347656, 0.35406494140625, 0.3708457946777344, 0.38762664794921875, 0.4044075012207031, 0.4211883544921875, 0.4379692077636719, 0.45475006103515625, 0.4715309143066406, 0.488311767578125, 0.5050926208496094, 0.5218734741210938, 0.5386543273925781, 0.5554351806640625, 0.5722160339355469, 0.5889968872070312, 0.6057777404785156, 0.62255859375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 6.0, 22.0, 25.0, 34.0, 54.0, 53.0, 88.0, 100.0, 108.0, 117.0, 91.0, 80.0, 71.0, 51.0, 46.0, 14.0, 14.0, 10.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.731008768081665, -2.6662120819091797, -2.6014151573181152, -2.53661847114563, -2.4718217849731445, -2.40702486038208, -2.3422281742095947, -2.2774312496185303, -2.212634563446045, -2.1478378772735596, -2.083040952682495, -2.0182442665100098, -1.9534474611282349, -1.88865065574646, -1.8238539695739746, -1.7590571641921997, -1.6942603588104248, -1.62946355342865, -1.564666748046875, -1.4998700618743896, -1.4350732564926147, -1.3702764511108398, -1.3054797649383545, -1.2406829595565796, -1.1758861541748047, -1.1110893487930298, -1.0462925434112549, -0.9814958572387695, -0.9166990518569946, -0.8519022464752197, -0.7871055006980896, -0.7223087549209595, -0.6575121879577637, -0.5927153825759888, -0.5279186367988586, -0.46312186121940613, -0.3983250856399536, -0.3335283100605011, -0.2687315344810486, -0.20393475890159607, -0.13913798332214355, -0.07434120774269104, -0.009544432163238525, 0.05525234341621399, 0.1200491189956665, 0.18484589457511902, 0.24964267015457153, 0.31443944573402405, 0.37923622131347656, 0.4440329968929291, 0.5088297724723816, 0.5736265182495117, 0.6384233236312866, 0.7032201290130615, 0.7680168747901917, 0.8328136205673218, 0.8976104259490967, 0.9624072313308716, 1.0272040367126465, 1.0920007228851318, 1.1567975282669067, 1.2215943336486816, 1.286391019821167, 1.351187825202942, 1.4159846305847168]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 6.0, 6.0, 8.0, 9.0, 15.0, 14.0, 18.0, 25.0, 23.0, 20.0, 24.0, 29.0, 30.0, 32.0, 31.0, 40.0, 37.0, 41.0, 33.0, 42.0, 42.0, 42.0, 44.0, 39.0, 29.0, 42.0, 30.0, 39.0, 25.0, 21.0, 29.0, 14.0, 14.0, 21.0, 9.0, 10.0, 6.0, 6.0, 8.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.851571261882782, -0.823901891708374, -0.7962325811386108, -0.7685632109642029, -0.7408938407897949, -0.7132245302200317, -0.6855551600456238, -0.6578857898712158, -0.6302164793014526, -0.6025471091270447, -0.5748777985572815, -0.5472084283828735, -0.5195390582084656, -0.49186971783638, -0.46420037746429443, -0.4365310072898865, -0.4088616371154785, -0.38119229674339294, -0.353522926568985, -0.3258535861968994, -0.29818421602249146, -0.2705148756504059, -0.2428455352783203, -0.21517618000507355, -0.18750682473182678, -0.15983746945858002, -0.13216811418533325, -0.10449877381324768, -0.07682941854000092, -0.04916006326675415, -0.02149072289466858, 0.006178632378578186, 0.03384804725646973, 0.06151739880442619, 0.08918675035238266, 0.11685609817504883, 0.1445254534482956, 0.17219480872154236, 0.19986414909362793, 0.2275335043668747, 0.25520285964012146, 0.28287220001220703, 0.310541570186615, 0.33821091055870056, 0.36588025093078613, 0.3935496211051941, 0.42121896147727966, 0.44888830184936523, 0.4765576720237732, 0.5042270421981812, 0.5318963527679443, 0.5595657229423523, 0.5872350931167603, 0.6149044036865234, 0.6425737738609314, 0.6702431440353394, 0.6979124546051025, 0.7255818247795105, 0.7532511353492737, 0.7809205055236816, 0.8085898756980896, 0.8362592458724976, 0.8639285564422607, 0.8915979266166687, 0.9192672967910767]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 8.0, 6.0, 12.0, 15.0, 22.0, 27.0, 57.0, 86.0, 123.0, 240.0, 399.0, 769.0, 1389.0, 2667.0, 5396.0, 11975.0, 28928.0, 77863.0, 219293.0, 407441.0, 182798.0, 64842.0, 23990.0, 10158.0, 4781.0, 2469.0, 1239.0, 658.0, 398.0, 192.0, 130.0, 67.0, 47.0, 29.0, 21.0, 12.0, 5.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.394287109375, -0.3799018859863281, -0.36551666259765625, -0.3511314392089844, -0.3367462158203125, -0.3223609924316406, -0.30797576904296875, -0.2935905456542969, -0.279205322265625, -0.2648200988769531, -0.25043487548828125, -0.23604965209960938, -0.2216644287109375, -0.20727920532226562, -0.19289398193359375, -0.17850875854492188, -0.16412353515625, -0.14973831176757812, -0.13535308837890625, -0.12096786499023438, -0.1065826416015625, -0.09219741821289062, -0.07781219482421875, -0.06342697143554688, -0.049041748046875, -0.034656524658203125, -0.02027130126953125, -0.005886077880859375, 0.0084991455078125, 0.022884368896484375, 0.03726959228515625, 0.051654815673828125, 0.0660400390625, 0.08042526245117188, 0.09481048583984375, 0.10919570922851562, 0.1235809326171875, 0.13796615600585938, 0.15235137939453125, 0.16673660278320312, 0.181121826171875, 0.19550704956054688, 0.20989227294921875, 0.22427749633789062, 0.2386627197265625, 0.2530479431152344, 0.26743316650390625, 0.2818183898925781, 0.29620361328125, 0.3105888366699219, 0.32497406005859375, 0.3393592834472656, 0.3537445068359375, 0.3681297302246094, 0.38251495361328125, 0.3969001770019531, 0.411285400390625, 0.4256706237792969, 0.44005584716796875, 0.4544410705566406, 0.4688262939453125, 0.4832115173339844, 0.49759674072265625, 0.5119819641113281, 0.5263671875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 3.0, 10.0, 8.0, 16.0, 12.0, 12.0, 17.0, 24.0, 33.0, 30.0, 25.0, 48.0, 54.0, 51.0, 40.0, 70.0, 67.0, 55.0, 66.0, 54.0, 62.0, 43.0, 34.0, 37.0, 31.0, 21.0, 23.0, 10.0, 11.0, 14.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6865234375, -0.6595611572265625, -0.632598876953125, -0.6056365966796875, -0.57867431640625, -0.5517120361328125, -0.524749755859375, -0.4977874755859375, -0.4708251953125, -0.4438629150390625, -0.416900634765625, -0.3899383544921875, -0.36297607421875, -0.3360137939453125, -0.309051513671875, -0.2820892333984375, -0.255126953125, -0.2281646728515625, -0.201202392578125, -0.1742401123046875, -0.14727783203125, -0.1203155517578125, -0.093353271484375, -0.0663909912109375, -0.0394287109375, -0.0124664306640625, 0.014495849609375, 0.0414581298828125, 0.06842041015625, 0.0953826904296875, 0.122344970703125, 0.1493072509765625, 0.17626953125, 0.2032318115234375, 0.230194091796875, 0.2571563720703125, 0.28411865234375, 0.3110809326171875, 0.338043212890625, 0.3650054931640625, 0.3919677734375, 0.4189300537109375, 0.445892333984375, 0.4728546142578125, 0.49981689453125, 0.5267791748046875, 0.553741455078125, 0.5807037353515625, 0.607666015625, 0.6346282958984375, 0.661590576171875, 0.6885528564453125, 0.71551513671875, 0.7424774169921875, 0.769439697265625, 0.7964019775390625, 0.8233642578125, 0.8503265380859375, 0.877288818359375, 0.9042510986328125, 0.93121337890625, 0.9581756591796875, 0.985137939453125, 1.0121002197265625, 1.0390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 10.0, 8.0, 12.0, 13.0, 16.0, 25.0, 35.0, 45.0, 65.0, 79.0, 125.0, 175.0, 332.0, 486.0, 1106.0, 2572.0, 7582.0, 28642.0, 151773.0, 630373.0, 178444.0, 32703.0, 8433.0, 2795.0, 1198.0, 543.0, 325.0, 179.0, 136.0, 82.0, 64.0, 49.0, 25.0, 31.0, 20.0, 9.0, 10.0, 9.0, 9.0, 7.0, 6.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.6142578125, -0.5953826904296875, -0.576507568359375, -0.5576324462890625, -0.53875732421875, -0.5198822021484375, -0.501007080078125, -0.4821319580078125, -0.4632568359375, -0.4443817138671875, -0.425506591796875, -0.4066314697265625, -0.38775634765625, -0.3688812255859375, -0.350006103515625, -0.3311309814453125, -0.312255859375, -0.2933807373046875, -0.274505615234375, -0.2556304931640625, -0.23675537109375, -0.2178802490234375, -0.199005126953125, -0.1801300048828125, -0.1612548828125, -0.1423797607421875, -0.123504638671875, -0.1046295166015625, -0.08575439453125, -0.0668792724609375, -0.048004150390625, -0.0291290283203125, -0.01025390625, 0.0086212158203125, 0.027496337890625, 0.0463714599609375, 0.06524658203125, 0.0841217041015625, 0.102996826171875, 0.1218719482421875, 0.1407470703125, 0.1596221923828125, 0.178497314453125, 0.1973724365234375, 0.21624755859375, 0.2351226806640625, 0.253997802734375, 0.2728729248046875, 0.291748046875, 0.3106231689453125, 0.329498291015625, 0.3483734130859375, 0.36724853515625, 0.3861236572265625, 0.404998779296875, 0.4238739013671875, 0.4427490234375, 0.4616241455078125, 0.480499267578125, 0.4993743896484375, 0.51824951171875, 0.5371246337890625, 0.555999755859375, 0.5748748779296875, 0.59375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 10.0, 11.0, 11.0, 12.0, 20.0, 22.0, 20.0, 15.0, 32.0, 33.0, 29.0, 32.0, 48.0, 45.0, 45.0, 45.0, 41.0, 50.0, 47.0, 52.0, 43.0, 44.0, 37.0, 30.0, 21.0, 23.0, 29.0, 24.0, 23.0, 18.0, 10.0, 16.0, 9.0, 7.0, 6.0, 6.0, 3.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4423828125, -1.3988189697265625, -1.355255126953125, -1.3116912841796875, -1.26812744140625, -1.2245635986328125, -1.180999755859375, -1.1374359130859375, -1.0938720703125, -1.0503082275390625, -1.006744384765625, -0.9631805419921875, -0.91961669921875, -0.8760528564453125, -0.832489013671875, -0.7889251708984375, -0.745361328125, -0.7017974853515625, -0.658233642578125, -0.6146697998046875, -0.57110595703125, -0.5275421142578125, -0.483978271484375, -0.4404144287109375, -0.3968505859375, -0.3532867431640625, -0.309722900390625, -0.2661590576171875, -0.22259521484375, -0.1790313720703125, -0.135467529296875, -0.0919036865234375, -0.04833984375, -0.0047760009765625, 0.038787841796875, 0.0823516845703125, 0.12591552734375, 0.1694793701171875, 0.213043212890625, 0.2566070556640625, 0.3001708984375, 0.3437347412109375, 0.387298583984375, 0.4308624267578125, 0.47442626953125, 0.5179901123046875, 0.561553955078125, 0.6051177978515625, 0.648681640625, 0.6922454833984375, 0.735809326171875, 0.7793731689453125, 0.82293701171875, 0.8665008544921875, 0.910064697265625, 0.9536285400390625, 0.9971923828125, 1.0407562255859375, 1.084320068359375, 1.1278839111328125, 1.17144775390625, 1.2150115966796875, 1.258575439453125, 1.3021392822265625, 1.345703125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 8.0, 14.0, 16.0, 14.0, 21.0, 44.0, 65.0, 92.0, 139.0, 277.0, 458.0, 926.0, 1883.0, 4142.0, 10770.0, 35130.0, 176538.0, 618200.0, 150680.0, 31784.0, 9770.0, 3848.0, 1708.0, 870.0, 461.0, 250.0, 159.0, 93.0, 61.0, 36.0, 37.0, 16.0, 13.0, 9.0, 5.0, 6.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2205810546875, -0.21378517150878906, -0.20698928833007812, -0.2001934051513672, -0.19339752197265625, -0.1866016387939453, -0.17980575561523438, -0.17300987243652344, -0.1662139892578125, -0.15941810607910156, -0.15262222290039062, -0.1458263397216797, -0.13903045654296875, -0.1322345733642578, -0.12543869018554688, -0.11864280700683594, -0.111846923828125, -0.10505104064941406, -0.09825515747070312, -0.09145927429199219, -0.08466339111328125, -0.07786750793457031, -0.07107162475585938, -0.06427574157714844, -0.0574798583984375, -0.05068397521972656, -0.043888092041015625, -0.03709220886230469, -0.03029632568359375, -0.023500442504882812, -0.016704559326171875, -0.009908676147460938, -0.00311279296875, 0.0036830902099609375, 0.010478973388671875, 0.017274856567382812, 0.02407073974609375, 0.030866622924804688, 0.037662506103515625, 0.04445838928222656, 0.0512542724609375, 0.05805015563964844, 0.06484603881835938, 0.07164192199707031, 0.07843780517578125, 0.08523368835449219, 0.09202957153320312, 0.09882545471191406, 0.105621337890625, 0.11241722106933594, 0.11921310424804688, 0.1260089874267578, 0.13280487060546875, 0.1396007537841797, 0.14639663696289062, 0.15319252014160156, 0.1599884033203125, 0.16678428649902344, 0.17358016967773438, 0.1803760528564453, 0.18717193603515625, 0.1939678192138672, 0.20076370239257812, 0.20755958557128906, 0.21435546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 14.0, 12.0, 20.0, 30.0, 37.0, 45.0, 77.0, 103.0, 120.0, 131.0, 94.0, 83.0, 60.0, 49.0, 38.0, 23.0, 18.0, 14.0, 9.0, 5.0, 4.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00020599365234375, -0.0002013491466641426, -0.00019670464098453522, -0.00019206013530492783, -0.00018741562962532043, -0.00018277112394571304, -0.00017812661826610565, -0.00017348211258649826, -0.00016883760690689087, -0.00016419310122728348, -0.00015954859554767609, -0.0001549040898680687, -0.0001502595841884613, -0.0001456150785088539, -0.00014097057282924652, -0.00013632606714963913, -0.00013168156147003174, -0.00012703705579042435, -0.00012239255011081696, -0.00011774804443120956, -0.00011310353875160217, -0.00010845903307199478, -0.00010381452739238739, -9.917002171278e-05, -9.452551603317261e-05, -8.988101035356522e-05, -8.523650467395782e-05, -8.059199899435043e-05, -7.594749331474304e-05, -7.130298763513565e-05, -6.665848195552826e-05, -6.201397627592087e-05, -5.7369470596313477e-05, -5.2724964916706085e-05, -4.8080459237098694e-05, -4.34359535574913e-05, -3.879144787788391e-05, -3.414694219827652e-05, -2.950243651866913e-05, -2.4857930839061737e-05, -2.0213425159454346e-05, -1.5568919479846954e-05, -1.0924413800239563e-05, -6.279908120632172e-06, -1.6354024410247803e-06, 3.009103238582611e-06, 7.653608918190002e-06, 1.2298114597797394e-05, 1.6942620277404785e-05, 2.1587125957012177e-05, 2.6231631636619568e-05, 3.087613731622696e-05, 3.552064299583435e-05, 4.016514867544174e-05, 4.480965435504913e-05, 4.9454160034656525e-05, 5.4098665714263916e-05, 5.874317139387131e-05, 6.33876770734787e-05, 6.803218275308609e-05, 7.267668843269348e-05, 7.732119411230087e-05, 8.196569979190826e-05, 8.661020547151566e-05, 9.125471115112305e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 13.0, 25.0, 93.0, 431.0, 9390.0, 993528.0, 44019.0, 820.0, 122.0, 43.0, 18.0, 14.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0166015625, -0.9823150634765625, -0.948028564453125, -0.9137420654296875, -0.87945556640625, -0.8451690673828125, -0.810882568359375, -0.7765960693359375, -0.7423095703125, -0.7080230712890625, -0.673736572265625, -0.6394500732421875, -0.60516357421875, -0.5708770751953125, -0.536590576171875, -0.5023040771484375, -0.468017578125, -0.4337310791015625, -0.399444580078125, -0.3651580810546875, -0.33087158203125, -0.2965850830078125, -0.262298583984375, -0.2280120849609375, -0.1937255859375, -0.1594390869140625, -0.125152587890625, -0.0908660888671875, -0.05657958984375, -0.0222930908203125, 0.011993408203125, 0.0462799072265625, 0.08056640625, 0.1148529052734375, 0.149139404296875, 0.1834259033203125, 0.21771240234375, 0.2519989013671875, 0.286285400390625, 0.3205718994140625, 0.3548583984375, 0.3891448974609375, 0.423431396484375, 0.4577178955078125, 0.49200439453125, 0.5262908935546875, 0.560577392578125, 0.5948638916015625, 0.629150390625, 0.6634368896484375, 0.697723388671875, 0.7320098876953125, 0.76629638671875, 0.8005828857421875, 0.834869384765625, 0.8691558837890625, 0.9034423828125, 0.9377288818359375, 0.972015380859375, 1.0063018798828125, 1.04058837890625, 1.0748748779296875, 1.109161376953125, 1.1434478759765625, 1.177734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 11.0, 7.0, 10.0, 12.0, 5.0, 15.0, 19.0, 30.0, 35.0, 34.0, 61.0, 69.0, 81.0, 81.0, 78.0, 90.0, 74.0, 66.0, 54.0, 34.0, 33.0, 25.0, 11.0, 16.0, 11.0, 5.0, 6.0, 4.0, 5.0, 3.0, 3.0, 5.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04632568359375, -0.0447239875793457, -0.043122291564941406, -0.04152059555053711, -0.03991889953613281, -0.038317203521728516, -0.03671550750732422, -0.03511381149291992, -0.033512115478515625, -0.03191041946411133, -0.03030872344970703, -0.028707027435302734, -0.027105331420898438, -0.02550363540649414, -0.023901939392089844, -0.022300243377685547, -0.02069854736328125, -0.019096851348876953, -0.017495155334472656, -0.01589345932006836, -0.014291763305664062, -0.012690067291259766, -0.011088371276855469, -0.009486675262451172, -0.007884979248046875, -0.006283283233642578, -0.004681587219238281, -0.0030798912048339844, -0.0014781951904296875, 0.00012350082397460938, 0.0017251968383789062, 0.003326892852783203, 0.0049285888671875, 0.006530284881591797, 0.008131980895996094, 0.00973367691040039, 0.011335372924804688, 0.012937068939208984, 0.014538764953613281, 0.016140460968017578, 0.017742156982421875, 0.019343852996826172, 0.02094554901123047, 0.022547245025634766, 0.024148941040039062, 0.02575063705444336, 0.027352333068847656, 0.028954029083251953, 0.03055572509765625, 0.03215742111206055, 0.033759117126464844, 0.03536081314086914, 0.03696250915527344, 0.038564205169677734, 0.04016590118408203, 0.04176759719848633, 0.043369293212890625, 0.04497098922729492, 0.04657268524169922, 0.048174381256103516, 0.04977607727050781, 0.05137777328491211, 0.052979469299316406, 0.0545811653137207, 0.056182861328125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 18.0, 30.0, 38.0, 72.0, 108.0, 153.0, 179.0, 155.0, 107.0, 56.0, 39.0, 17.0, 11.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.115662097930908, -2.0558879375457764, -1.996113896369934, -1.9363398551940918, -1.8765658140182495, -1.8167917728424072, -1.7570176124572754, -1.697243571281433, -1.6374695301055908, -1.5776954889297485, -1.5179213285446167, -1.4581472873687744, -1.3983732461929321, -1.3385992050170898, -1.278825044631958, -1.2190510034561157, -1.1592768430709839, -1.0995028018951416, -1.0397286415100098, -0.9799546003341675, -0.9201805591583252, -0.8604064583778381, -0.8006323575973511, -0.7408583164215088, -0.6810842156410217, -0.6213101148605347, -0.5615360736846924, -0.5017619729042053, -0.44198790192604065, -0.382213830947876, -0.3224397301673889, -0.26266565918922424, -0.20289170742034912, -0.14311763644218445, -0.08334355056285858, -0.023569464683532715, 0.03620460629463196, 0.09597867727279663, 0.1557527780532837, 0.21552684903144836, 0.27530092000961304, 0.3350749909877777, 0.3948490619659424, 0.45462316274642944, 0.5143972635269165, 0.5741713047027588, 0.6339454054832458, 0.6937195062637329, 0.7534935474395752, 0.8132676482200623, 0.8730416893959045, 0.9328157901763916, 0.9925898313522339, 1.0523638725280762, 1.112138032913208, 1.1719120740890503, 1.2316861152648926, 1.2914601564407349, 1.3512343168258667, 1.411008358001709, 1.4707823991775513, 1.5305564403533936, 1.5903306007385254, 1.6501046419143677, 1.7098788022994995]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 9.0, 7.0, 7.0, 9.0, 14.0, 21.0, 29.0, 15.0, 35.0, 36.0, 40.0, 51.0, 49.0, 60.0, 56.0, 61.0, 61.0, 62.0, 62.0, 57.0, 47.0, 44.0, 28.0, 38.0, 21.0, 11.0, 11.0, 15.0, 17.0, 7.0, 5.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6563366055488586, -0.6297059655189514, -0.603075385093689, -0.5764447450637817, -0.5498141050338745, -0.5231835246086121, -0.49655288457870483, -0.46992227435112, -0.44329166412353516, -0.4166610538959503, -0.3900304436683655, -0.36339980363845825, -0.3367691934108734, -0.3101385831832886, -0.28350794315338135, -0.2568773329257965, -0.23024672269821167, -0.20361611247062683, -0.1769854873418808, -0.15035486221313477, -0.12372425198554993, -0.09709364175796509, -0.07046301662921906, -0.04383239150047302, -0.017201781272888184, 0.009428836405277252, 0.03605945408344269, 0.06269007176160812, 0.08932068943977356, 0.1159512996673584, 0.14258192479610443, 0.16921254992485046, 0.19584321975708008, 0.22247382998466492, 0.24910445511341095, 0.275735080242157, 0.3023656904697418, 0.32899630069732666, 0.3556269407272339, 0.3822575509548187, 0.40888816118240356, 0.4355187714099884, 0.46214938163757324, 0.48878002166748047, 0.5154106616973877, 0.5420412421226501, 0.5686718821525574, 0.5953024625778198, 0.621933102607727, 0.6485637426376343, 0.6751943230628967, 0.701824963092804, 0.7284555435180664, 0.7550861835479736, 0.7817168235778809, 0.8083474636077881, 0.8349780440330505, 0.8616086840629578, 0.8882392644882202, 0.9148699045181274, 0.9415005445480347, 0.9681311249732971, 0.9947617650032043, 1.0213923454284668, 1.048022985458374]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 10.0, 14.0, 17.0, 34.0, 48.0, 79.0, 148.0, 236.0, 460.0, 882.0, 1679.0, 3797.0, 9652.0, 27480.0, 98375.0, 483103.0, 322032.0, 67118.0, 19961.0, 7438.0, 3052.0, 1445.0, 633.0, 340.0, 187.0, 110.0, 74.0, 35.0, 39.0, 19.0, 13.0, 9.0, 9.0, 1.0, 3.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.98681640625, -0.9600448608398438, -0.9332733154296875, -0.9065017700195312, -0.879730224609375, -0.8529586791992188, -0.8261871337890625, -0.7994155883789062, -0.77264404296875, -0.7458724975585938, -0.7191009521484375, -0.6923294067382812, -0.665557861328125, -0.6387863159179688, -0.6120147705078125, -0.5852432250976562, -0.5584716796875, -0.5317001342773438, -0.5049285888671875, -0.47815704345703125, -0.451385498046875, -0.42461395263671875, -0.3978424072265625, -0.37107086181640625, -0.34429931640625, -0.31752777099609375, -0.2907562255859375, -0.26398468017578125, -0.237213134765625, -0.21044158935546875, -0.1836700439453125, -0.15689849853515625, -0.130126953125, -0.10335540771484375, -0.0765838623046875, -0.04981231689453125, -0.023040771484375, 0.00373077392578125, 0.0305023193359375, 0.05727386474609375, 0.08404541015625, 0.11081695556640625, 0.1375885009765625, 0.16436004638671875, 0.191131591796875, 0.21790313720703125, 0.2446746826171875, 0.27144622802734375, 0.2982177734375, 0.32498931884765625, 0.3517608642578125, 0.37853240966796875, 0.405303955078125, 0.43207550048828125, 0.4588470458984375, 0.48561859130859375, 0.51239013671875, 0.5391616821289062, 0.5659332275390625, 0.5927047729492188, 0.619476318359375, 0.6462478637695312, 0.6730194091796875, 0.6997909545898438, 0.7265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 8.0, 5.0, 11.0, 15.0, 18.0, 24.0, 33.0, 47.0, 45.0, 40.0, 70.0, 78.0, 69.0, 75.0, 80.0, 74.0, 74.0, 49.0, 34.0, 36.0, 33.0, 24.0, 20.0, 9.0, 6.0, 11.0, 5.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.55078125, -1.478973388671875, -1.40716552734375, -1.335357666015625, -1.2635498046875, -1.191741943359375, -1.11993408203125, -1.048126220703125, -0.976318359375, -0.904510498046875, -0.83270263671875, -0.760894775390625, -0.6890869140625, -0.617279052734375, -0.54547119140625, -0.473663330078125, -0.40185546875, -0.330047607421875, -0.25823974609375, -0.186431884765625, -0.1146240234375, -0.042816162109375, 0.02899169921875, 0.100799560546875, 0.172607421875, 0.244415283203125, 0.31622314453125, 0.388031005859375, 0.4598388671875, 0.531646728515625, 0.60345458984375, 0.675262451171875, 0.7470703125, 0.818878173828125, 0.89068603515625, 0.962493896484375, 1.0343017578125, 1.106109619140625, 1.17791748046875, 1.249725341796875, 1.321533203125, 1.393341064453125, 1.46514892578125, 1.536956787109375, 1.6087646484375, 1.680572509765625, 1.75238037109375, 1.824188232421875, 1.89599609375, 1.967803955078125, 2.03961181640625, 2.111419677734375, 2.1832275390625, 2.255035400390625, 2.32684326171875, 2.398651123046875, 2.470458984375, 2.542266845703125, 2.61407470703125, 2.685882568359375, 2.7576904296875, 2.829498291015625, 2.90130615234375, 2.973114013671875, 3.044921875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 7.0, 5.0, 11.0, 9.0, 18.0, 17.0, 25.0, 25.0, 33.0, 44.0, 47.0, 66.0, 99.0, 199.0, 5208.0, 1040210.0, 1942.0, 175.0, 96.0, 71.0, 53.0, 44.0, 34.0, 21.0, 20.0, 12.0, 17.0, 10.0, 10.0, 4.0, 3.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.92724609375, -7.6826171875, -7.43798828125, -7.193359375, -6.94873046875, -6.7041015625, -6.45947265625, -6.21484375, -5.97021484375, -5.7255859375, -5.48095703125, -5.236328125, -4.99169921875, -4.7470703125, -4.50244140625, -4.2578125, -4.01318359375, -3.7685546875, -3.52392578125, -3.279296875, -3.03466796875, -2.7900390625, -2.54541015625, -2.30078125, -2.05615234375, -1.8115234375, -1.56689453125, -1.322265625, -1.07763671875, -0.8330078125, -0.58837890625, -0.34375, -0.09912109375, 0.1455078125, 0.39013671875, 0.634765625, 0.87939453125, 1.1240234375, 1.36865234375, 1.61328125, 1.85791015625, 2.1025390625, 2.34716796875, 2.591796875, 2.83642578125, 3.0810546875, 3.32568359375, 3.5703125, 3.81494140625, 4.0595703125, 4.30419921875, 4.548828125, 4.79345703125, 5.0380859375, 5.28271484375, 5.52734375, 5.77197265625, 6.0166015625, 6.26123046875, 6.505859375, 6.75048828125, 6.9951171875, 7.23974609375, 7.484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 6.0, 3.0, 9.0, 12.0, 17.0, 14.0, 26.0, 29.0, 30.0, 35.0, 47.0, 37.0, 54.0, 66.0, 50.0, 78.0, 62.0, 68.0, 51.0, 59.0, 42.0, 39.0, 44.0, 17.0, 22.0, 15.0, 13.0, 15.0, 11.0, 2.0, 6.0, 2.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.42578125, -2.353271484375, -2.28076171875, -2.208251953125, -2.1357421875, -2.063232421875, -1.99072265625, -1.918212890625, -1.845703125, -1.773193359375, -1.70068359375, -1.628173828125, -1.5556640625, -1.483154296875, -1.41064453125, -1.338134765625, -1.265625, -1.193115234375, -1.12060546875, -1.048095703125, -0.9755859375, -0.903076171875, -0.83056640625, -0.758056640625, -0.685546875, -0.613037109375, -0.54052734375, -0.468017578125, -0.3955078125, -0.322998046875, -0.25048828125, -0.177978515625, -0.10546875, -0.032958984375, 0.03955078125, 0.112060546875, 0.1845703125, 0.257080078125, 0.32958984375, 0.402099609375, 0.474609375, 0.547119140625, 0.61962890625, 0.692138671875, 0.7646484375, 0.837158203125, 0.90966796875, 0.982177734375, 1.0546875, 1.127197265625, 1.19970703125, 1.272216796875, 1.3447265625, 1.417236328125, 1.48974609375, 1.562255859375, 1.634765625, 1.707275390625, 1.77978515625, 1.852294921875, 1.9248046875, 1.997314453125, 2.06982421875, 2.142333984375, 2.21484375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 8.0, 8.0, 13.0, 35.0, 40.0, 108.0, 246.0, 775.0, 3769.0, 52794.0, 946471.0, 39779.0, 3354.0, 693.0, 241.0, 89.0, 49.0, 20.0, 21.0, 17.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86767578125, -0.8400955200195312, -0.8125152587890625, -0.7849349975585938, -0.757354736328125, -0.7297744750976562, -0.7021942138671875, -0.6746139526367188, -0.64703369140625, -0.6194534301757812, -0.5918731689453125, -0.5642929077148438, -0.536712646484375, -0.5091323852539062, -0.4815521240234375, -0.45397186279296875, -0.4263916015625, -0.39881134033203125, -0.3712310791015625, -0.34365081787109375, -0.316070556640625, -0.28849029541015625, -0.2609100341796875, -0.23332977294921875, -0.20574951171875, -0.17816925048828125, -0.1505889892578125, -0.12300872802734375, -0.095428466796875, -0.06784820556640625, -0.0402679443359375, -0.01268768310546875, 0.014892578125, 0.04247283935546875, 0.0700531005859375, 0.09763336181640625, 0.125213623046875, 0.15279388427734375, 0.1803741455078125, 0.20795440673828125, 0.23553466796875, 0.26311492919921875, 0.2906951904296875, 0.31827545166015625, 0.345855712890625, 0.37343597412109375, 0.4010162353515625, 0.42859649658203125, 0.4561767578125, 0.48375701904296875, 0.5113372802734375, 0.5389175415039062, 0.566497802734375, 0.5940780639648438, 0.6216583251953125, 0.6492385864257812, 0.67681884765625, 0.7043991088867188, 0.7319793701171875, 0.7595596313476562, 0.787139892578125, 0.8147201538085938, 0.8423004150390625, 0.8698806762695312, 0.8974609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 8.0, 11.0, 19.0, 16.0, 59.0, 63.0, 78.0, 126.0, 146.0, 134.0, 110.0, 81.0, 41.0, 31.0, 20.0, 13.0, 10.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.592273712158203e-05, -6.41215592622757e-05, -6.232038140296936e-05, -6.0519203543663025e-05, -5.871802568435669e-05, -5.6916847825050354e-05, -5.511566996574402e-05, -5.331449210643768e-05, -5.151331424713135e-05, -4.971213638782501e-05, -4.791095852851868e-05, -4.610978066921234e-05, -4.4308602809906006e-05, -4.250742495059967e-05, -4.0706247091293335e-05, -3.8905069231987e-05, -3.7103891372680664e-05, -3.530271351337433e-05, -3.350153565406799e-05, -3.170035779476166e-05, -2.9899179935455322e-05, -2.8098002076148987e-05, -2.629682421684265e-05, -2.4495646357536316e-05, -2.269446849822998e-05, -2.0893290638923645e-05, -1.909211277961731e-05, -1.7290934920310974e-05, -1.548975706100464e-05, -1.3688579201698303e-05, -1.1887401342391968e-05, -1.0086223483085632e-05, -8.285045623779297e-06, -6.4838677644729614e-06, -4.682689905166626e-06, -2.8815120458602905e-06, -1.080334186553955e-06, 7.208436727523804e-07, 2.522021532058716e-06, 4.323199391365051e-06, 6.124377250671387e-06, 7.925555109977722e-06, 9.726732969284058e-06, 1.1527910828590393e-05, 1.3329088687896729e-05, 1.5130266547203064e-05, 1.69314444065094e-05, 1.8732622265815735e-05, 2.053380012512207e-05, 2.2334977984428406e-05, 2.413615584373474e-05, 2.5937333703041077e-05, 2.7738511562347412e-05, 2.9539689421653748e-05, 3.134086728096008e-05, 3.314204514026642e-05, 3.4943222999572754e-05, 3.674440085887909e-05, 3.8545578718185425e-05, 4.034675657749176e-05, 4.2147934436798096e-05, 4.394911229610443e-05, 4.5750290155410767e-05, 4.75514680147171e-05, 4.935264587402344e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 9.0, 14.0, 14.0, 18.0, 26.0, 35.0, 77.0, 156.0, 416.0, 1154.0, 5200.0, 43516.0, 827321.0, 155902.0, 11416.0, 2145.0, 626.0, 240.0, 95.0, 50.0, 30.0, 22.0, 20.0, 12.0, 9.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.6533203125, -0.633941650390625, -0.61456298828125, -0.595184326171875, -0.5758056640625, -0.556427001953125, -0.53704833984375, -0.517669677734375, -0.498291015625, -0.478912353515625, -0.45953369140625, -0.440155029296875, -0.4207763671875, -0.401397705078125, -0.38201904296875, -0.362640380859375, -0.34326171875, -0.323883056640625, -0.30450439453125, -0.285125732421875, -0.2657470703125, -0.246368408203125, -0.22698974609375, -0.207611083984375, -0.188232421875, -0.168853759765625, -0.14947509765625, -0.130096435546875, -0.1107177734375, -0.091339111328125, -0.07196044921875, -0.052581787109375, -0.033203125, -0.013824462890625, 0.00555419921875, 0.024932861328125, 0.0443115234375, 0.063690185546875, 0.08306884765625, 0.102447509765625, 0.121826171875, 0.141204833984375, 0.16058349609375, 0.179962158203125, 0.1993408203125, 0.218719482421875, 0.23809814453125, 0.257476806640625, 0.27685546875, 0.296234130859375, 0.31561279296875, 0.334991455078125, 0.3543701171875, 0.373748779296875, 0.39312744140625, 0.412506103515625, 0.431884765625, 0.451263427734375, 0.47064208984375, 0.490020751953125, 0.5093994140625, 0.528778076171875, 0.54815673828125, 0.567535400390625, 0.5869140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 7.0, 9.0, 7.0, 13.0, 11.0, 12.0, 24.0, 35.0, 42.0, 60.0, 60.0, 76.0, 129.0, 141.0, 79.0, 61.0, 39.0, 36.0, 33.0, 20.0, 27.0, 17.0, 12.0, 14.0, 5.0, 5.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11578369140625, -0.11164379119873047, -0.10750389099121094, -0.1033639907836914, -0.09922409057617188, -0.09508419036865234, -0.09094429016113281, -0.08680438995361328, -0.08266448974609375, -0.07852458953857422, -0.07438468933105469, -0.07024478912353516, -0.06610488891601562, -0.061964988708496094, -0.05782508850097656, -0.05368518829345703, -0.0495452880859375, -0.04540538787841797, -0.04126548767089844, -0.037125587463378906, -0.032985687255859375, -0.028845787048339844, -0.024705886840820312, -0.02056598663330078, -0.01642608642578125, -0.012286186218261719, -0.008146286010742188, -0.004006385803222656, 0.000133514404296875, 0.004273414611816406, 0.008413314819335938, 0.012553215026855469, 0.016693115234375, 0.02083301544189453, 0.024972915649414062, 0.029112815856933594, 0.033252716064453125, 0.037392616271972656, 0.04153251647949219, 0.04567241668701172, 0.04981231689453125, 0.05395221710205078, 0.05809211730957031, 0.062232017517089844, 0.06637191772460938, 0.0705118179321289, 0.07465171813964844, 0.07879161834716797, 0.0829315185546875, 0.08707141876220703, 0.09121131896972656, 0.0953512191772461, 0.09949111938476562, 0.10363101959228516, 0.10777091979980469, 0.11191082000732422, 0.11605072021484375, 0.12019062042236328, 0.12433052062988281, 0.12847042083740234, 0.13261032104492188, 0.1367502212524414, 0.14089012145996094, 0.14503002166748047, 0.149169921875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 33.0, 127.0, 350.0, 341.0, 117.0, 30.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0455448627471924, -2.768306255340576, -2.491067409515381, -2.2138285636901855, -1.9365899562835693, -1.6593512296676636, -1.3821125030517578, -1.104873776435852, -0.8276350498199463, -0.5503963232040405, -0.27315759658813477, 0.004081130027770996, 0.28131985664367676, 0.5585585832595825, 0.8357973098754883, 1.113036036491394, 1.3902747631072998, 1.6675134897232056, 1.9447522163391113, 2.2219910621643066, 2.499229669570923, 2.776468276977539, 3.0537071228027344, 3.3309459686279297, 3.608184576034546, 3.885423183441162, 4.162662029266357, 4.439900875091553, 4.71713924407959, 4.994378089904785, 5.2716169357299805, 5.548855781555176, 5.826093673706055, 6.10333251953125, 6.380571365356445, 6.657809734344482, 6.935048580169678, 7.212287425994873, 7.48952579498291, 7.7667646408081055, 8.0440034866333, 8.321242332458496, 8.598481178283691, 8.875720024108887, 9.152957916259766, 9.430196762084961, 9.707435607910156, 9.984674453735352, 10.261913299560547, 10.539152145385742, 10.816390991210938, 11.093629837036133, 11.370868682861328, 11.648106575012207, 11.925345420837402, 12.202584266662598, 12.479823112487793, 12.757061958312988, 13.034300804138184, 13.311539649963379, 13.588777542114258, 13.866016387939453, 14.143255233764648, 14.420494079589844, 14.697732925415039]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 6.0, 12.0, 11.0, 8.0, 21.0, 30.0, 30.0, 26.0, 31.0, 40.0, 39.0, 41.0, 31.0, 37.0, 44.0, 50.0, 46.0, 49.0, 44.0, 39.0, 52.0, 41.0, 41.0, 36.0, 31.0, 34.0, 20.0, 22.0, 15.0, 16.0, 17.0, 6.0, 4.0, 4.0, 6.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.479503631591797, -2.396390914916992, -2.3132781982421875, -2.230165481567383, -2.147052764892578, -2.0639400482177734, -1.9808273315429688, -1.897714614868164, -1.8146018981933594, -1.7314891815185547, -1.64837646484375, -1.5652637481689453, -1.4821510314941406, -1.399038314819336, -1.3159255981445312, -1.2328128814697266, -1.1497001647949219, -1.0665874481201172, -0.9834747314453125, -0.9003620147705078, -0.8172492980957031, -0.7341365814208984, -0.6510238647460938, -0.5679111480712891, -0.4847984313964844, -0.4016857147216797, -0.318572998046875, -0.2354602813720703, -0.15234756469726562, -0.06923484802246094, 0.01387786865234375, 0.09699058532714844, 0.18010330200195312, 0.2632160186767578, 0.3463287353515625, 0.4294414520263672, 0.5125541687011719, 0.5956668853759766, 0.6787796020507812, 0.7618923187255859, 0.8450050354003906, 0.9281177520751953, 1.01123046875, 1.0943431854248047, 1.1774559020996094, 1.260568618774414, 1.3436813354492188, 1.4267940521240234, 1.5099067687988281, 1.5930194854736328, 1.6761322021484375, 1.7592449188232422, 1.8423576354980469, 1.9254703521728516, 2.0085830688476562, 2.091695785522461, 2.1748085021972656, 2.2579212188720703, 2.341033935546875, 2.4241466522216797, 2.5072593688964844, 2.590372085571289, 2.6734848022460938, 2.7565975189208984, 2.839710235595703]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 3.0, 5.0, 9.0, 19.0, 18.0, 26.0, 28.0, 35.0, 58.0, 80.0, 113.0, 239.0, 425.0, 814.0, 1987.0, 5028.0, 17814.0, 97891.0, 1240326.0, 2596762.0, 191418.0, 28820.0, 7412.0, 2645.0, 1057.0, 513.0, 251.0, 172.0, 92.0, 55.0, 43.0, 23.0, 18.0, 9.0, 16.0, 9.0, 13.0, 5.0, 6.0, 3.0, 7.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.6455078125, -1.594329833984375, -1.54315185546875, -1.491973876953125, -1.4407958984375, -1.389617919921875, -1.33843994140625, -1.287261962890625, -1.236083984375, -1.184906005859375, -1.13372802734375, -1.082550048828125, -1.0313720703125, -0.980194091796875, -0.92901611328125, -0.877838134765625, -0.82666015625, -0.775482177734375, -0.72430419921875, -0.673126220703125, -0.6219482421875, -0.570770263671875, -0.51959228515625, -0.468414306640625, -0.417236328125, -0.366058349609375, -0.31488037109375, -0.263702392578125, -0.2125244140625, -0.161346435546875, -0.11016845703125, -0.058990478515625, -0.0078125, 0.043365478515625, 0.09454345703125, 0.145721435546875, 0.1968994140625, 0.248077392578125, 0.29925537109375, 0.350433349609375, 0.401611328125, 0.452789306640625, 0.50396728515625, 0.555145263671875, 0.6063232421875, 0.657501220703125, 0.70867919921875, 0.759857177734375, 0.81103515625, 0.862213134765625, 0.91339111328125, 0.964569091796875, 1.0157470703125, 1.066925048828125, 1.11810302734375, 1.169281005859375, 1.220458984375, 1.271636962890625, 1.32281494140625, 1.373992919921875, 1.4251708984375, 1.476348876953125, 1.52752685546875, 1.578704833984375, 1.6298828125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 9.0, 6.0, 10.0, 12.0, 13.0, 11.0, 10.0, 22.0, 22.0, 19.0, 30.0, 31.0, 46.0, 34.0, 50.0, 57.0, 50.0, 56.0, 57.0, 55.0, 38.0, 48.0, 28.0, 34.0, 45.0, 38.0, 24.0, 27.0, 19.0, 21.0, 14.0, 12.0, 9.0, 7.0, 3.0, 10.0, 4.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87890625, -0.8531646728515625, -0.827423095703125, -0.8016815185546875, -0.77593994140625, -0.7501983642578125, -0.724456787109375, -0.6987152099609375, -0.6729736328125, -0.6472320556640625, -0.621490478515625, -0.5957489013671875, -0.57000732421875, -0.5442657470703125, -0.518524169921875, -0.4927825927734375, -0.467041015625, -0.4412994384765625, -0.415557861328125, -0.3898162841796875, -0.36407470703125, -0.3383331298828125, -0.312591552734375, -0.2868499755859375, -0.2611083984375, -0.2353668212890625, -0.209625244140625, -0.1838836669921875, -0.15814208984375, -0.1324005126953125, -0.106658935546875, -0.0809173583984375, -0.05517578125, -0.0294342041015625, -0.003692626953125, 0.0220489501953125, 0.04779052734375, 0.0735321044921875, 0.099273681640625, 0.1250152587890625, 0.1507568359375, 0.1764984130859375, 0.202239990234375, 0.2279815673828125, 0.25372314453125, 0.2794647216796875, 0.305206298828125, 0.3309478759765625, 0.356689453125, 0.3824310302734375, 0.408172607421875, 0.4339141845703125, 0.45965576171875, 0.4853973388671875, 0.511138916015625, 0.5368804931640625, 0.5626220703125, 0.5883636474609375, 0.614105224609375, 0.6398468017578125, 0.66558837890625, 0.6913299560546875, 0.717071533203125, 0.7428131103515625, 0.7685546875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 9.0, 14.0, 12.0, 57.0, 124.0, 333.0, 2187.0, 2320971.0, 1868054.0, 2018.0, 305.0, 90.0, 38.0, 14.0, 11.0, 7.0, 6.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4609375, -8.24395751953125, -8.0269775390625, -7.80999755859375, -7.593017578125, -7.37603759765625, -7.1590576171875, -6.94207763671875, -6.72509765625, -6.50811767578125, -6.2911376953125, -6.07415771484375, -5.857177734375, -5.64019775390625, -5.4232177734375, -5.20623779296875, -4.9892578125, -4.77227783203125, -4.5552978515625, -4.33831787109375, -4.121337890625, -3.90435791015625, -3.6873779296875, -3.47039794921875, -3.25341796875, -3.03643798828125, -2.8194580078125, -2.60247802734375, -2.385498046875, -2.16851806640625, -1.9515380859375, -1.73455810546875, -1.517578125, -1.30059814453125, -1.0836181640625, -0.86663818359375, -0.649658203125, -0.43267822265625, -0.2156982421875, 0.00128173828125, 0.21826171875, 0.43524169921875, 0.6522216796875, 0.86920166015625, 1.086181640625, 1.30316162109375, 1.5201416015625, 1.73712158203125, 1.9541015625, 2.17108154296875, 2.3880615234375, 2.60504150390625, 2.822021484375, 3.03900146484375, 3.2559814453125, 3.47296142578125, 3.68994140625, 3.90692138671875, 4.1239013671875, 4.34088134765625, 4.557861328125, 4.77484130859375, 4.9918212890625, 5.20880126953125, 5.42578125]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 6.0, 10.0, 9.0, 20.0, 24.0, 51.0, 70.0, 133.0, 163.0, 297.0, 525.0, 968.0, 714.0, 432.0, 273.0, 146.0, 78.0, 58.0, 28.0, 25.0, 14.0, 7.0, 8.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.483154296875, -0.4674339294433594, -0.45171356201171875, -0.4359931945800781, -0.4202728271484375, -0.4045524597167969, -0.38883209228515625, -0.3731117248535156, -0.357391357421875, -0.3416709899902344, -0.32595062255859375, -0.3102302551269531, -0.2945098876953125, -0.2787895202636719, -0.26306915283203125, -0.24734878540039062, -0.23162841796875, -0.21590805053710938, -0.20018768310546875, -0.18446731567382812, -0.1687469482421875, -0.15302658081054688, -0.13730621337890625, -0.12158584594726562, -0.105865478515625, -0.09014511108398438, -0.07442474365234375, -0.058704376220703125, -0.0429840087890625, -0.027263641357421875, -0.01154327392578125, 0.004177093505859375, 0.0198974609375, 0.035617828369140625, 0.05133819580078125, 0.06705856323242188, 0.0827789306640625, 0.09849929809570312, 0.11421966552734375, 0.12994003295898438, 0.145660400390625, 0.16138076782226562, 0.17710113525390625, 0.19282150268554688, 0.2085418701171875, 0.22426223754882812, 0.23998260498046875, 0.2557029724121094, 0.27142333984375, 0.2871437072753906, 0.30286407470703125, 0.3185844421386719, 0.3343048095703125, 0.3500251770019531, 0.36574554443359375, 0.3814659118652344, 0.397186279296875, 0.4129066467285156, 0.42862701416015625, 0.4443473815917969, 0.4600677490234375, 0.4757881164550781, 0.49150848388671875, 0.5072288513183594, 0.52294921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 10.0, 8.0, 23.0, 29.0, 48.0, 73.0, 80.0, 125.0, 142.0, 134.0, 113.0, 66.0, 54.0, 23.0, 20.0, 21.0, 8.0, 11.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.304504871368408, -2.238032579421997, -2.171560287475586, -2.105087995529175, -2.0386157035827637, -1.972143530845642, -1.905671238899231, -1.8391989469528198, -1.7727267742156982, -1.706254482269287, -1.639782190322876, -1.5733098983764648, -1.5068377256393433, -1.4403654336929321, -1.373893141746521, -1.3074208498001099, -1.2409485578536987, -1.1744762659072876, -1.1080039739608765, -1.0415318012237549, -0.9750595092773438, -0.9085872173309326, -0.8421149253845215, -0.7756426334381104, -0.709170401096344, -0.6426981091499329, -0.5762258768081665, -0.5097535848617554, -0.4432813227176666, -0.3768090605735779, -0.31033676862716675, -0.243864506483078, -0.17739224433898926, -0.11091997474431992, -0.044447705149650574, 0.022024571895599365, 0.08849683403968811, 0.15496909618377686, 0.221441388130188, 0.28791365027427673, 0.3543859124183655, 0.4208581745624542, 0.48733043670654297, 0.5538027286529541, 0.6202750205993652, 0.6867472529411316, 0.7532195448875427, 0.8196917772293091, 0.8861640691757202, 0.9526363611221313, 1.0191086530685425, 1.085580825805664, 1.1520531177520752, 1.2185254096984863, 1.2849977016448975, 1.3514699935913086, 1.4179422855377197, 1.4844145774841309, 1.550886869430542, 1.6173591613769531, 1.6838313341140747, 1.7503036260604858, 1.816775918006897, 1.883248209953308, 1.9497203826904297]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 8.0, 3.0, 12.0, 10.0, 7.0, 8.0, 17.0, 11.0, 12.0, 22.0, 32.0, 23.0, 25.0, 35.0, 38.0, 33.0, 38.0, 37.0, 43.0, 43.0, 36.0, 49.0, 39.0, 39.0, 37.0, 48.0, 40.0, 41.0, 29.0, 35.0, 30.0, 20.0, 17.0, 9.0, 10.0, 6.0, 17.0, 11.0, 8.0, 4.0, 2.0, 4.0, 6.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7993125319480896, -0.7729784846305847, -0.7466443777084351, -0.7203103303909302, -0.6939762830734253, -0.6676422357559204, -0.6413081288337708, -0.6149740815162659, -0.588640034198761, -0.5623059868812561, -0.5359718799591064, -0.5096378326416016, -0.4833037853240967, -0.4569697082042694, -0.43063563108444214, -0.40430158376693726, -0.37796750664711, -0.3516334295272827, -0.32529938220977783, -0.29896530508995056, -0.2726312577724457, -0.2462971806526184, -0.21996311843395233, -0.19362905621528625, -0.16729499399662018, -0.1409609317779541, -0.11462686955928802, -0.08829279989004135, -0.061958737671375275, -0.0356246680021286, -0.009290605783462524, 0.017043456435203552, 0.04337751865386963, 0.0697115808725357, 0.09604564309120178, 0.12237971276044846, 0.14871376752853394, 0.1750478446483612, 0.20138190686702728, 0.22771596908569336, 0.25405001640319824, 0.2803840935230255, 0.3067181408405304, 0.33305221796035767, 0.35938626527786255, 0.3857203423976898, 0.4120544195175171, 0.438388466835022, 0.46472254395484924, 0.4910566210746765, 0.5173906683921814, 0.5437247157096863, 0.5700588226318359, 0.5963928699493408, 0.6227269172668457, 0.6490609645843506, 0.6753950715065002, 0.7017291188240051, 0.7280632257461548, 0.7543972730636597, 0.7807313203811646, 0.8070653676986694, 0.8333994746208191, 0.859733521938324, 0.8860675692558289]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 3.0, 7.0, 12.0, 15.0, 17.0, 31.0, 55.0, 133.0, 254.0, 716.0, 2304.0, 9024.0, 47473.0, 389196.0, 518046.0, 65426.0, 11561.0, 2783.0, 867.0, 308.0, 146.0, 65.0, 37.0, 32.0, 15.0, 10.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.8798828125, -0.8561553955078125, -0.832427978515625, -0.8087005615234375, -0.78497314453125, -0.7612457275390625, -0.737518310546875, -0.7137908935546875, -0.6900634765625, -0.6663360595703125, -0.642608642578125, -0.6188812255859375, -0.59515380859375, -0.5714263916015625, -0.547698974609375, -0.5239715576171875, -0.500244140625, -0.4765167236328125, -0.452789306640625, -0.4290618896484375, -0.40533447265625, -0.3816070556640625, -0.357879638671875, -0.3341522216796875, -0.3104248046875, -0.2866973876953125, -0.262969970703125, -0.2392425537109375, -0.21551513671875, -0.1917877197265625, -0.168060302734375, -0.1443328857421875, -0.12060546875, -0.0968780517578125, -0.073150634765625, -0.0494232177734375, -0.02569580078125, -0.0019683837890625, 0.021759033203125, 0.0454864501953125, 0.0692138671875, 0.0929412841796875, 0.116668701171875, 0.1403961181640625, 0.16412353515625, 0.1878509521484375, 0.211578369140625, 0.2353057861328125, 0.259033203125, 0.2827606201171875, 0.306488037109375, 0.3302154541015625, 0.35394287109375, 0.3776702880859375, 0.401397705078125, 0.4251251220703125, 0.4488525390625, 0.4725799560546875, 0.496307373046875, 0.5200347900390625, 0.54376220703125, 0.5674896240234375, 0.591217041015625, 0.6149444580078125, 0.638671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 16.0, 25.0, 29.0, 58.0, 60.0, 80.0, 96.0, 116.0, 106.0, 91.0, 93.0, 75.0, 57.0, 31.0, 27.0, 14.0, 9.0, 8.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6484375, -0.6082763671875, -0.568115234375, -0.5279541015625, -0.48779296875, -0.4476318359375, -0.407470703125, -0.3673095703125, -0.3271484375, -0.2869873046875, -0.246826171875, -0.2066650390625, -0.16650390625, -0.1263427734375, -0.086181640625, -0.0460205078125, -0.005859375, 0.0343017578125, 0.074462890625, 0.1146240234375, 0.15478515625, 0.1949462890625, 0.235107421875, 0.2752685546875, 0.3154296875, 0.3555908203125, 0.395751953125, 0.4359130859375, 0.47607421875, 0.5162353515625, 0.556396484375, 0.5965576171875, 0.63671875, 0.6768798828125, 0.717041015625, 0.7572021484375, 0.79736328125, 0.8375244140625, 0.877685546875, 0.9178466796875, 0.9580078125, 0.9981689453125, 1.038330078125, 1.0784912109375, 1.11865234375, 1.1588134765625, 1.198974609375, 1.2391357421875, 1.279296875, 1.3194580078125, 1.359619140625, 1.3997802734375, 1.43994140625, 1.4801025390625, 1.520263671875, 1.5604248046875, 1.6005859375, 1.6407470703125, 1.680908203125, 1.7210693359375, 1.76123046875, 1.8013916015625, 1.841552734375, 1.8817138671875, 1.921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 6.0, 3.0, 3.0, 2.0, 13.0, 10.0, 16.0, 26.0, 42.0, 37.0, 44.0, 69.0, 148.0, 211.0, 372.0, 627.0, 1190.0, 2568.0, 6379.0, 19377.0, 77700.0, 386217.0, 428795.0, 89569.0, 21929.0, 7155.0, 3004.0, 1340.0, 674.0, 358.0, 220.0, 144.0, 87.0, 57.0, 44.0, 35.0, 22.0, 11.0, 12.0, 14.0, 9.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.40087890625, -0.3887481689453125, -0.376617431640625, -0.3644866943359375, -0.35235595703125, -0.3402252197265625, -0.328094482421875, -0.3159637451171875, -0.3038330078125, -0.2917022705078125, -0.279571533203125, -0.2674407958984375, -0.25531005859375, -0.2431793212890625, -0.231048583984375, -0.2189178466796875, -0.206787109375, -0.1946563720703125, -0.182525634765625, -0.1703948974609375, -0.15826416015625, -0.1461334228515625, -0.134002685546875, -0.1218719482421875, -0.1097412109375, -0.0976104736328125, -0.085479736328125, -0.0733489990234375, -0.06121826171875, -0.0490875244140625, -0.036956787109375, -0.0248260498046875, -0.0126953125, -0.0005645751953125, 0.011566162109375, 0.0236968994140625, 0.03582763671875, 0.0479583740234375, 0.060089111328125, 0.0722198486328125, 0.0843505859375, 0.0964813232421875, 0.108612060546875, 0.1207427978515625, 0.13287353515625, 0.1450042724609375, 0.157135009765625, 0.1692657470703125, 0.181396484375, 0.1935272216796875, 0.205657958984375, 0.2177886962890625, 0.22991943359375, 0.2420501708984375, 0.254180908203125, 0.2663116455078125, 0.2784423828125, 0.2905731201171875, 0.302703857421875, 0.3148345947265625, 0.32696533203125, 0.3390960693359375, 0.351226806640625, 0.3633575439453125, 0.37548828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 7.0, 5.0, 6.0, 9.0, 8.0, 11.0, 19.0, 29.0, 25.0, 23.0, 24.0, 35.0, 36.0, 27.0, 40.0, 40.0, 37.0, 56.0, 45.0, 45.0, 46.0, 49.0, 37.0, 41.0, 39.0, 36.0, 28.0, 26.0, 22.0, 22.0, 23.0, 18.0, 18.0, 18.0, 9.0, 7.0, 4.0, 7.0, 8.0, 6.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.052734375, -1.0214614868164062, -0.9901885986328125, -0.9589157104492188, -0.927642822265625, -0.8963699340820312, -0.8650970458984375, -0.8338241577148438, -0.80255126953125, -0.7712783813476562, -0.7400054931640625, -0.7087326049804688, -0.677459716796875, -0.6461868286132812, -0.6149139404296875, -0.5836410522460938, -0.5523681640625, -0.5210952758789062, -0.4898223876953125, -0.45854949951171875, -0.427276611328125, -0.39600372314453125, -0.3647308349609375, -0.33345794677734375, -0.30218505859375, -0.27091217041015625, -0.2396392822265625, -0.20836639404296875, -0.177093505859375, -0.14582061767578125, -0.1145477294921875, -0.08327484130859375, -0.052001953125, -0.02072906494140625, 0.0105438232421875, 0.04181671142578125, 0.073089599609375, 0.10436248779296875, 0.1356353759765625, 0.16690826416015625, 0.19818115234375, 0.22945404052734375, 0.2607269287109375, 0.29199981689453125, 0.323272705078125, 0.35454559326171875, 0.3858184814453125, 0.41709136962890625, 0.4483642578125, 0.47963714599609375, 0.5109100341796875, 0.5421829223632812, 0.573455810546875, 0.6047286987304688, 0.6360015869140625, 0.6672744750976562, 0.69854736328125, 0.7298202514648438, 0.7610931396484375, 0.7923660278320312, 0.823638916015625, 0.8549118041992188, 0.8861846923828125, 0.9174575805664062, 0.94873046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 8.0, 8.0, 17.0, 25.0, 49.0, 60.0, 104.0, 203.0, 353.0, 700.0, 1621.0, 4773.0, 17321.0, 102348.0, 658973.0, 220144.0, 30254.0, 7266.0, 2342.0, 948.0, 452.0, 229.0, 114.0, 81.0, 48.0, 26.0, 23.0, 15.0, 16.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.197998046875, -0.19057464599609375, -0.1831512451171875, -0.17572784423828125, -0.168304443359375, -0.16088104248046875, -0.1534576416015625, -0.14603424072265625, -0.13861083984375, -0.13118743896484375, -0.1237640380859375, -0.11634063720703125, -0.108917236328125, -0.10149383544921875, -0.0940704345703125, -0.08664703369140625, -0.0792236328125, -0.07180023193359375, -0.0643768310546875, -0.05695343017578125, -0.049530029296875, -0.04210662841796875, -0.0346832275390625, -0.02725982666015625, -0.01983642578125, -0.01241302490234375, -0.0049896240234375, 0.00243377685546875, 0.009857177734375, 0.01728057861328125, 0.0247039794921875, 0.03212738037109375, 0.03955078125, 0.04697418212890625, 0.0543975830078125, 0.06182098388671875, 0.069244384765625, 0.07666778564453125, 0.0840911865234375, 0.09151458740234375, 0.09893798828125, 0.10636138916015625, 0.1137847900390625, 0.12120819091796875, 0.128631591796875, 0.13605499267578125, 0.1434783935546875, 0.15090179443359375, 0.1583251953125, 0.16574859619140625, 0.1731719970703125, 0.18059539794921875, 0.188018798828125, 0.19544219970703125, 0.2028656005859375, 0.21028900146484375, 0.21771240234375, 0.22513580322265625, 0.2325592041015625, 0.23998260498046875, 0.247406005859375, 0.25482940673828125, 0.2622528076171875, 0.26967620849609375, 0.277099609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 11.0, 14.0, 16.0, 25.0, 21.0, 27.0, 37.0, 44.0, 57.0, 77.0, 103.0, 95.0, 96.0, 85.0, 66.0, 50.0, 30.0, 36.0, 25.0, 15.0, 14.0, 6.0, 5.0, 6.0, 10.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.322166442871094e-05, -9.017251431941986e-05, -8.712336421012878e-05, -8.407421410083771e-05, -8.102506399154663e-05, -7.797591388225555e-05, -7.492676377296448e-05, -7.18776136636734e-05, -6.882846355438232e-05, -6.577931344509125e-05, -6.273016333580017e-05, -5.9681013226509094e-05, -5.663186311721802e-05, -5.358271300792694e-05, -5.0533562898635864e-05, -4.748441278934479e-05, -4.443526268005371e-05, -4.1386112570762634e-05, -3.833696246147156e-05, -3.528781235218048e-05, -3.2238662242889404e-05, -2.9189512133598328e-05, -2.614036202430725e-05, -2.3091211915016174e-05, -2.0042061805725098e-05, -1.699291169643402e-05, -1.3943761587142944e-05, -1.0894611477851868e-05, -7.845461368560791e-06, -4.796311259269714e-06, -1.7471611499786377e-06, 1.301988959312439e-06, 4.351139068603516e-06, 7.400289177894592e-06, 1.0449439287185669e-05, 1.3498589396476746e-05, 1.6547739505767822e-05, 1.95968896150589e-05, 2.2646039724349976e-05, 2.5695189833641052e-05, 2.874433994293213e-05, 3.1793490052223206e-05, 3.484264016151428e-05, 3.789179027080536e-05, 4.0940940380096436e-05, 4.399009048938751e-05, 4.703924059867859e-05, 5.0088390707969666e-05, 5.313754081726074e-05, 5.618669092655182e-05, 5.9235841035842896e-05, 6.228499114513397e-05, 6.533414125442505e-05, 6.838329136371613e-05, 7.14324414730072e-05, 7.448159158229828e-05, 7.753074169158936e-05, 8.057989180088043e-05, 8.362904191017151e-05, 8.667819201946259e-05, 8.972734212875366e-05, 9.277649223804474e-05, 9.582564234733582e-05, 9.887479245662689e-05, 0.00010192394256591797]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 3.0, 7.0, 9.0, 19.0, 21.0, 30.0, 36.0, 65.0, 98.0, 158.0, 244.0, 451.0, 813.0, 1530.0, 3332.0, 7646.0, 19743.0, 62244.0, 226705.0, 468977.0, 177695.0, 49829.0, 16508.0, 6474.0, 2810.0, 1363.0, 698.0, 394.0, 227.0, 143.0, 105.0, 50.0, 39.0, 28.0, 25.0, 12.0, 6.0, 6.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169921875, -0.16467857360839844, -0.15943527221679688, -0.1541919708251953, -0.14894866943359375, -0.1437053680419922, -0.13846206665039062, -0.13321876525878906, -0.1279754638671875, -0.12273216247558594, -0.11748886108398438, -0.11224555969238281, -0.10700225830078125, -0.10175895690917969, -0.09651565551757812, -0.09127235412597656, -0.086029052734375, -0.08078575134277344, -0.07554244995117188, -0.07029914855957031, -0.06505584716796875, -0.05981254577636719, -0.054569244384765625, -0.04932594299316406, -0.0440826416015625, -0.03883934020996094, -0.033596038818359375, -0.028352737426757812, -0.02310943603515625, -0.017866134643554688, -0.012622833251953125, -0.0073795318603515625, -0.00213623046875, 0.0031070709228515625, 0.008350372314453125, 0.013593673706054688, 0.01883697509765625, 0.024080276489257812, 0.029323577880859375, 0.03456687927246094, 0.0398101806640625, 0.04505348205566406, 0.050296783447265625, 0.05554008483886719, 0.06078338623046875, 0.06602668762207031, 0.07126998901367188, 0.07651329040527344, 0.081756591796875, 0.08699989318847656, 0.09224319458007812, 0.09748649597167969, 0.10272979736328125, 0.10797309875488281, 0.11321640014648438, 0.11845970153808594, 0.1237030029296875, 0.12894630432128906, 0.13418960571289062, 0.1394329071044922, 0.14467620849609375, 0.1499195098876953, 0.15516281127929688, 0.16040611267089844, 0.1656494140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 10.0, 6.0, 11.0, 10.0, 10.0, 22.0, 21.0, 32.0, 32.0, 55.0, 51.0, 70.0, 85.0, 79.0, 97.0, 77.0, 52.0, 57.0, 35.0, 31.0, 41.0, 18.0, 18.0, 16.0, 11.0, 10.0, 8.0, 5.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040069580078125, -0.038767337799072266, -0.03746509552001953, -0.0361628532409668, -0.03486061096191406, -0.03355836868286133, -0.032256126403808594, -0.03095388412475586, -0.029651641845703125, -0.02834939956665039, -0.027047157287597656, -0.025744915008544922, -0.024442672729492188, -0.023140430450439453, -0.02183818817138672, -0.020535945892333984, -0.01923370361328125, -0.017931461334228516, -0.01662921905517578, -0.015326976776123047, -0.014024734497070312, -0.012722492218017578, -0.011420249938964844, -0.01011800765991211, -0.008815765380859375, -0.007513523101806641, -0.006211280822753906, -0.004909038543701172, -0.0036067962646484375, -0.002304553985595703, -0.0010023117065429688, 0.0002999305725097656, 0.0016021728515625, 0.0029044151306152344, 0.004206657409667969, 0.005508899688720703, 0.0068111419677734375, 0.008113384246826172, 0.009415626525878906, 0.01071786880493164, 0.012020111083984375, 0.01332235336303711, 0.014624595642089844, 0.015926837921142578, 0.017229080200195312, 0.018531322479248047, 0.01983356475830078, 0.021135807037353516, 0.02243804931640625, 0.023740291595458984, 0.02504253387451172, 0.026344776153564453, 0.027647018432617188, 0.028949260711669922, 0.030251502990722656, 0.03155374526977539, 0.032855987548828125, 0.03415822982788086, 0.035460472106933594, 0.03676271438598633, 0.03806495666503906, 0.0393671989440918, 0.04066944122314453, 0.041971683502197266, 0.04327392578125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 10.0, 16.0, 25.0, 55.0, 86.0, 132.0, 192.0, 181.0, 123.0, 73.0, 45.0, 25.0, 13.0, 10.0, 10.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5391407012939453, -1.4858746528625488, -1.4326084852218628, -1.3793424367904663, -1.3260763883590698, -1.2728102207183838, -1.2195441722869873, -1.1662781238555908, -1.1130120754241943, -1.0597460269927979, -1.0064798593521118, -0.9532138109207153, -0.8999477624893188, -0.8466816544532776, -0.7934155464172363, -0.7401494979858398, -0.6868833303451538, -0.6336172223091125, -0.5803511738777161, -0.5270850658416748, -0.47381898760795593, -0.42055290937423706, -0.3672868013381958, -0.31402072310447693, -0.26075464487075806, -0.20748856663703918, -0.15422247350215912, -0.10095638036727905, -0.04769030213356018, 0.005575776100158691, 0.05884188413619995, 0.11210796236991882, 0.16537415981292725, 0.21864023804664612, 0.271906316280365, 0.32517242431640625, 0.3784385025501251, 0.431704580783844, 0.48497068881988525, 0.5382367372512817, 0.591502845287323, 0.6447689533233643, 0.6980350017547607, 0.751301109790802, 0.8045672178268433, 0.8578332662582397, 0.911099374294281, 0.9643654823303223, 1.0176315307617188, 1.0708975791931152, 1.1241637468338013, 1.1774297952651978, 1.2306958436965942, 1.2839620113372803, 1.3372280597686768, 1.3904941082000732, 1.4437601566314697, 1.4970262050628662, 1.5502923727035522, 1.6035584211349487, 1.6568244695663452, 1.7100906372070312, 1.7633566856384277, 1.8166227340698242, 1.8698889017105103]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 7.0, 3.0, 7.0, 15.0, 16.0, 23.0, 34.0, 33.0, 47.0, 70.0, 73.0, 79.0, 86.0, 92.0, 81.0, 82.0, 69.0, 51.0, 45.0, 26.0, 24.0, 17.0, 11.0, 6.0, 7.0, 5.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5590842366218567, -0.5281316637992859, -0.4971791207790375, -0.46622657775878906, -0.43527400493621826, -0.40432143211364746, -0.37336888909339905, -0.34241634607315063, -0.31146377325057983, -0.28051120042800903, -0.24955865740776062, -0.218606099486351, -0.1876535415649414, -0.1567009836435318, -0.1257484257221222, -0.09479586780071259, -0.06384330987930298, -0.03289075195789337, -0.0019381940364837646, 0.029014363884925842, 0.05996692180633545, 0.09091947972774506, 0.12187203764915466, 0.15282459557056427, 0.18377715349197388, 0.21472971141338348, 0.2456822693347931, 0.2766348123550415, 0.3075873851776123, 0.3385399580001831, 0.3694925010204315, 0.40044504404067993, 0.4313976764678955, 0.4623502492904663, 0.4933027923107147, 0.5242553353309631, 0.5552079081535339, 0.5861604809761047, 0.6171129941940308, 0.6480655670166016, 0.6790181398391724, 0.7099707126617432, 0.740923285484314, 0.77187579870224, 0.8028283715248108, 0.8337809443473816, 0.8647334575653076, 0.8956860303878784, 0.9266386032104492, 0.95759117603302, 0.9885437488555908, 1.0194963216781616, 1.0504488945007324, 1.0814013481140137, 1.1123539209365845, 1.1433064937591553, 1.174259066581726, 1.2052116394042969, 1.2361642122268677, 1.2671167850494385, 1.2980692386627197, 1.3290218114852905, 1.3599743843078613, 1.3909269571304321, 1.421879529953003]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 5.0, 6.0, 7.0, 13.0, 23.0, 20.0, 45.0, 68.0, 100.0, 155.0, 317.0, 586.0, 1156.0, 2518.0, 5950.0, 15053.0, 44390.0, 159425.0, 479333.0, 240627.0, 64245.0, 20609.0, 7689.0, 3138.0, 1421.0, 758.0, 359.0, 205.0, 122.0, 67.0, 44.0, 29.0, 19.0, 15.0, 11.0, 3.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-0.9140625, -0.8891220092773438, -0.8641815185546875, -0.8392410278320312, -0.814300537109375, -0.7893600463867188, -0.7644195556640625, -0.7394790649414062, -0.71453857421875, -0.6895980834960938, -0.6646575927734375, -0.6397171020507812, -0.614776611328125, -0.5898361206054688, -0.5648956298828125, -0.5399551391601562, -0.5150146484375, -0.49007415771484375, -0.4651336669921875, -0.44019317626953125, -0.415252685546875, -0.39031219482421875, -0.3653717041015625, -0.34043121337890625, -0.31549072265625, -0.29055023193359375, -0.2656097412109375, -0.24066925048828125, -0.215728759765625, -0.19078826904296875, -0.1658477783203125, -0.14090728759765625, -0.115966796875, -0.09102630615234375, -0.0660858154296875, -0.04114532470703125, -0.016204833984375, 0.00873565673828125, 0.0336761474609375, 0.05861663818359375, 0.08355712890625, 0.10849761962890625, 0.1334381103515625, 0.15837860107421875, 0.183319091796875, 0.20825958251953125, 0.2332000732421875, 0.25814056396484375, 0.2830810546875, 0.30802154541015625, 0.3329620361328125, 0.35790252685546875, 0.382843017578125, 0.40778350830078125, 0.4327239990234375, 0.45766448974609375, 0.48260498046875, 0.5075454711914062, 0.5324859619140625, 0.5574264526367188, 0.582366943359375, 0.6073074340820312, 0.6322479248046875, 0.6571884155273438, 0.68212890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 9.0, 8.0, 6.0, 13.0, 11.0, 16.0, 32.0, 26.0, 42.0, 56.0, 52.0, 65.0, 70.0, 65.0, 69.0, 71.0, 64.0, 65.0, 54.0, 53.0, 44.0, 33.0, 21.0, 8.0, 17.0, 6.0, 4.0, 6.0, 8.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0439453125, -0.9874725341796875, -0.930999755859375, -0.8745269775390625, -0.81805419921875, -0.7615814208984375, -0.705108642578125, -0.6486358642578125, -0.5921630859375, -0.5356903076171875, -0.479217529296875, -0.4227447509765625, -0.36627197265625, -0.3097991943359375, -0.253326416015625, -0.1968536376953125, -0.140380859375, -0.0839080810546875, -0.027435302734375, 0.0290374755859375, 0.08551025390625, 0.1419830322265625, 0.198455810546875, 0.2549285888671875, 0.3114013671875, 0.3678741455078125, 0.424346923828125, 0.4808197021484375, 0.53729248046875, 0.5937652587890625, 0.650238037109375, 0.7067108154296875, 0.76318359375, 0.8196563720703125, 0.876129150390625, 0.9326019287109375, 0.98907470703125, 1.0455474853515625, 1.102020263671875, 1.1584930419921875, 1.2149658203125, 1.2714385986328125, 1.327911376953125, 1.3843841552734375, 1.44085693359375, 1.4973297119140625, 1.553802490234375, 1.6102752685546875, 1.666748046875, 1.7232208251953125, 1.779693603515625, 1.8361663818359375, 1.89263916015625, 1.9491119384765625, 2.005584716796875, 2.0620574951171875, 2.1185302734375, 2.1750030517578125, 2.231475830078125, 2.2879486083984375, 2.34442138671875, 2.4008941650390625, 2.457366943359375, 2.5138397216796875, 2.5703125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 9.0, 3.0, 5.0, 5.0, 11.0, 15.0, 11.0, 12.0, 20.0, 25.0, 28.0, 30.0, 42.0, 22.0, 33.0, 45.0, 48.0, 70.0, 270.0, 8176.0, 1013953.0, 24816.0, 459.0, 73.0, 55.0, 41.0, 40.0, 35.0, 36.0, 27.0, 25.0, 16.0, 20.0, 14.0, 10.0, 8.0, 11.0, 7.0, 9.0, 4.0, 6.0, 1.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.35546875, -4.225830078125, -4.09619140625, -3.966552734375, -3.8369140625, -3.707275390625, -3.57763671875, -3.447998046875, -3.318359375, -3.188720703125, -3.05908203125, -2.929443359375, -2.7998046875, -2.670166015625, -2.54052734375, -2.410888671875, -2.28125, -2.151611328125, -2.02197265625, -1.892333984375, -1.7626953125, -1.633056640625, -1.50341796875, -1.373779296875, -1.244140625, -1.114501953125, -0.98486328125, -0.855224609375, -0.7255859375, -0.595947265625, -0.46630859375, -0.336669921875, -0.20703125, -0.077392578125, 0.05224609375, 0.181884765625, 0.3115234375, 0.441162109375, 0.57080078125, 0.700439453125, 0.830078125, 0.959716796875, 1.08935546875, 1.218994140625, 1.3486328125, 1.478271484375, 1.60791015625, 1.737548828125, 1.8671875, 1.996826171875, 2.12646484375, 2.256103515625, 2.3857421875, 2.515380859375, 2.64501953125, 2.774658203125, 2.904296875, 3.033935546875, 3.16357421875, 3.293212890625, 3.4228515625, 3.552490234375, 3.68212890625, 3.811767578125, 3.94140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 8.0, 3.0, 6.0, 11.0, 8.0, 15.0, 8.0, 21.0, 23.0, 26.0, 31.0, 32.0, 24.0, 34.0, 34.0, 39.0, 29.0, 40.0, 48.0, 39.0, 41.0, 39.0, 45.0, 42.0, 38.0, 44.0, 38.0, 25.0, 31.0, 28.0, 27.0, 24.0, 19.0, 13.0, 11.0, 13.0, 9.0, 9.0, 11.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.3408203125, -1.3018341064453125, -1.262847900390625, -1.2238616943359375, -1.18487548828125, -1.1458892822265625, -1.106903076171875, -1.0679168701171875, -1.0289306640625, -0.9899444580078125, -0.950958251953125, -0.9119720458984375, -0.87298583984375, -0.8339996337890625, -0.795013427734375, -0.7560272216796875, -0.717041015625, -0.6780548095703125, -0.639068603515625, -0.6000823974609375, -0.56109619140625, -0.5221099853515625, -0.483123779296875, -0.4441375732421875, -0.4051513671875, -0.3661651611328125, -0.327178955078125, -0.2881927490234375, -0.24920654296875, -0.2102203369140625, -0.171234130859375, -0.1322479248046875, -0.09326171875, -0.0542755126953125, -0.015289306640625, 0.0236968994140625, 0.06268310546875, 0.1016693115234375, 0.140655517578125, 0.1796417236328125, 0.2186279296875, 0.2576141357421875, 0.296600341796875, 0.3355865478515625, 0.37457275390625, 0.4135589599609375, 0.452545166015625, 0.4915313720703125, 0.530517578125, 0.5695037841796875, 0.608489990234375, 0.6474761962890625, 0.68646240234375, 0.7254486083984375, 0.764434814453125, 0.8034210205078125, 0.8424072265625, 0.8813934326171875, 0.920379638671875, 0.9593658447265625, 0.99835205078125, 1.0373382568359375, 1.076324462890625, 1.1153106689453125, 1.154296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 9.0, 6.0, 11.0, 12.0, 23.0, 22.0, 55.0, 90.0, 163.0, 372.0, 822.0, 2415.0, 7686.0, 36335.0, 286706.0, 610858.0, 82200.0, 14658.0, 3786.0, 1329.0, 499.0, 218.0, 105.0, 56.0, 37.0, 24.0, 17.0, 9.0, 7.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4853515625, -0.4723091125488281, -0.45926666259765625, -0.4462242126464844, -0.4331817626953125, -0.4201393127441406, -0.40709686279296875, -0.3940544128417969, -0.381011962890625, -0.3679695129394531, -0.35492706298828125, -0.3418846130371094, -0.3288421630859375, -0.3157997131347656, -0.30275726318359375, -0.2897148132324219, -0.27667236328125, -0.2636299133300781, -0.25058746337890625, -0.23754501342773438, -0.2245025634765625, -0.21146011352539062, -0.19841766357421875, -0.18537521362304688, -0.172332763671875, -0.15929031372070312, -0.14624786376953125, -0.13320541381835938, -0.1201629638671875, -0.10712051391601562, -0.09407806396484375, -0.08103561401367188, -0.0679931640625, -0.054950714111328125, -0.04190826416015625, -0.028865814208984375, -0.0158233642578125, -0.002780914306640625, 0.01026153564453125, 0.023303985595703125, 0.036346435546875, 0.049388885498046875, 0.06243133544921875, 0.07547378540039062, 0.0885162353515625, 0.10155868530273438, 0.11460113525390625, 0.12764358520507812, 0.14068603515625, 0.15372848510742188, 0.16677093505859375, 0.17981338500976562, 0.1928558349609375, 0.20589828491210938, 0.21894073486328125, 0.23198318481445312, 0.245025634765625, 0.2580680847167969, 0.27111053466796875, 0.2841529846191406, 0.2971954345703125, 0.3102378845214844, 0.32328033447265625, 0.3363227844238281, 0.349365234375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 5.0, 3.0, 6.0, 8.0, 12.0, 11.0, 24.0, 28.0, 42.0, 52.0, 60.0, 93.0, 103.0, 116.0, 112.0, 74.0, 46.0, 34.0, 39.0, 27.0, 16.0, 15.0, 13.0, 6.0, 10.0, 9.0, 7.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2869319915771484e-05, -5.1233917474746704e-05, -4.9598515033721924e-05, -4.7963112592697144e-05, -4.632771015167236e-05, -4.469230771064758e-05, -4.30569052696228e-05, -4.142150282859802e-05, -3.978610038757324e-05, -3.815069794654846e-05, -3.651529550552368e-05, -3.48798930644989e-05, -3.324449062347412e-05, -3.160908818244934e-05, -2.997368574142456e-05, -2.833828330039978e-05, -2.6702880859375e-05, -2.506747841835022e-05, -2.343207597732544e-05, -2.179667353630066e-05, -2.016127109527588e-05, -1.85258686542511e-05, -1.689046621322632e-05, -1.5255063772201538e-05, -1.3619661331176758e-05, -1.1984258890151978e-05, -1.0348856449127197e-05, -8.713454008102417e-06, -7.078051567077637e-06, -5.4426491260528564e-06, -3.807246685028076e-06, -2.171844244003296e-06, -5.364418029785156e-07, 1.0989606380462646e-06, 2.734363079071045e-06, 4.369765520095825e-06, 6.0051679611206055e-06, 7.640570402145386e-06, 9.275972843170166e-06, 1.0911375284194946e-05, 1.2546777725219727e-05, 1.4182180166244507e-05, 1.5817582607269287e-05, 1.7452985048294067e-05, 1.9088387489318848e-05, 2.0723789930343628e-05, 2.2359192371368408e-05, 2.399459481239319e-05, 2.562999725341797e-05, 2.726539969444275e-05, 2.890080213546753e-05, 3.053620457649231e-05, 3.217160701751709e-05, 3.380700945854187e-05, 3.544241189956665e-05, 3.707781434059143e-05, 3.871321678161621e-05, 4.034861922264099e-05, 4.198402166366577e-05, 4.361942410469055e-05, 4.525482654571533e-05, 4.689022898674011e-05, 4.852563142776489e-05, 5.016103386878967e-05, 5.179643630981445e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 10.0, 17.0, 37.0, 64.0, 114.0, 236.0, 584.0, 1455.0, 4921.0, 20978.0, 137670.0, 688680.0, 161962.0, 23499.0, 5428.0, 1683.0, 642.0, 261.0, 124.0, 73.0, 32.0, 22.0, 15.0, 15.0, 3.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43701171875, -0.4243583679199219, -0.41170501708984375, -0.3990516662597656, -0.3863983154296875, -0.3737449645996094, -0.36109161376953125, -0.3484382629394531, -0.335784912109375, -0.3231315612792969, -0.31047821044921875, -0.2978248596191406, -0.2851715087890625, -0.2725181579589844, -0.25986480712890625, -0.24721145629882812, -0.23455810546875, -0.22190475463867188, -0.20925140380859375, -0.19659805297851562, -0.1839447021484375, -0.17129135131835938, -0.15863800048828125, -0.14598464965820312, -0.133331298828125, -0.12067794799804688, -0.10802459716796875, -0.09537124633789062, -0.0827178955078125, -0.07006454467773438, -0.05741119384765625, -0.044757843017578125, -0.0321044921875, -0.019451141357421875, -0.00679779052734375, 0.005855560302734375, 0.0185089111328125, 0.031162261962890625, 0.04381561279296875, 0.056468963623046875, 0.069122314453125, 0.08177566528320312, 0.09442901611328125, 0.10708236694335938, 0.1197357177734375, 0.13238906860351562, 0.14504241943359375, 0.15769577026367188, 0.17034912109375, 0.18300247192382812, 0.19565582275390625, 0.20830917358398438, 0.2209625244140625, 0.23361587524414062, 0.24626922607421875, 0.2589225769042969, 0.271575927734375, 0.2842292785644531, 0.29688262939453125, 0.3095359802246094, 0.3221893310546875, 0.3348426818847656, 0.34749603271484375, 0.3601493835449219, 0.372802734375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 8.0, 8.0, 8.0, 17.0, 19.0, 14.0, 24.0, 39.0, 35.0, 41.0, 69.0, 76.0, 94.0, 82.0, 88.0, 76.0, 73.0, 44.0, 44.0, 25.0, 30.0, 20.0, 18.0, 12.0, 11.0, 6.0, 5.0, 7.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125732421875, -0.12132644653320312, -0.11692047119140625, -0.11251449584960938, -0.1081085205078125, -0.10370254516601562, -0.09929656982421875, -0.09489059448242188, -0.090484619140625, -0.08607864379882812, -0.08167266845703125, -0.07726669311523438, -0.0728607177734375, -0.06845474243164062, -0.06404876708984375, -0.059642791748046875, -0.05523681640625, -0.050830841064453125, -0.04642486572265625, -0.042018890380859375, -0.0376129150390625, -0.033206939697265625, -0.02880096435546875, -0.024394989013671875, -0.019989013671875, -0.015583038330078125, -0.01117706298828125, -0.006771087646484375, -0.0023651123046875, 0.002040863037109375, 0.00644683837890625, 0.010852813720703125, 0.0152587890625, 0.019664764404296875, 0.02407073974609375, 0.028476715087890625, 0.0328826904296875, 0.037288665771484375, 0.04169464111328125, 0.046100616455078125, 0.050506591796875, 0.054912567138671875, 0.05931854248046875, 0.06372451782226562, 0.0681304931640625, 0.07253646850585938, 0.07694244384765625, 0.08134841918945312, 0.08575439453125, 0.09016036987304688, 0.09456634521484375, 0.09897232055664062, 0.1033782958984375, 0.10778427124023438, 0.11219024658203125, 0.11659622192382812, 0.121002197265625, 0.12540817260742188, 0.12981414794921875, 0.13422012329101562, 0.1386260986328125, 0.14303207397460938, 0.14743804931640625, 0.15184402465820312, 0.15625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 12.0, 42.0, 184.0, 452.0, 235.0, 70.0, 13.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6620383262634277, -2.3855512142181396, -2.1090641021728516, -1.8325772285461426, -1.5560901165008545, -1.2796030044555664, -1.0031160116195679, -0.7266290187835693, -0.45014190673828125, -0.17365485429763794, 0.10283219814300537, 0.3793192505836487, 0.655806303024292, 0.9322934150695801, 1.2087804079055786, 1.4852674007415771, 1.7617545127868652, 2.0382416248321533, 2.3147287368774414, 2.5912156105041504, 2.8677027225494385, 3.1441898345947266, 3.4206767082214355, 3.6971638202667236, 3.9736509323120117, 4.250137805938721, 4.526625156402588, 4.803112030029297, 5.079599380493164, 5.356086254119873, 5.632573127746582, 5.909060478210449, 6.185546875, 6.462033748626709, 6.738521099090576, 7.015007972717285, 7.291495323181152, 7.567982196807861, 7.84446907043457, 8.120956420898438, 8.397443771362305, 8.673931121826172, 8.950417518615723, 9.22690486907959, 9.503392219543457, 9.779878616333008, 10.056365966796875, 10.332853317260742, 10.609339714050293, 10.88582706451416, 11.162313461303711, 11.438800811767578, 11.715288162231445, 11.991775512695312, 12.268261909484863, 12.54474925994873, 12.821235656738281, 13.097723007202148, 13.3742094039917, 13.650696754455566, 13.927184104919434, 14.203670501708984, 14.480157852172852, 14.756645202636719, 15.033132553100586]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 4.0, 5.0, 9.0, 8.0, 10.0, 11.0, 14.0, 22.0, 17.0, 28.0, 17.0, 30.0, 29.0, 44.0, 33.0, 35.0, 48.0, 51.0, 50.0, 53.0, 49.0, 50.0, 43.0, 46.0, 38.0, 42.0, 32.0, 29.0, 22.0, 18.0, 23.0, 17.0, 9.0, 16.0, 15.0, 10.0, 5.0, 6.0, 10.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8404380083084106, -1.7729066610336304, -1.70537531375885, -1.6378439664840698, -1.570312738418579, -1.5027813911437988, -1.4352500438690186, -1.3677186965942383, -1.300187349319458, -1.2326560020446777, -1.1651246547698975, -1.0975933074951172, -1.030061960220337, -0.9625306725502014, -0.8949993848800659, -0.8274680376052856, -0.7599366903305054, -0.6924053430557251, -0.6248739957809448, -0.5573427081108093, -0.48981136083602905, -0.4222800135612488, -0.3547486960887909, -0.287217378616333, -0.21968603134155273, -0.15215469896793365, -0.08462336659431458, -0.017092034220695496, 0.050439298152923584, 0.11797064542770386, 0.18550196290016174, 0.25303328037261963, 0.32056474685668945, 0.3880960941314697, 0.4556274116039276, 0.5231587290763855, 0.5906900763511658, 0.658221423625946, 0.7257527112960815, 0.7932840585708618, 0.8608154058456421, 0.9283467531204224, 0.9958781003952026, 1.063409447669983, 1.1309406757354736, 1.198472023010254, 1.2660033702850342, 1.3335347175598145, 1.4010660648345947, 1.468597412109375, 1.5361287593841553, 1.6036601066589355, 1.6711914539337158, 1.738722801208496, 1.8062540292739868, 1.873785376548767, 1.9413167238235474, 2.008847951889038, 2.0763792991638184, 2.1439106464385986, 2.211441993713379, 2.278973340988159, 2.3465046882629395, 2.4140360355377197, 2.4815673828125]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 20.0, 18.0, 14.0, 45.0, 68.0, 90.0, 127.0, 231.0, 434.0, 798.0, 1512.0, 3397.0, 8999.0, 28163.0, 126145.0, 848908.0, 2583456.0, 484240.0, 76305.0, 19230.0, 6500.0, 2657.0, 1223.0, 659.0, 412.0, 218.0, 143.0, 74.0, 68.0, 35.0, 29.0, 17.0, 11.0, 15.0, 2.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86669921875, -0.8325271606445312, -0.7983551025390625, -0.7641830444335938, -0.730010986328125, -0.6958389282226562, -0.6616668701171875, -0.6274948120117188, -0.59332275390625, -0.5591506958007812, -0.5249786376953125, -0.49080657958984375, -0.456634521484375, -0.42246246337890625, -0.3882904052734375, -0.35411834716796875, -0.3199462890625, -0.28577423095703125, -0.2516021728515625, -0.21743011474609375, -0.183258056640625, -0.14908599853515625, -0.1149139404296875, -0.08074188232421875, -0.04656982421875, -0.01239776611328125, 0.0217742919921875, 0.05594635009765625, 0.090118408203125, 0.12429046630859375, 0.1584625244140625, 0.19263458251953125, 0.226806640625, 0.26097869873046875, 0.2951507568359375, 0.32932281494140625, 0.363494873046875, 0.39766693115234375, 0.4318389892578125, 0.46601104736328125, 0.50018310546875, 0.5343551635742188, 0.5685272216796875, 0.6026992797851562, 0.636871337890625, 0.6710433959960938, 0.7052154541015625, 0.7393875122070312, 0.7735595703125, 0.8077316284179688, 0.8419036865234375, 0.8760757446289062, 0.910247802734375, 0.9444198608398438, 0.9785919189453125, 1.0127639770507812, 1.04693603515625, 1.0811080932617188, 1.1152801513671875, 1.1494522094726562, 1.183624267578125, 1.2177963256835938, 1.2519683837890625, 1.2861404418945312, 1.3203125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 11.0, 5.0, 18.0, 14.0, 20.0, 26.0, 24.0, 40.0, 35.0, 48.0, 53.0, 30.0, 49.0, 48.0, 54.0, 64.0, 74.0, 54.0, 49.0, 53.0, 34.0, 29.0, 35.0, 23.0, 20.0, 18.0, 9.0, 12.0, 10.0, 2.0, 8.0, 2.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80078125, -0.7739486694335938, -0.7471160888671875, -0.7202835083007812, -0.693450927734375, -0.6666183471679688, -0.6397857666015625, -0.6129531860351562, -0.58612060546875, -0.5592880249023438, -0.5324554443359375, -0.5056228637695312, -0.478790283203125, -0.45195770263671875, -0.4251251220703125, -0.39829254150390625, -0.3714599609375, -0.34462738037109375, -0.3177947998046875, -0.29096221923828125, -0.264129638671875, -0.23729705810546875, -0.2104644775390625, -0.18363189697265625, -0.15679931640625, -0.12996673583984375, -0.1031341552734375, -0.07630157470703125, -0.049468994140625, -0.02263641357421875, 0.0041961669921875, 0.03102874755859375, 0.057861328125, 0.08469390869140625, 0.1115264892578125, 0.13835906982421875, 0.165191650390625, 0.19202423095703125, 0.2188568115234375, 0.24568939208984375, 0.27252197265625, 0.29935455322265625, 0.3261871337890625, 0.35301971435546875, 0.379852294921875, 0.40668487548828125, 0.4335174560546875, 0.46035003662109375, 0.4871826171875, 0.5140151977539062, 0.5408477783203125, 0.5676803588867188, 0.594512939453125, 0.6213455200195312, 0.6481781005859375, 0.6750106811523438, 0.70184326171875, 0.7286758422851562, 0.7555084228515625, 0.7823410034179688, 0.809173583984375, 0.8360061645507812, 0.8628387451171875, 0.8896713256835938, 0.91650390625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 11.0, 7.0, 10.0, 18.0, 25.0, 51.0, 83.0, 152.0, 440.0, 2545.0, 80467.0, 4067324.0, 40517.0, 1906.0, 391.0, 167.0, 73.0, 37.0, 20.0, 14.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.974609375, -2.857635498046875, -2.74066162109375, -2.623687744140625, -2.5067138671875, -2.389739990234375, -2.27276611328125, -2.155792236328125, -2.038818359375, -1.921844482421875, -1.80487060546875, -1.687896728515625, -1.5709228515625, -1.453948974609375, -1.33697509765625, -1.220001220703125, -1.10302734375, -0.986053466796875, -0.86907958984375, -0.752105712890625, -0.6351318359375, -0.518157958984375, -0.40118408203125, -0.284210205078125, -0.167236328125, -0.050262451171875, 0.06671142578125, 0.183685302734375, 0.3006591796875, 0.417633056640625, 0.53460693359375, 0.651580810546875, 0.7685546875, 0.885528564453125, 1.00250244140625, 1.119476318359375, 1.2364501953125, 1.353424072265625, 1.47039794921875, 1.587371826171875, 1.704345703125, 1.821319580078125, 1.93829345703125, 2.055267333984375, 2.1722412109375, 2.289215087890625, 2.40618896484375, 2.523162841796875, 2.64013671875, 2.757110595703125, 2.87408447265625, 2.991058349609375, 3.1080322265625, 3.225006103515625, 3.34197998046875, 3.458953857421875, 3.575927734375, 3.692901611328125, 3.80987548828125, 3.926849365234375, 4.0438232421875, 4.160797119140625, 4.27777099609375, 4.394744873046875, 4.51171875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 9.0, 10.0, 13.0, 25.0, 43.0, 45.0, 86.0, 118.0, 195.0, 308.0, 450.0, 724.0, 701.0, 509.0, 289.0, 168.0, 109.0, 81.0, 52.0, 34.0, 30.0, 19.0, 14.0, 9.0, 4.0, 8.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.47900390625, -0.4675941467285156, -0.45618438720703125, -0.4447746276855469, -0.4333648681640625, -0.4219551086425781, -0.41054534912109375, -0.3991355895996094, -0.387725830078125, -0.3763160705566406, -0.36490631103515625, -0.3534965515136719, -0.3420867919921875, -0.3306770324707031, -0.31926727294921875, -0.3078575134277344, -0.29644775390625, -0.2850379943847656, -0.27362823486328125, -0.2622184753417969, -0.2508087158203125, -0.23939895629882812, -0.22798919677734375, -0.21657943725585938, -0.205169677734375, -0.19375991821289062, -0.18235015869140625, -0.17094039916992188, -0.1595306396484375, -0.14812088012695312, -0.13671112060546875, -0.12530136108398438, -0.1138916015625, -0.10248184204101562, -0.09107208251953125, -0.07966232299804688, -0.0682525634765625, -0.056842803955078125, -0.04543304443359375, -0.034023284912109375, -0.022613525390625, -0.011203765869140625, 0.00020599365234375, 0.011615753173828125, 0.0230255126953125, 0.034435272216796875, 0.04584503173828125, 0.057254791259765625, 0.06866455078125, 0.08007431030273438, 0.09148406982421875, 0.10289382934570312, 0.1143035888671875, 0.12571334838867188, 0.13712310791015625, 0.14853286743164062, 0.159942626953125, 0.17135238647460938, 0.18276214599609375, 0.19417190551757812, 0.2055816650390625, 0.21699142456054688, 0.22840118408203125, 0.23981094360351562, 0.251220703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 15.0, 14.0, 16.0, 36.0, 34.0, 56.0, 94.0, 102.0, 123.0, 127.0, 86.0, 76.0, 53.0, 54.0, 37.0, 14.0, 16.0, 10.0, 9.0, 5.0, 2.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.471360206604004, -1.4225925207138062, -1.3738248348236084, -1.3250571489334106, -1.276289463043213, -1.2275218963623047, -1.178754210472107, -1.1299865245819092, -1.0812188386917114, -1.0324511528015137, -0.9836834669113159, -0.9349158406257629, -0.8861481547355652, -0.8373804688453674, -0.7886128425598145, -0.7398451566696167, -0.691077470779419, -0.6423097848892212, -0.5935420989990234, -0.5447744727134705, -0.4960067868232727, -0.44723910093307495, -0.3984714448451996, -0.3497037887573242, -0.30093610286712646, -0.2521684169769287, -0.20340076088905334, -0.15463308990001678, -0.10586541891098022, -0.057097747921943665, -0.008330076932907104, 0.04043757915496826, 0.08920514583587646, 0.13797281682491302, 0.18674048781394958, 0.23550815880298615, 0.2842758297920227, 0.33304351568222046, 0.3818111717700958, 0.4305788278579712, 0.47934651374816895, 0.5281141996383667, 0.5768818855285645, 0.6256495118141174, 0.6744171977043152, 0.7231848835945129, 0.7719525098800659, 0.8207201957702637, 0.8694878816604614, 0.9182555675506592, 0.9670232534408569, 1.0157909393310547, 1.064558506011963, 1.1133261919021606, 1.1620938777923584, 1.2108615636825562, 1.259629249572754, 1.3083969354629517, 1.3571646213531494, 1.4059323072433472, 1.454699993133545, 1.5034675598144531, 1.5522352457046509, 1.6010029315948486, 1.6497706174850464]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 13.0, 11.0, 16.0, 9.0, 11.0, 14.0, 19.0, 18.0, 21.0, 31.0, 31.0, 28.0, 41.0, 32.0, 41.0, 36.0, 46.0, 48.0, 56.0, 45.0, 32.0, 50.0, 42.0, 29.0, 35.0, 25.0, 34.0, 26.0, 28.0, 19.0, 13.0, 22.0, 12.0, 18.0, 5.0, 10.0, 8.0, 4.0, 4.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7723848819732666, -0.7480835318565369, -0.7237821221351624, -0.6994807720184326, -0.6751793622970581, -0.6508780121803284, -0.6265766620635986, -0.6022752523422241, -0.5779738426208496, -0.5536724925041199, -0.5293710827827454, -0.5050697326660156, -0.4807683229446411, -0.4564669728279114, -0.43216559290885925, -0.40786421298980713, -0.3835628628730774, -0.35926148295402527, -0.33496010303497314, -0.3106587529182434, -0.2863573431968689, -0.26205599308013916, -0.23775461316108704, -0.2134532332420349, -0.1891518533229828, -0.16485047340393066, -0.14054909348487854, -0.11624772846698761, -0.09194634854793549, -0.06764496862888336, -0.04334360361099243, -0.019042223691940308, 0.005259156227111816, 0.029560532420873642, 0.05386190861463547, 0.078163281083107, 0.10246466100215912, 0.12676604092121124, 0.15106740593910217, 0.1753687858581543, 0.19967016577720642, 0.22397154569625854, 0.24827292561531067, 0.2725743055343628, 0.29687565565109253, 0.32117706537246704, 0.3454784154891968, 0.3697797954082489, 0.394081175327301, 0.41838255524635315, 0.4426839351654053, 0.466985285282135, 0.4912866950035095, 0.5155880451202393, 0.5398894548416138, 0.5641908049583435, 0.5884921550750732, 0.612793505191803, 0.6370949149131775, 0.6613962650299072, 0.6856976747512817, 0.7099990248680115, 0.7343003749847412, 0.7586017847061157, 0.7829031944274902]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 0.0, 2.0, 5.0, 7.0, 7.0, 12.0, 18.0, 25.0, 39.0, 62.0, 106.0, 171.0, 348.0, 611.0, 1144.0, 2520.0, 6091.0, 17147.0, 62596.0, 337949.0, 491444.0, 91392.0, 23104.0, 7618.0, 3127.0, 1429.0, 676.0, 360.0, 198.0, 118.0, 68.0, 53.0, 23.0, 14.0, 22.0, 8.0, 6.0, 11.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.409423828125, -0.3966789245605469, -0.38393402099609375, -0.3711891174316406, -0.3584442138671875, -0.3456993103027344, -0.33295440673828125, -0.3202095031738281, -0.307464599609375, -0.2947196960449219, -0.28197479248046875, -0.2692298889160156, -0.2564849853515625, -0.24374008178710938, -0.23099517822265625, -0.21825027465820312, -0.20550537109375, -0.19276046752929688, -0.18001556396484375, -0.16727066040039062, -0.1545257568359375, -0.14178085327148438, -0.12903594970703125, -0.11629104614257812, -0.103546142578125, -0.09080123901367188, -0.07805633544921875, -0.06531143188476562, -0.0525665283203125, -0.039821624755859375, -0.02707672119140625, -0.014331817626953125, -0.0015869140625, 0.011157989501953125, 0.02390289306640625, 0.036647796630859375, 0.0493927001953125, 0.062137603759765625, 0.07488250732421875, 0.08762741088867188, 0.100372314453125, 0.11311721801757812, 0.12586212158203125, 0.13860702514648438, 0.1513519287109375, 0.16409683227539062, 0.17684173583984375, 0.18958663940429688, 0.20233154296875, 0.21507644653320312, 0.22782135009765625, 0.24056625366210938, 0.2533111572265625, 0.2660560607910156, 0.27880096435546875, 0.2915458679199219, 0.304290771484375, 0.3170356750488281, 0.32978057861328125, 0.3425254821777344, 0.3552703857421875, 0.3680152893066406, 0.38076019287109375, 0.3935050964355469, 0.40625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 8.0, 5.0, 4.0, 11.0, 12.0, 12.0, 13.0, 17.0, 10.0, 30.0, 33.0, 36.0, 37.0, 34.0, 47.0, 54.0, 46.0, 48.0, 61.0, 57.0, 49.0, 48.0, 49.0, 39.0, 32.0, 38.0, 32.0, 24.0, 29.0, 15.0, 13.0, 17.0, 4.0, 8.0, 10.0, 3.0, 5.0, 1.0, 5.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5771484375, -0.5595016479492188, -0.5418548583984375, -0.5242080688476562, -0.506561279296875, -0.48891448974609375, -0.4712677001953125, -0.45362091064453125, -0.43597412109375, -0.41832733154296875, -0.4006805419921875, -0.38303375244140625, -0.365386962890625, -0.34774017333984375, -0.3300933837890625, -0.31244659423828125, -0.2947998046875, -0.27715301513671875, -0.2595062255859375, -0.24185943603515625, -0.224212646484375, -0.20656585693359375, -0.1889190673828125, -0.17127227783203125, -0.15362548828125, -0.13597869873046875, -0.1183319091796875, -0.10068511962890625, -0.083038330078125, -0.06539154052734375, -0.0477447509765625, -0.03009796142578125, -0.012451171875, 0.00519561767578125, 0.0228424072265625, 0.04048919677734375, 0.058135986328125, 0.07578277587890625, 0.0934295654296875, 0.11107635498046875, 0.12872314453125, 0.14636993408203125, 0.1640167236328125, 0.18166351318359375, 0.199310302734375, 0.21695709228515625, 0.2346038818359375, 0.25225067138671875, 0.2698974609375, 0.28754425048828125, 0.3051910400390625, 0.32283782958984375, 0.340484619140625, 0.35813140869140625, 0.3757781982421875, 0.39342498779296875, 0.41107177734375, 0.42871856689453125, 0.4463653564453125, 0.46401214599609375, 0.481658935546875, 0.49930572509765625, 0.5169525146484375, 0.5345993041992188, 0.55224609375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 11.0, 11.0, 13.0, 19.0, 21.0, 31.0, 46.0, 56.0, 81.0, 124.0, 201.0, 349.0, 610.0, 1128.0, 2467.0, 6235.0, 19723.0, 81275.0, 481129.0, 368508.0, 61136.0, 15479.0, 5331.0, 2123.0, 983.0, 493.0, 328.0, 184.0, 132.0, 98.0, 50.0, 42.0, 31.0, 28.0, 17.0, 15.0, 13.0, 7.0, 2.0, 8.0, 5.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30615234375, -0.2965583801269531, -0.28696441650390625, -0.2773704528808594, -0.2677764892578125, -0.2581825256347656, -0.24858856201171875, -0.23899459838867188, -0.229400634765625, -0.21980667114257812, -0.21021270751953125, -0.20061874389648438, -0.1910247802734375, -0.18143081665039062, -0.17183685302734375, -0.16224288940429688, -0.15264892578125, -0.14305496215820312, -0.13346099853515625, -0.12386703491210938, -0.1142730712890625, -0.10467910766601562, -0.09508514404296875, -0.08549118041992188, -0.075897216796875, -0.06630325317382812, -0.05670928955078125, -0.047115325927734375, -0.0375213623046875, -0.027927398681640625, -0.01833343505859375, -0.008739471435546875, 0.0008544921875, 0.010448455810546875, 0.02004241943359375, 0.029636383056640625, 0.0392303466796875, 0.048824310302734375, 0.05841827392578125, 0.06801223754882812, 0.077606201171875, 0.08720016479492188, 0.09679412841796875, 0.10638809204101562, 0.1159820556640625, 0.12557601928710938, 0.13516998291015625, 0.14476394653320312, 0.15435791015625, 0.16395187377929688, 0.17354583740234375, 0.18313980102539062, 0.1927337646484375, 0.20232772827148438, 0.21192169189453125, 0.22151565551757812, 0.231109619140625, 0.24070358276367188, 0.25029754638671875, 0.2598915100097656, 0.2694854736328125, 0.2790794372558594, 0.28867340087890625, 0.2982673645019531, 0.307861328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 5.0, 11.0, 8.0, 7.0, 14.0, 11.0, 25.0, 24.0, 23.0, 19.0, 22.0, 32.0, 34.0, 33.0, 40.0, 50.0, 49.0, 37.0, 51.0, 44.0, 37.0, 60.0, 44.0, 45.0, 34.0, 22.0, 34.0, 26.0, 22.0, 25.0, 23.0, 16.0, 15.0, 8.0, 11.0, 9.0, 8.0, 6.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8752670288085938, -0.8457489013671875, -0.8162307739257812, -0.786712646484375, -0.7571945190429688, -0.7276763916015625, -0.6981582641601562, -0.66864013671875, -0.6391220092773438, -0.6096038818359375, -0.5800857543945312, -0.550567626953125, -0.5210494995117188, -0.4915313720703125, -0.46201324462890625, -0.4324951171875, -0.40297698974609375, -0.3734588623046875, -0.34394073486328125, -0.314422607421875, -0.28490447998046875, -0.2553863525390625, -0.22586822509765625, -0.19635009765625, -0.16683197021484375, -0.1373138427734375, -0.10779571533203125, -0.078277587890625, -0.04875946044921875, -0.0192413330078125, 0.01027679443359375, 0.039794921875, 0.06931304931640625, 0.0988311767578125, 0.12834930419921875, 0.157867431640625, 0.18738555908203125, 0.2169036865234375, 0.24642181396484375, 0.27593994140625, 0.30545806884765625, 0.3349761962890625, 0.36449432373046875, 0.394012451171875, 0.42353057861328125, 0.4530487060546875, 0.48256683349609375, 0.5120849609375, 0.5416030883789062, 0.5711212158203125, 0.6006393432617188, 0.630157470703125, 0.6596755981445312, 0.6891937255859375, 0.7187118530273438, 0.74822998046875, 0.7777481079101562, 0.8072662353515625, 0.8367843627929688, 0.866302490234375, 0.8958206176757812, 0.9253387451171875, 0.9548568725585938, 0.984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 6.0, 3.0, 10.0, 6.0, 11.0, 11.0, 20.0, 30.0, 47.0, 82.0, 115.0, 177.0, 289.0, 539.0, 1017.0, 2013.0, 4433.0, 12018.0, 51343.0, 493790.0, 418083.0, 44861.0, 11165.0, 4180.0, 2024.0, 969.0, 479.0, 302.0, 181.0, 108.0, 67.0, 48.0, 32.0, 32.0, 21.0, 13.0, 11.0, 4.0, 4.0, 3.0, 9.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.1603565216064453, -0.15481948852539062, -0.14928245544433594, -0.14374542236328125, -0.13820838928222656, -0.13267135620117188, -0.1271343231201172, -0.1215972900390625, -0.11606025695800781, -0.11052322387695312, -0.10498619079589844, -0.09944915771484375, -0.09391212463378906, -0.08837509155273438, -0.08283805847167969, -0.077301025390625, -0.07176399230957031, -0.06622695922851562, -0.06068992614746094, -0.05515289306640625, -0.04961585998535156, -0.044078826904296875, -0.03854179382324219, -0.0330047607421875, -0.027467727661132812, -0.021930694580078125, -0.016393661499023438, -0.01085662841796875, -0.0053195953369140625, 0.000217437744140625, 0.0057544708251953125, 0.01129150390625, 0.016828536987304688, 0.022365570068359375, 0.027902603149414062, 0.03343963623046875, 0.03897666931152344, 0.044513702392578125, 0.05005073547363281, 0.0555877685546875, 0.06112480163574219, 0.06666183471679688, 0.07219886779785156, 0.07773590087890625, 0.08327293395996094, 0.08880996704101562, 0.09434700012207031, 0.099884033203125, 0.10542106628417969, 0.11095809936523438, 0.11649513244628906, 0.12203216552734375, 0.12756919860839844, 0.13310623168945312, 0.1386432647705078, 0.1441802978515625, 0.1497173309326172, 0.15525436401367188, 0.16079139709472656, 0.16632843017578125, 0.17186546325683594, 0.17740249633789062, 0.1829395294189453, 0.1884765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 9.0, 6.0, 9.0, 10.0, 14.0, 23.0, 57.0, 102.0, 155.0, 184.0, 172.0, 109.0, 64.0, 29.0, 25.0, 10.0, 8.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013756752014160156, -0.00013357866555452347, -0.00012958981096744537, -0.00012560095638036728, -0.00012161210179328918, -0.00011762324720621109, -0.000113634392619133, -0.0001096455380320549, -0.0001056566834449768, -0.00010166782885789871, -9.767897427082062e-05, -9.369011968374252e-05, -8.970126509666443e-05, -8.571241050958633e-05, -8.172355592250824e-05, -7.773470133543015e-05, -7.374584674835205e-05, -6.975699216127396e-05, -6.576813757419586e-05, -6.177928298711777e-05, -5.779042840003967e-05, -5.380157381296158e-05, -4.9812719225883484e-05, -4.582386463880539e-05, -4.1835010051727295e-05, -3.78461554646492e-05, -3.3857300877571106e-05, -2.986844629049301e-05, -2.5879591703414917e-05, -2.1890737116336823e-05, -1.7901882529258728e-05, -1.3913027942180634e-05, -9.924173355102539e-06, -5.935318768024445e-06, -1.94646418094635e-06, 2.0423904061317444e-06, 6.031244993209839e-06, 1.0020099580287933e-05, 1.4008954167366028e-05, 1.7997808754444122e-05, 2.1986663341522217e-05, 2.597551792860031e-05, 2.9964372515678406e-05, 3.39532271027565e-05, 3.7942081689834595e-05, 4.193093627691269e-05, 4.5919790863990784e-05, 4.990864545106888e-05, 5.389750003814697e-05, 5.788635462522507e-05, 6.187520921230316e-05, 6.586406379938126e-05, 6.985291838645935e-05, 7.384177297353745e-05, 7.783062756061554e-05, 8.181948214769363e-05, 8.580833673477173e-05, 8.979719132184982e-05, 9.378604590892792e-05, 9.777490049600601e-05, 0.0001017637550830841, 0.0001057526096701622, 0.0001097414642572403, 0.00011373031884431839, 0.00011771917343139648]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 7.0, 5.0, 10.0, 14.0, 21.0, 25.0, 51.0, 90.0, 140.0, 210.0, 388.0, 740.0, 1382.0, 2692.0, 5849.0, 16812.0, 84759.0, 623804.0, 259834.0, 34236.0, 9392.0, 3885.0, 1920.0, 983.0, 546.0, 299.0, 162.0, 91.0, 70.0, 46.0, 28.0, 16.0, 10.0, 9.0, 8.0, 2.0, 8.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1904296875, -0.18402862548828125, -0.1776275634765625, -0.17122650146484375, -0.164825439453125, -0.15842437744140625, -0.1520233154296875, -0.14562225341796875, -0.13922119140625, -0.13282012939453125, -0.1264190673828125, -0.12001800537109375, -0.113616943359375, -0.10721588134765625, -0.1008148193359375, -0.09441375732421875, -0.0880126953125, -0.08161163330078125, -0.0752105712890625, -0.06880950927734375, -0.062408447265625, -0.05600738525390625, -0.0496063232421875, -0.04320526123046875, -0.03680419921875, -0.03040313720703125, -0.0240020751953125, -0.01760101318359375, -0.011199951171875, -0.00479888916015625, 0.0016021728515625, 0.00800323486328125, 0.014404296875, 0.02080535888671875, 0.0272064208984375, 0.03360748291015625, 0.040008544921875, 0.04640960693359375, 0.0528106689453125, 0.05921173095703125, 0.06561279296875, 0.07201385498046875, 0.0784149169921875, 0.08481597900390625, 0.091217041015625, 0.09761810302734375, 0.1040191650390625, 0.11042022705078125, 0.1168212890625, 0.12322235107421875, 0.1296234130859375, 0.13602447509765625, 0.142425537109375, 0.14882659912109375, 0.1552276611328125, 0.16162872314453125, 0.16802978515625, 0.17443084716796875, 0.1808319091796875, 0.18723297119140625, 0.193634033203125, 0.20003509521484375, 0.2064361572265625, 0.21283721923828125, 0.21923828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 1.0, 3.0, 6.0, 2.0, 11.0, 11.0, 20.0, 26.0, 26.0, 43.0, 49.0, 100.0, 88.0, 106.0, 118.0, 106.0, 71.0, 63.0, 40.0, 23.0, 25.0, 12.0, 13.0, 11.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039215087890625, -0.03791379928588867, -0.036612510681152344, -0.035311222076416016, -0.03400993347167969, -0.03270864486694336, -0.03140735626220703, -0.030106067657470703, -0.028804779052734375, -0.027503490447998047, -0.02620220184326172, -0.02490091323852539, -0.023599624633789062, -0.022298336029052734, -0.020997047424316406, -0.019695758819580078, -0.01839447021484375, -0.017093181610107422, -0.015791893005371094, -0.014490604400634766, -0.013189315795898438, -0.01188802719116211, -0.010586738586425781, -0.009285449981689453, -0.007984161376953125, -0.006682872772216797, -0.005381584167480469, -0.004080295562744141, -0.0027790069580078125, -0.0014777183532714844, -0.00017642974853515625, 0.0011248588562011719, 0.0024261474609375, 0.003727436065673828, 0.005028724670410156, 0.006330013275146484, 0.0076313018798828125, 0.00893259048461914, 0.010233879089355469, 0.011535167694091797, 0.012836456298828125, 0.014137744903564453, 0.015439033508300781, 0.01674032211303711, 0.018041610717773438, 0.019342899322509766, 0.020644187927246094, 0.021945476531982422, 0.02324676513671875, 0.024548053741455078, 0.025849342346191406, 0.027150630950927734, 0.028451919555664062, 0.02975320816040039, 0.03105449676513672, 0.03235578536987305, 0.033657073974609375, 0.0349583625793457, 0.03625965118408203, 0.03756093978881836, 0.03886222839355469, 0.040163516998291016, 0.041464805603027344, 0.04276609420776367, 0.0440673828125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 8.0, 12.0, 13.0, 20.0, 33.0, 51.0, 76.0, 126.0, 140.0, 117.0, 129.0, 74.0, 52.0, 49.0, 26.0, 19.0, 11.0, 11.0, 4.0, 5.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7656697034835815, -0.7325798273086548, -0.6994898915290833, -0.6663999557495117, -0.633310079574585, -0.6002202033996582, -0.5671302676200867, -0.5340403318405151, -0.5009504556655884, -0.46786054968833923, -0.4347706437110901, -0.40168073773384094, -0.3685908317565918, -0.33550092577934265, -0.3024110198020935, -0.26932111382484436, -0.23623120784759521, -0.20314130187034607, -0.17005139589309692, -0.13696148991584778, -0.10387158393859863, -0.07078167796134949, -0.03769177198410034, -0.004601866006851196, 0.02848803997039795, 0.061577945947647095, 0.09466785192489624, 0.12775775790214539, 0.16084766387939453, 0.19393756985664368, 0.22702747583389282, 0.26011738181114197, 0.29320740699768066, 0.3262973129749298, 0.35938721895217896, 0.3924771249294281, 0.42556703090667725, 0.4586569368839264, 0.49174684286117554, 0.5248367786407471, 0.5579266548156738, 0.5910165309906006, 0.6241064667701721, 0.6571964025497437, 0.6902862787246704, 0.7233761548995972, 0.7564660906791687, 0.7895560264587402, 0.822645902633667, 0.8557357788085938, 0.8888257145881653, 0.9219156503677368, 0.9550055265426636, 0.9880954027175903, 1.0211853981018066, 1.0542752742767334, 1.0873651504516602, 1.120455026626587, 1.1535449028015137, 1.18663489818573, 1.2197247743606567, 1.2528146505355835, 1.2859046459197998, 1.3189945220947266, 1.3520843982696533]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 2.0, 4.0, 8.0, 9.0, 15.0, 11.0, 14.0, 10.0, 26.0, 20.0, 24.0, 36.0, 36.0, 30.0, 43.0, 46.0, 46.0, 54.0, 57.0, 62.0, 53.0, 42.0, 47.0, 42.0, 33.0, 35.0, 27.0, 28.0, 29.0, 24.0, 20.0, 9.0, 15.0, 5.0, 11.0, 10.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.522476315498352, -0.505682110786438, -0.4888879060745239, -0.47209370136260986, -0.4552994966506958, -0.43850529193878174, -0.4217110872268677, -0.4049168825149536, -0.38812267780303955, -0.3713284730911255, -0.3545342683792114, -0.33774006366729736, -0.3209458589553833, -0.30415165424346924, -0.2873574495315552, -0.2705632448196411, -0.25376904010772705, -0.236974835395813, -0.22018063068389893, -0.20338642597198486, -0.1865922212600708, -0.16979801654815674, -0.15300381183624268, -0.1362096071243286, -0.11941540241241455, -0.10262119770050049, -0.08582699298858643, -0.06903278827667236, -0.0522385835647583, -0.03544437885284424, -0.018650174140930176, -0.0018559694290161133, 0.014938294887542725, 0.03173249959945679, 0.04852670431137085, 0.06532090902328491, 0.08211511373519897, 0.09890931844711304, 0.1157035231590271, 0.13249772787094116, 0.14929193258285522, 0.1660861372947693, 0.18288034200668335, 0.1996745467185974, 0.21646875143051147, 0.23326295614242554, 0.2500571608543396, 0.26685136556625366, 0.2836455702781677, 0.3004397749900818, 0.31723397970199585, 0.3340281844139099, 0.350822389125824, 0.36761659383773804, 0.3844107985496521, 0.40120500326156616, 0.4179992079734802, 0.4347934126853943, 0.45158761739730835, 0.4683818221092224, 0.4851760268211365, 0.5019702315330505, 0.5187644362449646, 0.5355586409568787, 0.5523528456687927]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 3.0, 9.0, 8.0, 11.0, 15.0, 30.0, 65.0, 87.0, 153.0, 276.0, 542.0, 1204.0, 2645.0, 6754.0, 19287.0, 66077.0, 275567.0, 500612.0, 124247.0, 32993.0, 10623.0, 4104.0, 1639.0, 800.0, 354.0, 172.0, 123.0, 57.0, 29.0, 21.0, 10.0, 12.0, 10.0, 3.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.880859375, -0.8526535034179688, -0.8244476318359375, -0.7962417602539062, -0.768035888671875, -0.7398300170898438, -0.7116241455078125, -0.6834182739257812, -0.65521240234375, -0.6270065307617188, -0.5988006591796875, -0.5705947875976562, -0.542388916015625, -0.5141830444335938, -0.4859771728515625, -0.45777130126953125, -0.4295654296875, -0.40135955810546875, -0.3731536865234375, -0.34494781494140625, -0.316741943359375, -0.28853607177734375, -0.2603302001953125, -0.23212432861328125, -0.20391845703125, -0.17571258544921875, -0.1475067138671875, -0.11930084228515625, -0.091094970703125, -0.06288909912109375, -0.0346832275390625, -0.00647735595703125, 0.021728515625, 0.04993438720703125, 0.0781402587890625, 0.10634613037109375, 0.134552001953125, 0.16275787353515625, 0.1909637451171875, 0.21916961669921875, 0.24737548828125, 0.27558135986328125, 0.3037872314453125, 0.33199310302734375, 0.360198974609375, 0.38840484619140625, 0.4166107177734375, 0.44481658935546875, 0.4730224609375, 0.5012283325195312, 0.5294342041015625, 0.5576400756835938, 0.585845947265625, 0.6140518188476562, 0.6422576904296875, 0.6704635620117188, 0.69866943359375, 0.7268753051757812, 0.7550811767578125, 0.7832870483398438, 0.811492919921875, 0.8396987915039062, 0.8679046630859375, 0.8961105346679688, 0.92431640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 0.0, 3.0, 1.0, 2.0, 6.0, 2.0, 5.0, 5.0, 4.0, 17.0, 10.0, 15.0, 21.0, 19.0, 23.0, 27.0, 28.0, 40.0, 59.0, 36.0, 57.0, 63.0, 40.0, 51.0, 59.0, 50.0, 42.0, 54.0, 43.0, 37.0, 28.0, 29.0, 25.0, 23.0, 17.0, 21.0, 6.0, 10.0, 11.0, 4.0, 2.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98193359375, -0.9447708129882812, -0.9076080322265625, -0.8704452514648438, -0.833282470703125, -0.7961196899414062, -0.7589569091796875, -0.7217941284179688, -0.68463134765625, -0.6474685668945312, -0.6103057861328125, -0.5731430053710938, -0.535980224609375, -0.49881744384765625, -0.4616546630859375, -0.42449188232421875, -0.3873291015625, -0.35016632080078125, -0.3130035400390625, -0.27584075927734375, -0.238677978515625, -0.20151519775390625, -0.1643524169921875, -0.12718963623046875, -0.09002685546875, -0.05286407470703125, -0.0157012939453125, 0.02146148681640625, 0.058624267578125, 0.09578704833984375, 0.1329498291015625, 0.17011260986328125, 0.207275390625, 0.24443817138671875, 0.2816009521484375, 0.31876373291015625, 0.355926513671875, 0.39308929443359375, 0.4302520751953125, 0.46741485595703125, 0.50457763671875, 0.5417404174804688, 0.5789031982421875, 0.6160659790039062, 0.653228759765625, 0.6903915405273438, 0.7275543212890625, 0.7647171020507812, 0.8018798828125, 0.8390426635742188, 0.8762054443359375, 0.9133682250976562, 0.950531005859375, 0.9876937866210938, 1.0248565673828125, 1.0620193481445312, 1.09918212890625, 1.1363449096679688, 1.1735076904296875, 1.2106704711914062, 1.247833251953125, 1.2849960327148438, 1.3221588134765625, 1.3593215942382812, 1.396484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 10.0, 6.0, 7.0, 10.0, 12.0, 13.0, 11.0, 23.0, 25.0, 24.0, 25.0, 29.0, 32.0, 40.0, 43.0, 50.0, 69.0, 173.0, 818.0, 27545.0, 983552.0, 34496.0, 959.0, 173.0, 74.0, 61.0, 34.0, 33.0, 30.0, 18.0, 14.0, 29.0, 16.0, 17.0, 9.0, 17.0, 9.0, 8.0, 8.0, 4.0, 3.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.888671875, -2.783721923828125, -2.67877197265625, -2.573822021484375, -2.4688720703125, -2.363922119140625, -2.25897216796875, -2.154022216796875, -2.049072265625, -1.944122314453125, -1.83917236328125, -1.734222412109375, -1.6292724609375, -1.524322509765625, -1.41937255859375, -1.314422607421875, -1.20947265625, -1.104522705078125, -0.99957275390625, -0.894622802734375, -0.7896728515625, -0.684722900390625, -0.57977294921875, -0.474822998046875, -0.369873046875, -0.264923095703125, -0.15997314453125, -0.055023193359375, 0.0499267578125, 0.154876708984375, 0.25982666015625, 0.364776611328125, 0.4697265625, 0.574676513671875, 0.67962646484375, 0.784576416015625, 0.8895263671875, 0.994476318359375, 1.09942626953125, 1.204376220703125, 1.309326171875, 1.414276123046875, 1.51922607421875, 1.624176025390625, 1.7291259765625, 1.834075927734375, 1.93902587890625, 2.043975830078125, 2.14892578125, 2.253875732421875, 2.35882568359375, 2.463775634765625, 2.5687255859375, 2.673675537109375, 2.77862548828125, 2.883575439453125, 2.988525390625, 3.093475341796875, 3.19842529296875, 3.303375244140625, 3.4083251953125, 3.513275146484375, 3.61822509765625, 3.723175048828125, 3.828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 8.0, 9.0, 7.0, 13.0, 7.0, 17.0, 16.0, 21.0, 27.0, 28.0, 21.0, 37.0, 35.0, 37.0, 27.0, 37.0, 47.0, 35.0, 42.0, 46.0, 45.0, 49.0, 51.0, 44.0, 39.0, 34.0, 31.0, 30.0, 13.0, 20.0, 24.0, 17.0, 9.0, 12.0, 11.0, 9.0, 8.0, 13.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.09375, -1.0581817626953125, -1.022613525390625, -0.9870452880859375, -0.95147705078125, -0.9159088134765625, -0.880340576171875, -0.8447723388671875, -0.8092041015625, -0.7736358642578125, -0.738067626953125, -0.7024993896484375, -0.66693115234375, -0.6313629150390625, -0.595794677734375, -0.5602264404296875, -0.524658203125, -0.4890899658203125, -0.453521728515625, -0.4179534912109375, -0.38238525390625, -0.3468170166015625, -0.311248779296875, -0.2756805419921875, -0.2401123046875, -0.2045440673828125, -0.168975830078125, -0.1334075927734375, -0.09783935546875, -0.0622711181640625, -0.026702880859375, 0.0088653564453125, 0.04443359375, 0.0800018310546875, 0.115570068359375, 0.1511383056640625, 0.18670654296875, 0.2222747802734375, 0.257843017578125, 0.2934112548828125, 0.3289794921875, 0.3645477294921875, 0.400115966796875, 0.4356842041015625, 0.47125244140625, 0.5068206787109375, 0.542388916015625, 0.5779571533203125, 0.613525390625, 0.6490936279296875, 0.684661865234375, 0.7202301025390625, 0.75579833984375, 0.7913665771484375, 0.826934814453125, 0.8625030517578125, 0.8980712890625, 0.9336395263671875, 0.969207763671875, 1.0047760009765625, 1.04034423828125, 1.0759124755859375, 1.111480712890625, 1.1470489501953125, 1.1826171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 3.0, 9.0, 14.0, 11.0, 19.0, 24.0, 54.0, 70.0, 155.0, 317.0, 646.0, 1877.0, 6500.0, 31862.0, 221562.0, 641679.0, 118304.0, 18709.0, 4267.0, 1394.0, 537.0, 234.0, 110.0, 80.0, 45.0, 28.0, 11.0, 10.0, 8.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.274658203125, -0.2649688720703125, -0.255279541015625, -0.2455902099609375, -0.23590087890625, -0.2262115478515625, -0.216522216796875, -0.2068328857421875, -0.1971435546875, -0.1874542236328125, -0.177764892578125, -0.1680755615234375, -0.15838623046875, -0.1486968994140625, -0.139007568359375, -0.1293182373046875, -0.11962890625, -0.1099395751953125, -0.100250244140625, -0.0905609130859375, -0.08087158203125, -0.0711822509765625, -0.061492919921875, -0.0518035888671875, -0.0421142578125, -0.0324249267578125, -0.022735595703125, -0.0130462646484375, -0.00335693359375, 0.0063323974609375, 0.016021728515625, 0.0257110595703125, 0.035400390625, 0.0450897216796875, 0.054779052734375, 0.0644683837890625, 0.07415771484375, 0.0838470458984375, 0.093536376953125, 0.1032257080078125, 0.1129150390625, 0.1226043701171875, 0.132293701171875, 0.1419830322265625, 0.15167236328125, 0.1613616943359375, 0.171051025390625, 0.1807403564453125, 0.1904296875, 0.2001190185546875, 0.209808349609375, 0.2194976806640625, 0.22918701171875, 0.2388763427734375, 0.248565673828125, 0.2582550048828125, 0.2679443359375, 0.2776336669921875, 0.287322998046875, 0.2970123291015625, 0.30670166015625, 0.3163909912109375, 0.326080322265625, 0.3357696533203125, 0.345458984375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 2.0, 8.0, 8.0, 11.0, 12.0, 10.0, 27.0, 27.0, 28.0, 29.0, 31.0, 51.0, 69.0, 86.0, 93.0, 81.0, 85.0, 68.0, 48.0, 48.0, 31.0, 30.0, 23.0, 24.0, 12.0, 12.0, 9.0, 6.0, 7.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.403425216674805e-05, -3.294367343187332e-05, -3.1853094696998596e-05, -3.076251596212387e-05, -2.9671937227249146e-05, -2.858135849237442e-05, -2.7490779757499695e-05, -2.640020102262497e-05, -2.5309622287750244e-05, -2.421904355287552e-05, -2.3128464818000793e-05, -2.2037886083126068e-05, -2.0947307348251343e-05, -1.9856728613376617e-05, -1.8766149878501892e-05, -1.7675571143627167e-05, -1.658499240875244e-05, -1.5494413673877716e-05, -1.440383493900299e-05, -1.3313256204128265e-05, -1.222267746925354e-05, -1.1132098734378815e-05, -1.004151999950409e-05, -8.950941264629364e-06, -7.860362529754639e-06, -6.769783794879913e-06, -5.679205060005188e-06, -4.588626325130463e-06, -3.4980475902557373e-06, -2.407468855381012e-06, -1.3168901205062866e-06, -2.2631138563156128e-07, 8.642673492431641e-07, 1.9548460841178894e-06, 3.0454248189926147e-06, 4.13600355386734e-06, 5.2265822887420654e-06, 6.317161023616791e-06, 7.407739758491516e-06, 8.498318493366241e-06, 9.588897228240967e-06, 1.0679475963115692e-05, 1.1770054697990417e-05, 1.2860633432865143e-05, 1.3951212167739868e-05, 1.5041790902614594e-05, 1.613236963748932e-05, 1.7222948372364044e-05, 1.831352710723877e-05, 1.9404105842113495e-05, 2.049468457698822e-05, 2.1585263311862946e-05, 2.267584204673767e-05, 2.3766420781612396e-05, 2.485699951648712e-05, 2.5947578251361847e-05, 2.7038156986236572e-05, 2.8128735721111298e-05, 2.9219314455986023e-05, 3.0309893190860748e-05, 3.1400471925735474e-05, 3.24910506606102e-05, 3.3581629395484924e-05, 3.467220813035965e-05, 3.5762786865234375e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 3.0, 6.0, 3.0, 11.0, 6.0, 22.0, 32.0, 67.0, 67.0, 117.0, 290.0, 644.0, 1638.0, 4725.0, 17692.0, 82925.0, 430290.0, 408052.0, 77688.0, 16896.0, 4559.0, 1569.0, 631.0, 283.0, 133.0, 81.0, 39.0, 31.0, 15.0, 13.0, 7.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2001953125, -0.1924896240234375, -0.184783935546875, -0.1770782470703125, -0.16937255859375, -0.1616668701171875, -0.153961181640625, -0.1462554931640625, -0.1385498046875, -0.1308441162109375, -0.123138427734375, -0.1154327392578125, -0.10772705078125, -0.1000213623046875, -0.092315673828125, -0.0846099853515625, -0.076904296875, -0.0691986083984375, -0.061492919921875, -0.0537872314453125, -0.04608154296875, -0.0383758544921875, -0.030670166015625, -0.0229644775390625, -0.0152587890625, -0.0075531005859375, 0.000152587890625, 0.0078582763671875, 0.01556396484375, 0.0232696533203125, 0.030975341796875, 0.0386810302734375, 0.04638671875, 0.0540924072265625, 0.061798095703125, 0.0695037841796875, 0.07720947265625, 0.0849151611328125, 0.092620849609375, 0.1003265380859375, 0.1080322265625, 0.1157379150390625, 0.123443603515625, 0.1311492919921875, 0.13885498046875, 0.1465606689453125, 0.154266357421875, 0.1619720458984375, 0.169677734375, 0.1773834228515625, 0.185089111328125, 0.1927947998046875, 0.20050048828125, 0.2082061767578125, 0.215911865234375, 0.2236175537109375, 0.2313232421875, 0.2390289306640625, 0.246734619140625, 0.2544403076171875, 0.26214599609375, 0.2698516845703125, 0.277557373046875, 0.2852630615234375, 0.29296875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 8.0, 9.0, 8.0, 7.0, 11.0, 14.0, 15.0, 29.0, 27.0, 36.0, 51.0, 47.0, 72.0, 76.0, 84.0, 80.0, 68.0, 69.0, 63.0, 44.0, 31.0, 31.0, 22.0, 27.0, 19.0, 13.0, 4.0, 6.0, 7.0, 5.0, 7.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11175537109375, -0.10865020751953125, -0.1055450439453125, -0.10243988037109375, -0.099334716796875, -0.09622955322265625, -0.0931243896484375, -0.09001922607421875, -0.0869140625, -0.08380889892578125, -0.0807037353515625, -0.07759857177734375, -0.074493408203125, -0.07138824462890625, -0.0682830810546875, -0.06517791748046875, -0.06207275390625, -0.05896759033203125, -0.0558624267578125, -0.05275726318359375, -0.049652099609375, -0.04654693603515625, -0.0434417724609375, -0.04033660888671875, -0.0372314453125, -0.03412628173828125, -0.0310211181640625, -0.02791595458984375, -0.024810791015625, -0.02170562744140625, -0.0186004638671875, -0.01549530029296875, -0.01239013671875, -0.00928497314453125, -0.0061798095703125, -0.00307464599609375, 3.0517578125e-05, 0.00313568115234375, 0.0062408447265625, 0.00934600830078125, 0.012451171875, 0.01555633544921875, 0.0186614990234375, 0.02176666259765625, 0.024871826171875, 0.02797698974609375, 0.0310821533203125, 0.03418731689453125, 0.03729248046875, 0.04039764404296875, 0.0435028076171875, 0.04660797119140625, 0.049713134765625, 0.05281829833984375, 0.0559234619140625, 0.05902862548828125, 0.0621337890625, 0.06523895263671875, 0.0683441162109375, 0.07144927978515625, 0.074554443359375, 0.07765960693359375, 0.0807647705078125, 0.08386993408203125, 0.08697509765625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 14.0, 76.0, 301.0, 426.0, 144.0, 25.0, 9.0, 5.0, 2.0, 0.0, 0.0, 3.0], "bins": [-14.14339542388916, -13.887163162231445, -13.630931854248047, -13.374699592590332, -13.118467330932617, -12.862236022949219, -12.606003761291504, -12.349771499633789, -12.09354019165039, -11.837307929992676, -11.581076622009277, -11.324844360351562, -11.068612098693848, -10.812379837036133, -10.556148529052734, -10.29991626739502, -10.043684005737305, -9.78745174407959, -9.531220436096191, -9.274988174438477, -9.018755912780762, -8.762523651123047, -8.506292343139648, -8.250060081481934, -7.993828296661377, -7.73759651184082, -7.4813642501831055, -7.225132465362549, -6.968900680541992, -6.712668418884277, -6.456436634063721, -6.200204849243164, -5.943972587585449, -5.687740802764893, -5.431508541107178, -5.175276756286621, -4.919044494628906, -4.66281270980835, -4.406580924987793, -4.150348663330078, -3.8941168785095215, -3.6378848552703857, -3.38165283203125, -3.1254210472106934, -2.8691890239715576, -2.612957000732422, -2.3567252159118652, -2.1004931926727295, -1.8442611694335938, -1.588029146194458, -1.3317972421646118, -1.0755653381347656, -0.8193333148956299, -0.5631012916564941, -0.30686938762664795, -0.05063748359680176, 0.20559453964233398, 0.46182650327682495, 0.7180584669113159, 0.9742904305458069, 1.2305223941802979, 1.4867544174194336, 1.7429863214492798, 1.999218225479126, 2.2554502487182617]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 8.0, 11.0, 8.0, 12.0, 15.0, 16.0, 15.0, 19.0, 26.0, 31.0, 26.0, 28.0, 32.0, 48.0, 60.0, 45.0, 36.0, 49.0, 49.0, 41.0, 38.0, 62.0, 34.0, 43.0, 40.0, 34.0, 30.0, 27.0, 24.0, 18.0, 16.0, 8.0, 13.0, 11.0, 7.0, 8.0, 2.0, 2.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7210110425949097, -1.6546880006790161, -1.588364839553833, -1.5220417976379395, -1.455718755722046, -1.3893955945968628, -1.3230725526809692, -1.2567493915557861, -1.1904263496398926, -1.124103307723999, -1.057780146598816, -0.9914571046829224, -0.925134003162384, -0.8588109016418457, -0.7924878597259521, -0.7261647582054138, -0.6598416566848755, -0.5935185551643372, -0.5271954536437988, -0.4608724117279053, -0.39454931020736694, -0.3282262086868286, -0.26190313696861267, -0.19558006525039673, -0.1292569637298584, -0.06293387711048126, 0.003389209508895874, 0.06971229612827301, 0.13603538274765015, 0.20235848426818848, 0.2686815559864044, 0.33500462770462036, 0.40132784843444824, 0.4676509499549866, 0.5339740514755249, 0.6002970933914185, 0.6666201949119568, 0.7329432964324951, 0.7992663383483887, 0.865589439868927, 0.9319125413894653, 0.9982356429100037, 1.064558744430542, 1.1308817863464355, 1.197204828262329, 1.2635279893875122, 1.3298510313034058, 1.3961741924285889, 1.4624972343444824, 1.528820276260376, 1.595143437385559, 1.6614664793014526, 1.7277896404266357, 1.7941126823425293, 1.8604357242584229, 1.9267587661743164, 1.9930819272994995, 2.0594050884246826, 2.125728130340576, 2.1920511722564697, 2.2583742141723633, 2.324697494506836, 2.3910205364227295, 2.457343578338623, 2.5236666202545166]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 9.0, 3.0, 8.0, 15.0, 18.0, 17.0, 39.0, 42.0, 53.0, 109.0, 211.0, 444.0, 1185.0, 3744.0, 18419.0, 167135.0, 3174223.0, 774200.0, 43674.0, 7273.0, 2010.0, 717.0, 300.0, 156.0, 86.0, 61.0, 34.0, 29.0, 15.0, 13.0, 16.0, 10.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.654296875, -1.603759765625, -1.55322265625, -1.502685546875, -1.4521484375, -1.401611328125, -1.35107421875, -1.300537109375, -1.25, -1.199462890625, -1.14892578125, -1.098388671875, -1.0478515625, -0.997314453125, -0.94677734375, -0.896240234375, -0.845703125, -0.795166015625, -0.74462890625, -0.694091796875, -0.6435546875, -0.593017578125, -0.54248046875, -0.491943359375, -0.44140625, -0.390869140625, -0.34033203125, -0.289794921875, -0.2392578125, -0.188720703125, -0.13818359375, -0.087646484375, -0.037109375, 0.013427734375, 0.06396484375, 0.114501953125, 0.1650390625, 0.215576171875, 0.26611328125, 0.316650390625, 0.3671875, 0.417724609375, 0.46826171875, 0.518798828125, 0.5693359375, 0.619873046875, 0.67041015625, 0.720947265625, 0.771484375, 0.822021484375, 0.87255859375, 0.923095703125, 0.9736328125, 1.024169921875, 1.07470703125, 1.125244140625, 1.17578125, 1.226318359375, 1.27685546875, 1.327392578125, 1.3779296875, 1.428466796875, 1.47900390625, 1.529541015625, 1.580078125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 2.0, 7.0, 8.0, 13.0, 10.0, 12.0, 17.0, 14.0, 13.0, 23.0, 31.0, 29.0, 35.0, 31.0, 37.0, 48.0, 47.0, 62.0, 43.0, 51.0, 58.0, 42.0, 50.0, 38.0, 47.0, 48.0, 32.0, 33.0, 29.0, 14.0, 9.0, 17.0, 12.0, 5.0, 9.0, 6.0, 7.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6435546875, -0.6207122802734375, -0.597869873046875, -0.5750274658203125, -0.55218505859375, -0.5293426513671875, -0.506500244140625, -0.4836578369140625, -0.4608154296875, -0.4379730224609375, -0.415130615234375, -0.3922882080078125, -0.36944580078125, -0.3466033935546875, -0.323760986328125, -0.3009185791015625, -0.278076171875, -0.2552337646484375, -0.232391357421875, -0.2095489501953125, -0.18670654296875, -0.1638641357421875, -0.141021728515625, -0.1181793212890625, -0.0953369140625, -0.0724945068359375, -0.049652099609375, -0.0268096923828125, -0.00396728515625, 0.0188751220703125, 0.041717529296875, 0.0645599365234375, 0.08740234375, 0.1102447509765625, 0.133087158203125, 0.1559295654296875, 0.17877197265625, 0.2016143798828125, 0.224456787109375, 0.2472991943359375, 0.2701416015625, 0.2929840087890625, 0.315826416015625, 0.3386688232421875, 0.36151123046875, 0.3843536376953125, 0.407196044921875, 0.4300384521484375, 0.452880859375, 0.4757232666015625, 0.498565673828125, 0.5214080810546875, 0.54425048828125, 0.5670928955078125, 0.589935302734375, 0.6127777099609375, 0.6356201171875, 0.6584625244140625, 0.681304931640625, 0.7041473388671875, 0.72698974609375, 0.7498321533203125, 0.772674560546875, 0.7955169677734375, 0.818359375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 10.0, 9.0, 14.0, 19.0, 31.0, 51.0, 86.0, 149.0, 278.0, 964.0, 7450.0, 448203.0, 3712580.0, 21714.0, 1780.0, 465.0, 187.0, 94.0, 57.0, 43.0, 24.0, 21.0, 18.0, 5.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94140625, -2.8553466796875, -2.769287109375, -2.6832275390625, -2.59716796875, -2.5111083984375, -2.425048828125, -2.3389892578125, -2.2529296875, -2.1668701171875, -2.080810546875, -1.9947509765625, -1.90869140625, -1.8226318359375, -1.736572265625, -1.6505126953125, -1.564453125, -1.4783935546875, -1.392333984375, -1.3062744140625, -1.22021484375, -1.1341552734375, -1.048095703125, -0.9620361328125, -0.8759765625, -0.7899169921875, -0.703857421875, -0.6177978515625, -0.53173828125, -0.4456787109375, -0.359619140625, -0.2735595703125, -0.1875, -0.1014404296875, -0.015380859375, 0.0706787109375, 0.15673828125, 0.2427978515625, 0.328857421875, 0.4149169921875, 0.5009765625, 0.5870361328125, 0.673095703125, 0.7591552734375, 0.84521484375, 0.9312744140625, 1.017333984375, 1.1033935546875, 1.189453125, 1.2755126953125, 1.361572265625, 1.4476318359375, 1.53369140625, 1.6197509765625, 1.705810546875, 1.7918701171875, 1.8779296875, 1.9639892578125, 2.050048828125, 2.1361083984375, 2.22216796875, 2.3082275390625, 2.394287109375, 2.4803466796875, 2.56640625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 7.0, 8.0, 12.0, 10.0, 23.0, 21.0, 29.0, 40.0, 47.0, 91.0, 104.0, 166.0, 247.0, 403.0, 591.0, 689.0, 530.0, 372.0, 206.0, 145.0, 99.0, 71.0, 52.0, 36.0, 16.0, 14.0, 16.0, 9.0, 12.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.30224609375, -0.2934532165527344, -0.28466033935546875, -0.2758674621582031, -0.2670745849609375, -0.2582817077636719, -0.24948883056640625, -0.24069595336914062, -0.231903076171875, -0.22311019897460938, -0.21431732177734375, -0.20552444458007812, -0.1967315673828125, -0.18793869018554688, -0.17914581298828125, -0.17035293579101562, -0.16156005859375, -0.15276718139648438, -0.14397430419921875, -0.13518142700195312, -0.1263885498046875, -0.11759567260742188, -0.10880279541015625, -0.10000991821289062, -0.091217041015625, -0.08242416381835938, -0.07363128662109375, -0.06483840942382812, -0.0560455322265625, -0.047252655029296875, -0.03845977783203125, -0.029666900634765625, -0.0208740234375, -0.012081146240234375, -0.00328826904296875, 0.005504608154296875, 0.0142974853515625, 0.023090362548828125, 0.03188323974609375, 0.040676116943359375, 0.049468994140625, 0.058261871337890625, 0.06705474853515625, 0.07584762573242188, 0.0846405029296875, 0.09343338012695312, 0.10222625732421875, 0.11101913452148438, 0.11981201171875, 0.12860488891601562, 0.13739776611328125, 0.14619064331054688, 0.1549835205078125, 0.16377639770507812, 0.17256927490234375, 0.18136215209960938, 0.190155029296875, 0.19894790649414062, 0.20774078369140625, 0.21653366088867188, 0.2253265380859375, 0.23411941528320312, 0.24291229248046875, 0.2517051696777344, 0.260498046875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 2.0, 4.0, 7.0, 8.0, 20.0, 25.0, 35.0, 65.0, 92.0, 114.0, 144.0, 156.0, 87.0, 90.0, 58.0, 43.0, 19.0, 12.0, 6.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2217812538146973, -1.1683746576309204, -1.114967942237854, -1.0615613460540771, -1.0081546306610107, -0.9547480344772339, -0.9013413190841675, -0.8479347229003906, -0.7945280075073242, -0.7411213517189026, -0.687714695930481, -0.6343080401420593, -0.5809013843536377, -0.5274947881698608, -0.4740881025791168, -0.4206814467906952, -0.36727482080459595, -0.3138681650161743, -0.2604615092277527, -0.20705486834049225, -0.15364821255207062, -0.10024157166481018, -0.04683491587638855, 0.006571739912033081, 0.05997839570045471, 0.11338505148887634, 0.16679170727729797, 0.2201983481645584, 0.27360498905181885, 0.3270116448402405, 0.3804183006286621, 0.43382495641708374, 0.48723161220550537, 0.540638267993927, 0.5940449237823486, 0.6474515795707703, 0.7008582353591919, 0.7542648315429688, 0.8076715469360352, 0.861078143119812, 0.9144848585128784, 0.9678915143013, 1.0212981700897217, 1.0747047662734985, 1.128111481666565, 1.1815180778503418, 1.2349247932434082, 1.288331389427185, 1.341737985610962, 1.3951445817947388, 1.4485512971878052, 1.501957893371582, 1.5553646087646484, 1.6087712049484253, 1.6621779203414917, 1.7155845165252686, 1.768991231918335, 1.8223978281021118, 1.8758045434951782, 1.929211139678955, 1.9826178550720215, 2.036024570465088, 2.089431047439575, 2.1428377628326416, 2.196244478225708]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 5.0, 11.0, 14.0, 8.0, 22.0, 13.0, 15.0, 17.0, 20.0, 30.0, 40.0, 49.0, 40.0, 42.0, 45.0, 48.0, 60.0, 59.0, 43.0, 45.0, 40.0, 48.0, 41.0, 35.0, 44.0, 30.0, 28.0, 22.0, 19.0, 10.0, 14.0, 8.0, 9.0, 4.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.758748471736908, -0.7333011031150818, -0.7078537940979004, -0.6824064254760742, -0.656959056854248, -0.6315117478370667, -0.6060643792152405, -0.5806170701980591, -0.5551697015762329, -0.5297223329544067, -0.5042750239372253, -0.47882765531539917, -0.4533803164958954, -0.4279329776763916, -0.40248560905456543, -0.37703827023506165, -0.35159093141555786, -0.3261435925960541, -0.3006962537765503, -0.2752488851547241, -0.24980154633522034, -0.22435420751571655, -0.19890685379505157, -0.1734595000743866, -0.1480121612548828, -0.12256481498479843, -0.09711746871471405, -0.07167012244462967, -0.04622277617454529, -0.020775437355041504, 0.004671916365623474, 0.030119270086288452, 0.05556666851043701, 0.08101401478052139, 0.10646136105060577, 0.13190871477127075, 0.15735605359077454, 0.18280339241027832, 0.2082507461309433, 0.23369809985160828, 0.25914543867111206, 0.28459277749061584, 0.31004011631011963, 0.3354874849319458, 0.3609348237514496, 0.38638216257095337, 0.41182953119277954, 0.4372768700122833, 0.4627242088317871, 0.4881715476512909, 0.5136188864707947, 0.5390662550926208, 0.5645135641098022, 0.5899609327316284, 0.6154083013534546, 0.6408556699752808, 0.6663029789924622, 0.6917503476142883, 0.7171976566314697, 0.7426450252532959, 0.7680923938751221, 0.7935397028923035, 0.8189870715141296, 0.844434380531311, 0.8698817491531372]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 9.0, 9.0, 21.0, 25.0, 64.0, 125.0, 342.0, 1005.0, 4195.0, 23195.0, 207437.0, 715826.0, 81440.0, 11355.0, 2385.0, 654.0, 236.0, 88.0, 46.0, 24.0, 14.0, 12.0, 9.0, 10.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.5390625, -0.5246124267578125, -0.510162353515625, -0.4957122802734375, -0.48126220703125, -0.4668121337890625, -0.452362060546875, -0.4379119873046875, -0.4234619140625, -0.4090118408203125, -0.394561767578125, -0.3801116943359375, -0.36566162109375, -0.3512115478515625, -0.336761474609375, -0.3223114013671875, -0.307861328125, -0.2934112548828125, -0.278961181640625, -0.2645111083984375, -0.25006103515625, -0.2356109619140625, -0.221160888671875, -0.2067108154296875, -0.1922607421875, -0.1778106689453125, -0.163360595703125, -0.1489105224609375, -0.13446044921875, -0.1200103759765625, -0.105560302734375, -0.0911102294921875, -0.07666015625, -0.0622100830078125, -0.047760009765625, -0.0333099365234375, -0.01885986328125, -0.0044097900390625, 0.010040283203125, 0.0244903564453125, 0.0389404296875, 0.0533905029296875, 0.067840576171875, 0.0822906494140625, 0.09674072265625, 0.1111907958984375, 0.125640869140625, 0.1400909423828125, 0.154541015625, 0.1689910888671875, 0.183441162109375, 0.1978912353515625, 0.21234130859375, 0.2267913818359375, 0.241241455078125, 0.2556915283203125, 0.2701416015625, 0.2845916748046875, 0.299041748046875, 0.3134918212890625, 0.32794189453125, 0.3423919677734375, 0.356842041015625, 0.3712921142578125, 0.3857421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 10.0, 10.0, 19.0, 15.0, 31.0, 43.0, 47.0, 61.0, 79.0, 77.0, 71.0, 83.0, 74.0, 89.0, 64.0, 46.0, 39.0, 43.0, 26.0, 10.0, 17.0, 11.0, 6.0, 8.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6142578125, -0.58892822265625, -0.5635986328125, -0.53826904296875, -0.512939453125, -0.48760986328125, -0.4622802734375, -0.43695068359375, -0.41162109375, -0.38629150390625, -0.3609619140625, -0.33563232421875, -0.310302734375, -0.28497314453125, -0.2596435546875, -0.23431396484375, -0.208984375, -0.18365478515625, -0.1583251953125, -0.13299560546875, -0.107666015625, -0.08233642578125, -0.0570068359375, -0.03167724609375, -0.00634765625, 0.01898193359375, 0.0443115234375, 0.06964111328125, 0.094970703125, 0.12030029296875, 0.1456298828125, 0.17095947265625, 0.1962890625, 0.22161865234375, 0.2469482421875, 0.27227783203125, 0.297607421875, 0.32293701171875, 0.3482666015625, 0.37359619140625, 0.39892578125, 0.42425537109375, 0.4495849609375, 0.47491455078125, 0.500244140625, 0.52557373046875, 0.5509033203125, 0.57623291015625, 0.6015625, 0.62689208984375, 0.6522216796875, 0.67755126953125, 0.702880859375, 0.72821044921875, 0.7535400390625, 0.77886962890625, 0.80419921875, 0.82952880859375, 0.8548583984375, 0.88018798828125, 0.905517578125, 0.93084716796875, 0.9561767578125, 0.98150634765625, 1.0068359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 6.0, 11.0, 5.0, 5.0, 21.0, 27.0, 42.0, 46.0, 76.0, 106.0, 172.0, 269.0, 584.0, 1474.0, 4391.0, 17985.0, 124699.0, 694792.0, 172864.0, 22506.0, 5168.0, 1741.0, 645.0, 338.0, 185.0, 122.0, 80.0, 58.0, 43.0, 29.0, 9.0, 12.0, 10.0, 8.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255615234375, -0.24599456787109375, -0.2363739013671875, -0.22675323486328125, -0.217132568359375, -0.20751190185546875, -0.1978912353515625, -0.18827056884765625, -0.17864990234375, -0.16902923583984375, -0.1594085693359375, -0.14978790283203125, -0.140167236328125, -0.13054656982421875, -0.1209259033203125, -0.11130523681640625, -0.1016845703125, -0.09206390380859375, -0.0824432373046875, -0.07282257080078125, -0.063201904296875, -0.05358123779296875, -0.0439605712890625, -0.03433990478515625, -0.02471923828125, -0.01509857177734375, -0.0054779052734375, 0.00414276123046875, 0.013763427734375, 0.02338409423828125, 0.0330047607421875, 0.04262542724609375, 0.05224609375, 0.06186676025390625, 0.0714874267578125, 0.08110809326171875, 0.090728759765625, 0.10034942626953125, 0.1099700927734375, 0.11959075927734375, 0.12921142578125, 0.13883209228515625, 0.1484527587890625, 0.15807342529296875, 0.167694091796875, 0.17731475830078125, 0.1869354248046875, 0.19655609130859375, 0.2061767578125, 0.21579742431640625, 0.2254180908203125, 0.23503875732421875, 0.244659423828125, 0.25428009033203125, 0.2639007568359375, 0.27352142333984375, 0.28314208984375, 0.29276275634765625, 0.3023834228515625, 0.31200408935546875, 0.321624755859375, 0.33124542236328125, 0.3408660888671875, 0.35048675537109375, 0.360107421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 9.0, 7.0, 9.0, 14.0, 21.0, 12.0, 25.0, 24.0, 24.0, 36.0, 44.0, 48.0, 41.0, 52.0, 48.0, 56.0, 46.0, 45.0, 60.0, 47.0, 43.0, 45.0, 36.0, 25.0, 37.0, 25.0, 21.0, 31.0, 17.0, 15.0, 8.0, 6.0, 11.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.158203125, -1.1248703002929688, -1.0915374755859375, -1.0582046508789062, -1.024871826171875, -0.9915390014648438, -0.9582061767578125, -0.9248733520507812, -0.89154052734375, -0.8582077026367188, -0.8248748779296875, -0.7915420532226562, -0.758209228515625, -0.7248764038085938, -0.6915435791015625, -0.6582107543945312, -0.6248779296875, -0.5915451049804688, -0.5582122802734375, -0.5248794555664062, -0.491546630859375, -0.45821380615234375, -0.4248809814453125, -0.39154815673828125, -0.35821533203125, -0.32488250732421875, -0.2915496826171875, -0.25821685791015625, -0.224884033203125, -0.19155120849609375, -0.1582183837890625, -0.12488555908203125, -0.091552734375, -0.05821990966796875, -0.0248870849609375, 0.00844573974609375, 0.041778564453125, 0.07511138916015625, 0.1084442138671875, 0.14177703857421875, 0.17510986328125, 0.20844268798828125, 0.2417755126953125, 0.27510833740234375, 0.308441162109375, 0.34177398681640625, 0.3751068115234375, 0.40843963623046875, 0.4417724609375, 0.47510528564453125, 0.5084381103515625, 0.5417709350585938, 0.575103759765625, 0.6084365844726562, 0.6417694091796875, 0.6751022338867188, 0.70843505859375, 0.7417678833007812, 0.7751007080078125, 0.8084335327148438, 0.841766357421875, 0.8750991821289062, 0.9084320068359375, 0.9417648315429688, 0.97509765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 12.0, 18.0, 19.0, 38.0, 65.0, 118.0, 294.0, 657.0, 2455.0, 18976.0, 876596.0, 141008.0, 6203.0, 1283.0, 400.0, 197.0, 82.0, 42.0, 30.0, 11.0, 9.0, 11.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.2648658752441406, -0.25458526611328125, -0.24430465698242188, -0.2340240478515625, -0.22374343872070312, -0.21346282958984375, -0.20318222045898438, -0.192901611328125, -0.18262100219726562, -0.17234039306640625, -0.16205978393554688, -0.1517791748046875, -0.14149856567382812, -0.13121795654296875, -0.12093734741210938, -0.11065673828125, -0.10037612915039062, -0.09009552001953125, -0.07981491088867188, -0.0695343017578125, -0.059253692626953125, -0.04897308349609375, -0.038692474365234375, -0.028411865234375, -0.018131256103515625, -0.00785064697265625, 0.002429962158203125, 0.0127105712890625, 0.022991180419921875, 0.03327178955078125, 0.043552398681640625, 0.0538330078125, 0.06411361694335938, 0.07439422607421875, 0.08467483520507812, 0.0949554443359375, 0.10523605346679688, 0.11551666259765625, 0.12579727172851562, 0.136077880859375, 0.14635848999023438, 0.15663909912109375, 0.16691970825195312, 0.1772003173828125, 0.18748092651367188, 0.19776153564453125, 0.20804214477539062, 0.21832275390625, 0.22860336303710938, 0.23888397216796875, 0.24916458129882812, 0.2594451904296875, 0.2697257995605469, 0.28000640869140625, 0.2902870178222656, 0.300567626953125, 0.3108482360839844, 0.32112884521484375, 0.3314094543457031, 0.3416900634765625, 0.3519706726074219, 0.36225128173828125, 0.3725318908691406, 0.3828125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 12.0, 14.0, 9.0, 21.0, 34.0, 60.0, 71.0, 89.0, 107.0, 111.0, 106.0, 82.0, 63.0, 54.0, 38.0, 29.0, 31.0, 9.0, 13.0, 7.0, 5.0, 8.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7756900787353516e-05, -5.5856071412563324e-05, -5.395524203777313e-05, -5.205441266298294e-05, -5.015358328819275e-05, -4.825275391340256e-05, -4.6351924538612366e-05, -4.4451095163822174e-05, -4.255026578903198e-05, -4.064943641424179e-05, -3.87486070394516e-05, -3.684777766466141e-05, -3.4946948289871216e-05, -3.3046118915081024e-05, -3.114528954029083e-05, -2.924446016550064e-05, -2.734363079071045e-05, -2.5442801415920258e-05, -2.3541972041130066e-05, -2.1641142666339874e-05, -1.9740313291549683e-05, -1.783948391675949e-05, -1.59386545419693e-05, -1.4037825167179108e-05, -1.2136995792388916e-05, -1.0236166417598724e-05, -8.335337042808533e-06, -6.434507668018341e-06, -4.533678293228149e-06, -2.6328489184379578e-06, -7.320195436477661e-07, 1.1688098311424255e-06, 3.069639205932617e-06, 4.970468580722809e-06, 6.8712979555130005e-06, 8.772127330303192e-06, 1.0672956705093384e-05, 1.2573786079883575e-05, 1.4474615454673767e-05, 1.637544482946396e-05, 1.827627420425415e-05, 2.0177103579044342e-05, 2.2077932953834534e-05, 2.3978762328624725e-05, 2.5879591703414917e-05, 2.778042107820511e-05, 2.96812504529953e-05, 3.158207982778549e-05, 3.3482909202575684e-05, 3.5383738577365875e-05, 3.728456795215607e-05, 3.918539732694626e-05, 4.108622670173645e-05, 4.298705607652664e-05, 4.4887885451316833e-05, 4.6788714826107025e-05, 4.868954420089722e-05, 5.059037357568741e-05, 5.24912029504776e-05, 5.439203232526779e-05, 5.6292861700057983e-05, 5.8193691074848175e-05, 6.009452044963837e-05, 6.199534982442856e-05, 6.389617919921875e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 6.0, 4.0, 11.0, 17.0, 25.0, 32.0, 59.0, 97.0, 148.0, 316.0, 777.0, 2047.0, 7212.0, 38777.0, 365344.0, 559880.0, 59594.0, 9829.0, 2679.0, 858.0, 385.0, 194.0, 96.0, 51.0, 40.0, 21.0, 16.0, 11.0, 7.0, 5.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.163818359375, -0.1585521697998047, -0.15328598022460938, -0.14801979064941406, -0.14275360107421875, -0.13748741149902344, -0.13222122192382812, -0.1269550323486328, -0.1216888427734375, -0.11642265319824219, -0.11115646362304688, -0.10589027404785156, -0.10062408447265625, -0.09535789489746094, -0.09009170532226562, -0.08482551574707031, -0.079559326171875, -0.07429313659667969, -0.06902694702148438, -0.06376075744628906, -0.05849456787109375, -0.05322837829589844, -0.047962188720703125, -0.04269599914550781, -0.0374298095703125, -0.03216361999511719, -0.026897430419921875, -0.021631240844726562, -0.01636505126953125, -0.011098861694335938, -0.005832672119140625, -0.0005664825439453125, 0.00469970703125, 0.009965896606445312, 0.015232086181640625, 0.020498275756835938, 0.02576446533203125, 0.031030654907226562, 0.036296844482421875, 0.04156303405761719, 0.0468292236328125, 0.05209541320800781, 0.057361602783203125, 0.06262779235839844, 0.06789398193359375, 0.07316017150878906, 0.07842636108398438, 0.08369255065917969, 0.088958740234375, 0.09422492980957031, 0.09949111938476562, 0.10475730895996094, 0.11002349853515625, 0.11528968811035156, 0.12055587768554688, 0.1258220672607422, 0.1310882568359375, 0.1363544464111328, 0.14162063598632812, 0.14688682556152344, 0.15215301513671875, 0.15741920471191406, 0.16268539428710938, 0.1679515838623047, 0.1732177734375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 4.0, 8.0, 7.0, 12.0, 12.0, 21.0, 18.0, 36.0, 44.0, 50.0, 87.0, 108.0, 107.0, 102.0, 87.0, 74.0, 50.0, 44.0, 30.0, 17.0, 27.0, 11.0, 11.0, 9.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033538818359375, -0.03255033493041992, -0.031561851501464844, -0.030573368072509766, -0.029584884643554688, -0.02859640121459961, -0.02760791778564453, -0.026619434356689453, -0.025630950927734375, -0.024642467498779297, -0.02365398406982422, -0.02266550064086914, -0.021677017211914062, -0.020688533782958984, -0.019700050354003906, -0.018711566925048828, -0.01772308349609375, -0.016734600067138672, -0.015746116638183594, -0.014757633209228516, -0.013769149780273438, -0.01278066635131836, -0.011792182922363281, -0.010803699493408203, -0.009815216064453125, -0.008826732635498047, -0.007838249206542969, -0.006849765777587891, -0.0058612823486328125, -0.004872798919677734, -0.0038843154907226562, -0.002895832061767578, -0.0019073486328125, -0.0009188652038574219, 6.961822509765625e-05, 0.0010581016540527344, 0.0020465850830078125, 0.0030350685119628906, 0.004023551940917969, 0.005012035369873047, 0.006000518798828125, 0.006989002227783203, 0.007977485656738281, 0.00896596908569336, 0.009954452514648438, 0.010942935943603516, 0.011931419372558594, 0.012919902801513672, 0.01390838623046875, 0.014896869659423828, 0.015885353088378906, 0.016873836517333984, 0.017862319946289062, 0.01885080337524414, 0.01983928680419922, 0.020827770233154297, 0.021816253662109375, 0.022804737091064453, 0.02379322052001953, 0.02478170394897461, 0.025770187377929688, 0.026758670806884766, 0.027747154235839844, 0.028735637664794922, 0.02972412109375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 1.0, 7.0, 9.0, 15.0, 23.0, 37.0, 74.0, 126.0, 158.0, 165.0, 151.0, 101.0, 59.0, 29.0, 13.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8272049427032471, -0.7863610982894897, -0.7455172538757324, -0.7046734094619751, -0.6638295650482178, -0.6229857206344604, -0.5821418762207031, -0.5412980318069458, -0.5004541873931885, -0.45961034297943115, -0.41876649856567383, -0.3779226541519165, -0.3370788097381592, -0.29623496532440186, -0.25539112091064453, -0.2145472764968872, -0.17370343208312988, -0.13285958766937256, -0.09201574325561523, -0.05117189884185791, -0.010328054428100586, 0.03051578998565674, 0.07135963439941406, 0.11220347881317139, 0.1530473232269287, 0.19389116764068604, 0.23473501205444336, 0.2755788564682007, 0.316422700881958, 0.35726654529571533, 0.39811038970947266, 0.43895423412323, 0.47979795932769775, 0.5206418037414551, 0.5614856481552124, 0.6023294925689697, 0.643173336982727, 0.6840171813964844, 0.7248610258102417, 0.765704870223999, 0.8065487146377563, 0.8473925590515137, 0.888236403465271, 0.9290802478790283, 0.9699240922927856, 1.010767936706543, 1.0516117811203003, 1.0924556255340576, 1.133299469947815, 1.1741433143615723, 1.2149871587753296, 1.255831003189087, 1.2966748476028442, 1.3375186920166016, 1.3783625364303589, 1.4192063808441162, 1.4600502252578735, 1.5008940696716309, 1.5417379140853882, 1.5825817584991455, 1.6234256029129028, 1.6642694473266602, 1.7051132917404175, 1.7459571361541748, 1.7868009805679321]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 7.0, 12.0, 10.0, 20.0, 25.0, 26.0, 26.0, 52.0, 59.0, 72.0, 82.0, 87.0, 99.0, 79.0, 69.0, 69.0, 55.0, 50.0, 30.0, 26.0, 16.0, 12.0, 8.0, 10.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5463542938232422, -0.5193899273872375, -0.4924255609512329, -0.4654611647129059, -0.43849679827690125, -0.4115324318408966, -0.3845680356025696, -0.35760366916656494, -0.3306393027305603, -0.30367493629455566, -0.276710569858551, -0.249746173620224, -0.22278180718421936, -0.19581744074821472, -0.1688530594110489, -0.14188867807388306, -0.11492431163787842, -0.08795993775129318, -0.06099556386470795, -0.03403118997812271, -0.007066816091537476, 0.019897550344467163, 0.046861931681632996, 0.07382631301879883, 0.10079067945480347, 0.1277550458908081, 0.15471942722797394, 0.18168380856513977, 0.2086481750011444, 0.23561254143714905, 0.2625769376754761, 0.2895413041114807, 0.31650567054748535, 0.34347003698349, 0.37043440341949463, 0.39739879965782166, 0.4243631660938263, 0.45132753252983093, 0.47829192876815796, 0.5052562952041626, 0.5322206616401672, 0.5591850280761719, 0.5861493945121765, 0.6131137609481812, 0.6400781869888306, 0.6670424938201904, 0.6940069198608398, 0.7209712862968445, 0.7479356527328491, 0.7749000191688538, 0.8018643856048584, 0.828828752040863, 0.8557931184768677, 0.8827575445175171, 0.9097219109535217, 0.9366862773895264, 0.963650643825531, 0.9906150102615356, 1.017579436302185, 1.044543743133545, 1.0715081691741943, 1.0984724760055542, 1.1254369020462036, 1.1524012088775635, 1.179365634918213]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 0.0, 3.0, 9.0, 5.0, 11.0, 14.0, 24.0, 31.0, 43.0, 69.0, 150.0, 606.0, 4381.0, 91370.0, 892444.0, 55304.0, 3249.0, 510.0, 129.0, 65.0, 33.0, 28.0, 16.0, 19.0, 9.0, 8.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.98046875, -1.913177490234375, -1.84588623046875, -1.778594970703125, -1.7113037109375, -1.644012451171875, -1.57672119140625, -1.509429931640625, -1.442138671875, -1.374847412109375, -1.30755615234375, -1.240264892578125, -1.1729736328125, -1.105682373046875, -1.03839111328125, -0.971099853515625, -0.90380859375, -0.836517333984375, -0.76922607421875, -0.701934814453125, -0.6346435546875, -0.567352294921875, -0.50006103515625, -0.432769775390625, -0.365478515625, -0.298187255859375, -0.23089599609375, -0.163604736328125, -0.0963134765625, -0.029022216796875, 0.03826904296875, 0.105560302734375, 0.1728515625, 0.240142822265625, 0.30743408203125, 0.374725341796875, 0.4420166015625, 0.509307861328125, 0.57659912109375, 0.643890380859375, 0.711181640625, 0.778472900390625, 0.84576416015625, 0.913055419921875, 0.9803466796875, 1.047637939453125, 1.11492919921875, 1.182220458984375, 1.24951171875, 1.316802978515625, 1.38409423828125, 1.451385498046875, 1.5186767578125, 1.585968017578125, 1.65325927734375, 1.720550537109375, 1.787841796875, 1.855133056640625, 1.92242431640625, 1.989715576171875, 2.0570068359375, 2.124298095703125, 2.19158935546875, 2.258880615234375, 2.326171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 7.0, 17.0, 43.0, 52.0, 62.0, 115.0, 164.0, 173.0, 137.0, 105.0, 61.0, 41.0, 17.0, 7.0, 6.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.140625, -1.039306640625, -0.93798828125, -0.836669921875, -0.7353515625, -0.634033203125, -0.53271484375, -0.431396484375, -0.330078125, -0.228759765625, -0.12744140625, -0.026123046875, 0.0751953125, 0.176513671875, 0.27783203125, 0.379150390625, 0.48046875, 0.581787109375, 0.68310546875, 0.784423828125, 0.8857421875, 0.987060546875, 1.08837890625, 1.189697265625, 1.291015625, 1.392333984375, 1.49365234375, 1.594970703125, 1.6962890625, 1.797607421875, 1.89892578125, 2.000244140625, 2.1015625, 2.202880859375, 2.30419921875, 2.405517578125, 2.5068359375, 2.608154296875, 2.70947265625, 2.810791015625, 2.912109375, 3.013427734375, 3.11474609375, 3.216064453125, 3.3173828125, 3.418701171875, 3.52001953125, 3.621337890625, 3.72265625, 3.823974609375, 3.92529296875, 4.026611328125, 4.1279296875, 4.229248046875, 4.33056640625, 4.431884765625, 4.533203125, 4.634521484375, 4.73583984375, 4.837158203125, 4.9384765625, 5.039794921875, 5.14111328125, 5.242431640625, 5.34375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 6.0, 11.0, 9.0, 23.0, 19.0, 19.0, 23.0, 35.0, 45.0, 57.0, 80.0, 85.0, 139.0, 183.0, 376.0, 1061.0, 4650.0, 43074.0, 649109.0, 324505.0, 20492.0, 2838.0, 723.0, 307.0, 138.0, 109.0, 87.0, 59.0, 50.0, 30.0, 38.0, 35.0, 18.0, 25.0, 24.0, 8.0, 14.0, 10.0, 2.0, 4.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.3193359375, -1.2791748046875, -1.239013671875, -1.1988525390625, -1.15869140625, -1.1185302734375, -1.078369140625, -1.0382080078125, -0.998046875, -0.9578857421875, -0.917724609375, -0.8775634765625, -0.83740234375, -0.7972412109375, -0.757080078125, -0.7169189453125, -0.6767578125, -0.6365966796875, -0.596435546875, -0.5562744140625, -0.51611328125, -0.4759521484375, -0.435791015625, -0.3956298828125, -0.35546875, -0.3153076171875, -0.275146484375, -0.2349853515625, -0.19482421875, -0.1546630859375, -0.114501953125, -0.0743408203125, -0.0341796875, 0.0059814453125, 0.046142578125, 0.0863037109375, 0.12646484375, 0.1666259765625, 0.206787109375, 0.2469482421875, 0.287109375, 0.3272705078125, 0.367431640625, 0.4075927734375, 0.44775390625, 0.4879150390625, 0.528076171875, 0.5682373046875, 0.6083984375, 0.6485595703125, 0.688720703125, 0.7288818359375, 0.76904296875, 0.8092041015625, 0.849365234375, 0.8895263671875, 0.9296875, 0.9698486328125, 1.010009765625, 1.0501708984375, 1.09033203125, 1.1304931640625, 1.170654296875, 1.2108154296875, 1.2509765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 9.0, 2.0, 2.0, 6.0, 4.0, 8.0, 9.0, 11.0, 16.0, 13.0, 18.0, 13.0, 21.0, 32.0, 22.0, 35.0, 36.0, 42.0, 35.0, 38.0, 36.0, 39.0, 46.0, 37.0, 47.0, 30.0, 47.0, 36.0, 34.0, 36.0, 33.0, 33.0, 19.0, 23.0, 20.0, 28.0, 21.0, 17.0, 10.0, 9.0, 6.0, 4.0, 4.0, 7.0, 2.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.94189453125, -0.9106674194335938, -0.8794403076171875, -0.8482131958007812, -0.816986083984375, -0.7857589721679688, -0.7545318603515625, -0.7233047485351562, -0.69207763671875, -0.6608505249023438, -0.6296234130859375, -0.5983963012695312, -0.567169189453125, -0.5359420776367188, -0.5047149658203125, -0.47348785400390625, -0.4422607421875, -0.41103363037109375, -0.3798065185546875, -0.34857940673828125, -0.317352294921875, -0.28612518310546875, -0.2548980712890625, -0.22367095947265625, -0.19244384765625, -0.16121673583984375, -0.1299896240234375, -0.09876251220703125, -0.067535400390625, -0.03630828857421875, -0.0050811767578125, 0.02614593505859375, 0.057373046875, 0.08860015869140625, 0.1198272705078125, 0.15105438232421875, 0.182281494140625, 0.21350860595703125, 0.2447357177734375, 0.27596282958984375, 0.30718994140625, 0.33841705322265625, 0.3696441650390625, 0.40087127685546875, 0.432098388671875, 0.46332550048828125, 0.4945526123046875, 0.5257797241210938, 0.5570068359375, 0.5882339477539062, 0.6194610595703125, 0.6506881713867188, 0.681915283203125, 0.7131423950195312, 0.7443695068359375, 0.7755966186523438, 0.80682373046875, 0.8380508422851562, 0.8692779541015625, 0.9005050659179688, 0.931732177734375, 0.9629592895507812, 0.9941864013671875, 1.0254135131835938, 1.056640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 6.0, 12.0, 11.0, 16.0, 19.0, 32.0, 36.0, 54.0, 84.0, 100.0, 142.0, 262.0, 448.0, 694.0, 1181.0, 2459.0, 4943.0, 11032.0, 27442.0, 76559.0, 217646.0, 379590.0, 206328.0, 72632.0, 26244.0, 10512.0, 4702.0, 2276.0, 1230.0, 691.0, 421.0, 233.0, 171.0, 102.0, 72.0, 43.0, 36.0, 37.0, 15.0, 15.0, 7.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12744140625, -0.12311744689941406, -0.11879348754882812, -0.11446952819824219, -0.11014556884765625, -0.10582160949707031, -0.10149765014648438, -0.09717369079589844, -0.0928497314453125, -0.08852577209472656, -0.08420181274414062, -0.07987785339355469, -0.07555389404296875, -0.07122993469238281, -0.06690597534179688, -0.06258201599121094, -0.058258056640625, -0.05393409729003906, -0.049610137939453125, -0.04528617858886719, -0.04096221923828125, -0.03663825988769531, -0.032314300537109375, -0.027990341186523438, -0.0236663818359375, -0.019342422485351562, -0.015018463134765625, -0.010694503784179688, -0.00637054443359375, -0.0020465850830078125, 0.002277374267578125, 0.0066013336181640625, 0.01092529296875, 0.015249252319335938, 0.019573211669921875, 0.023897171020507812, 0.02822113037109375, 0.03254508972167969, 0.036869049072265625, 0.04119300842285156, 0.0455169677734375, 0.04984092712402344, 0.054164886474609375, 0.05848884582519531, 0.06281280517578125, 0.06713676452636719, 0.07146072387695312, 0.07578468322753906, 0.080108642578125, 0.08443260192871094, 0.08875656127929688, 0.09308052062988281, 0.09740447998046875, 0.10172843933105469, 0.10605239868164062, 0.11037635803222656, 0.1147003173828125, 0.11902427673339844, 0.12334823608398438, 0.1276721954345703, 0.13199615478515625, 0.1363201141357422, 0.14064407348632812, 0.14496803283691406, 0.1492919921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 4.0, 9.0, 6.0, 10.0, 16.0, 17.0, 24.0, 30.0, 28.0, 28.0, 38.0, 50.0, 46.0, 62.0, 68.0, 66.0, 87.0, 62.0, 64.0, 48.0, 48.0, 36.0, 26.0, 20.0, 23.0, 15.0, 9.0, 11.0, 12.0, 6.0, 10.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.248453140258789e-05, -3.1521543860435486e-05, -3.055855631828308e-05, -2.9595568776130676e-05, -2.863258123397827e-05, -2.7669593691825867e-05, -2.6706606149673462e-05, -2.5743618607521057e-05, -2.4780631065368652e-05, -2.3817643523216248e-05, -2.2854655981063843e-05, -2.1891668438911438e-05, -2.0928680896759033e-05, -1.996569335460663e-05, -1.9002705812454224e-05, -1.803971827030182e-05, -1.7076730728149414e-05, -1.611374318599701e-05, -1.5150755643844604e-05, -1.41877681016922e-05, -1.3224780559539795e-05, -1.226179301738739e-05, -1.1298805475234985e-05, -1.033581793308258e-05, -9.372830390930176e-06, -8.409842848777771e-06, -7.446855306625366e-06, -6.4838677644729614e-06, -5.520880222320557e-06, -4.557892680168152e-06, -3.594905138015747e-06, -2.6319175958633423e-06, -1.6689300537109375e-06, -7.059425115585327e-07, 2.5704503059387207e-07, 1.2200325727462769e-06, 2.1830201148986816e-06, 3.1460076570510864e-06, 4.108995199203491e-06, 5.071982741355896e-06, 6.034970283508301e-06, 6.9979578256607056e-06, 7.96094536781311e-06, 8.923932909965515e-06, 9.88692045211792e-06, 1.0849907994270325e-05, 1.181289553642273e-05, 1.2775883078575134e-05, 1.3738870620727539e-05, 1.4701858162879944e-05, 1.566484570503235e-05, 1.6627833247184753e-05, 1.7590820789337158e-05, 1.8553808331489563e-05, 1.9516795873641968e-05, 2.0479783415794373e-05, 2.1442770957946777e-05, 2.2405758500099182e-05, 2.3368746042251587e-05, 2.4331733584403992e-05, 2.5294721126556396e-05, 2.62577086687088e-05, 2.7220696210861206e-05, 2.818368375301361e-05, 2.9146671295166016e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 9.0, 15.0, 19.0, 38.0, 55.0, 67.0, 140.0, 219.0, 346.0, 766.0, 1663.0, 3939.0, 10893.0, 35609.0, 138013.0, 455325.0, 296118.0, 73150.0, 20279.0, 6832.0, 2524.0, 1178.0, 539.0, 328.0, 182.0, 99.0, 59.0, 44.0, 32.0, 22.0, 12.0, 9.0, 10.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1988525390625, -0.19278526306152344, -0.18671798706054688, -0.1806507110595703, -0.17458343505859375, -0.1685161590576172, -0.16244888305664062, -0.15638160705566406, -0.1503143310546875, -0.14424705505371094, -0.13817977905273438, -0.1321125030517578, -0.12604522705078125, -0.11997795104980469, -0.11391067504882812, -0.10784339904785156, -0.101776123046875, -0.09570884704589844, -0.08964157104492188, -0.08357429504394531, -0.07750701904296875, -0.07143974304199219, -0.06537246704101562, -0.05930519104003906, -0.0532379150390625, -0.04717063903808594, -0.041103363037109375, -0.03503608703613281, -0.02896881103515625, -0.022901535034179688, -0.016834259033203125, -0.010766983032226562, -0.00469970703125, 0.0013675689697265625, 0.007434844970703125, 0.013502120971679688, 0.01956939697265625, 0.025636672973632812, 0.031703948974609375, 0.03777122497558594, 0.0438385009765625, 0.04990577697753906, 0.055973052978515625, 0.06204032897949219, 0.06810760498046875, 0.07417488098144531, 0.08024215698242188, 0.08630943298339844, 0.092376708984375, 0.09844398498535156, 0.10451126098632812, 0.11057853698730469, 0.11664581298828125, 0.12271308898925781, 0.12878036499023438, 0.13484764099121094, 0.1409149169921875, 0.14698219299316406, 0.15304946899414062, 0.1591167449951172, 0.16518402099609375, 0.1712512969970703, 0.17731857299804688, 0.18338584899902344, 0.189453125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 3.0, 9.0, 7.0, 12.0, 17.0, 27.0, 23.0, 46.0, 41.0, 59.0, 58.0, 66.0, 82.0, 72.0, 67.0, 69.0, 59.0, 51.0, 42.0, 39.0, 35.0, 33.0, 20.0, 21.0, 11.0, 9.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06939697265625, -0.06636905670166016, -0.06334114074707031, -0.06031322479248047, -0.057285308837890625, -0.05425739288330078, -0.05122947692871094, -0.048201560974121094, -0.04517364501953125, -0.042145729064941406, -0.03911781311035156, -0.03608989715576172, -0.033061981201171875, -0.03003406524658203, -0.027006149291992188, -0.023978233337402344, -0.0209503173828125, -0.017922401428222656, -0.014894485473632812, -0.011866569519042969, -0.008838653564453125, -0.005810737609863281, -0.0027828216552734375, 0.00024509429931640625, 0.00327301025390625, 0.006300926208496094, 0.009328842163085938, 0.012356758117675781, 0.015384674072265625, 0.01841259002685547, 0.021440505981445312, 0.024468421936035156, 0.027496337890625, 0.030524253845214844, 0.03355216979980469, 0.03658008575439453, 0.039608001708984375, 0.04263591766357422, 0.04566383361816406, 0.048691749572753906, 0.05171966552734375, 0.054747581481933594, 0.05777549743652344, 0.06080341339111328, 0.06383132934570312, 0.06685924530029297, 0.06988716125488281, 0.07291507720947266, 0.0759429931640625, 0.07897090911865234, 0.08199882507324219, 0.08502674102783203, 0.08805465698242188, 0.09108257293701172, 0.09411048889160156, 0.0971384048461914, 0.10016632080078125, 0.1031942367553711, 0.10622215270996094, 0.10925006866455078, 0.11227798461914062, 0.11530590057373047, 0.11833381652832031, 0.12136173248291016, 0.1243896484375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 10.0, 26.0, 157.0, 577.0, 207.0, 25.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.765289545059204, -1.4488767385482788, -1.1324639320373535, -0.8160512447357178, -0.4996384382247925, -0.1832256317138672, 0.13318705558776855, 0.4495999813079834, 0.7660126686096191, 1.0824254751205444, 1.3988382816314697, 1.7152509689331055, 2.0316638946533203, 2.348076581954956, 2.664489269256592, 2.9809021949768066, 3.2973148822784424, 3.613727569580078, 3.930140495300293, 4.246553421020508, 4.5629658699035645, 4.879378795623779, 5.195791244506836, 5.512204170227051, 5.828617095947266, 6.1450300216674805, 6.461442470550537, 6.777855396270752, 7.094268321990967, 7.410680770874023, 7.727093696594238, 8.043506622314453, 8.359919548034668, 8.676332473754883, 8.992745399475098, 9.309158325195312, 9.625570297241211, 9.941983222961426, 10.25839614868164, 10.574809074401855, 10.89122200012207, 11.207634925842285, 11.5240478515625, 11.840459823608398, 12.156872749328613, 12.473285675048828, 12.789698600769043, 13.106111526489258, 13.422523498535156, 13.738936424255371, 14.055349349975586, 14.371761322021484, 14.6881742477417, 15.004587173461914, 15.321000099182129, 15.637413024902344, 15.953825950622559, 16.270238876342773, 16.586650848388672, 16.903064727783203, 17.2194766998291, 17.535890579223633, 17.85230255126953, 18.168716430664062, 18.48512840270996]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 6.0, 6.0, 8.0, 21.0, 23.0, 33.0, 44.0, 58.0, 75.0, 73.0, 87.0, 94.0, 93.0, 80.0, 83.0, 59.0, 61.0, 35.0, 31.0, 19.0, 11.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9270498752593994, -1.8039333820343018, -1.6808167695999146, -1.5577001571655273, -1.4345836639404297, -1.311467170715332, -1.1883505582809448, -1.0652339458465576, -0.94211745262146, -0.8190008997917175, -0.6958843469619751, -0.5727677941322327, -0.44965124130249023, -0.3265346884727478, -0.20341813564300537, -0.08030158281326294, 0.04281497001647949, 0.16593152284622192, 0.28904807567596436, 0.4121646285057068, 0.5352811813354492, 0.6583977341651917, 0.7815142869949341, 0.9046308398246765, 1.027747392654419, 1.1508638858795166, 1.2739804983139038, 1.397097110748291, 1.5202136039733887, 1.6433300971984863, 1.7664467096328735, 1.8895633220672607, 2.0126800537109375, 2.135796546936035, 2.258913040161133, 2.3820297718048096, 2.5051462650299072, 2.628262758255005, 2.7513794898986816, 2.8744959831237793, 2.997612476348877, 3.1207289695739746, 3.2438454627990723, 3.366962194442749, 3.4900786876678467, 3.6131951808929443, 3.736311912536621, 3.8594284057617188, 3.9825448989868164, 4.105661392211914, 4.228777885437012, 4.351894378662109, 4.475010871887207, 4.598127841949463, 4.7212443351745605, 4.844360828399658, 4.967477321624756, 5.0905938148498535, 5.213710308074951, 5.336826801300049, 5.459943771362305, 5.583060264587402, 5.7061767578125, 5.829293251037598, 5.952409744262695]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 1.0, 9.0, 6.0, 18.0, 24.0, 38.0, 45.0, 47.0, 85.0, 133.0, 173.0, 232.0, 414.0, 676.0, 1137.0, 2058.0, 3872.0, 8420.0, 21387.0, 68574.0, 314162.0, 2205119.0, 1306432.0, 186939.0, 45154.0, 15305.0, 6448.0, 3052.0, 1594.0, 1011.0, 581.0, 359.0, 226.0, 168.0, 129.0, 70.0, 47.0, 40.0, 24.0, 22.0, 14.0, 12.0, 11.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.76513671875, -0.741119384765625, -0.71710205078125, -0.693084716796875, -0.6690673828125, -0.645050048828125, -0.62103271484375, -0.597015380859375, -0.572998046875, -0.548980712890625, -0.52496337890625, -0.500946044921875, -0.4769287109375, -0.452911376953125, -0.42889404296875, -0.404876708984375, -0.380859375, -0.356842041015625, -0.33282470703125, -0.308807373046875, -0.2847900390625, -0.260772705078125, -0.23675537109375, -0.212738037109375, -0.188720703125, -0.164703369140625, -0.14068603515625, -0.116668701171875, -0.0926513671875, -0.068634033203125, -0.04461669921875, -0.020599365234375, 0.00341796875, 0.027435302734375, 0.05145263671875, 0.075469970703125, 0.0994873046875, 0.123504638671875, 0.14752197265625, 0.171539306640625, 0.195556640625, 0.219573974609375, 0.24359130859375, 0.267608642578125, 0.2916259765625, 0.315643310546875, 0.33966064453125, 0.363677978515625, 0.3876953125, 0.411712646484375, 0.43572998046875, 0.459747314453125, 0.4837646484375, 0.507781982421875, 0.53179931640625, 0.555816650390625, 0.579833984375, 0.603851318359375, 0.62786865234375, 0.651885986328125, 0.6759033203125, 0.699920654296875, 0.72393798828125, 0.747955322265625, 0.77197265625]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 15.0, 7.0, 8.0, 11.0, 11.0, 12.0, 24.0, 30.0, 32.0, 38.0, 59.0, 47.0, 70.0, 55.0, 56.0, 55.0, 63.0, 61.0, 48.0, 37.0, 43.0, 37.0, 35.0, 34.0, 34.0, 19.0, 10.0, 10.0, 8.0, 5.0, 9.0, 4.0, 2.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.708984375, -0.6848068237304688, -0.6606292724609375, -0.6364517211914062, -0.612274169921875, -0.5880966186523438, -0.5639190673828125, -0.5397415161132812, -0.51556396484375, -0.49138641357421875, -0.4672088623046875, -0.44303131103515625, -0.418853759765625, -0.39467620849609375, -0.3704986572265625, -0.34632110595703125, -0.3221435546875, -0.29796600341796875, -0.2737884521484375, -0.24961090087890625, -0.225433349609375, -0.20125579833984375, -0.1770782470703125, -0.15290069580078125, -0.12872314453125, -0.10454559326171875, -0.0803680419921875, -0.05619049072265625, -0.032012939453125, -0.00783538818359375, 0.0163421630859375, 0.04051971435546875, 0.064697265625, 0.08887481689453125, 0.1130523681640625, 0.13722991943359375, 0.161407470703125, 0.18558502197265625, 0.2097625732421875, 0.23394012451171875, 0.25811767578125, 0.28229522705078125, 0.3064727783203125, 0.33065032958984375, 0.354827880859375, 0.37900543212890625, 0.4031829833984375, 0.42736053466796875, 0.4515380859375, 0.47571563720703125, 0.4998931884765625, 0.5240707397460938, 0.548248291015625, 0.5724258422851562, 0.5966033935546875, 0.6207809448242188, 0.64495849609375, 0.6691360473632812, 0.6933135986328125, 0.7174911499023438, 0.741668701171875, 0.7658462524414062, 0.7900238037109375, 0.8142013549804688, 0.83837890625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 9.0, 7.0, 12.0, 14.0, 24.0, 37.0, 51.0, 70.0, 117.0, 295.0, 868.0, 5102.0, 99913.0, 3997118.0, 84536.0, 4617.0, 844.0, 263.0, 138.0, 59.0, 49.0, 45.0, 29.0, 17.0, 13.0, 11.0, 6.0, 4.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.240234375, -2.1690673828125, -2.097900390625, -2.0267333984375, -1.95556640625, -1.8843994140625, -1.813232421875, -1.7420654296875, -1.6708984375, -1.5997314453125, -1.528564453125, -1.4573974609375, -1.38623046875, -1.3150634765625, -1.243896484375, -1.1727294921875, -1.1015625, -1.0303955078125, -0.959228515625, -0.8880615234375, -0.81689453125, -0.7457275390625, -0.674560546875, -0.6033935546875, -0.5322265625, -0.4610595703125, -0.389892578125, -0.3187255859375, -0.24755859375, -0.1763916015625, -0.105224609375, -0.0340576171875, 0.037109375, 0.1082763671875, 0.179443359375, 0.2506103515625, 0.32177734375, 0.3929443359375, 0.464111328125, 0.5352783203125, 0.6064453125, 0.6776123046875, 0.748779296875, 0.8199462890625, 0.89111328125, 0.9622802734375, 1.033447265625, 1.1046142578125, 1.17578125, 1.2469482421875, 1.318115234375, 1.3892822265625, 1.46044921875, 1.5316162109375, 1.602783203125, 1.6739501953125, 1.7451171875, 1.8162841796875, 1.887451171875, 1.9586181640625, 2.02978515625, 2.1009521484375, 2.172119140625, 2.2432861328125, 2.314453125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 7.0, 7.0, 8.0, 13.0, 15.0, 20.0, 21.0, 42.0, 52.0, 80.0, 119.0, 164.0, 230.0, 431.0, 652.0, 785.0, 507.0, 285.0, 179.0, 142.0, 95.0, 64.0, 35.0, 32.0, 19.0, 14.0, 16.0, 12.0, 11.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2493896484375, -0.2411365509033203, -0.23288345336914062, -0.22463035583496094, -0.21637725830078125, -0.20812416076660156, -0.19987106323242188, -0.1916179656982422, -0.1833648681640625, -0.1751117706298828, -0.16685867309570312, -0.15860557556152344, -0.15035247802734375, -0.14209938049316406, -0.13384628295898438, -0.1255931854248047, -0.117340087890625, -0.10908699035644531, -0.10083389282226562, -0.09258079528808594, -0.08432769775390625, -0.07607460021972656, -0.06782150268554688, -0.05956840515136719, -0.0513153076171875, -0.04306221008300781, -0.034809112548828125, -0.026556015014648438, -0.01830291748046875, -0.010049819946289062, -0.001796722412109375, 0.0064563751220703125, 0.01470947265625, 0.022962570190429688, 0.031215667724609375, 0.03946876525878906, 0.04772186279296875, 0.05597496032714844, 0.06422805786132812, 0.07248115539550781, 0.0807342529296875, 0.08898735046386719, 0.09724044799804688, 0.10549354553222656, 0.11374664306640625, 0.12199974060058594, 0.13025283813476562, 0.1385059356689453, 0.146759033203125, 0.1550121307373047, 0.16326522827148438, 0.17151832580566406, 0.17977142333984375, 0.18802452087402344, 0.19627761840820312, 0.2045307159423828, 0.2127838134765625, 0.2210369110107422, 0.22929000854492188, 0.23754310607910156, 0.24579620361328125, 0.25404930114746094, 0.2623023986816406, 0.2705554962158203, 0.27880859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 17.0, 8.0, 31.0, 51.0, 83.0, 134.0, 149.0, 179.0, 133.0, 89.0, 48.0, 31.0, 13.0, 8.0, 9.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6551011800765991, -1.5942275524139404, -1.5333538055419922, -1.4724801778793335, -1.4116064310073853, -1.3507328033447266, -1.2898590564727783, -1.2289854288101196, -1.168111801147461, -1.1072381734848022, -1.046364426612854, -0.9854907989501953, -0.9246170520782471, -0.8637434244155884, -0.8028697371482849, -0.7419960498809814, -0.6811223030090332, -0.6202486157417297, -0.5593749284744263, -0.4985012710094452, -0.4376275837421417, -0.37675389647483826, -0.3158802390098572, -0.2550065517425537, -0.19413286447525024, -0.13325917720794678, -0.0723855048418045, -0.011511832475662231, 0.049361854791641235, 0.1102355420589447, 0.17110919952392578, 0.23198288679122925, 0.29285669326782227, 0.35373038053512573, 0.4146040678024292, 0.4754777252674103, 0.5363514423370361, 0.5972250699996948, 0.6580987572669983, 0.7189724445343018, 0.7798461318016052, 0.8407198190689087, 0.9015935063362122, 0.9624671936035156, 1.0233408212661743, 1.0842145681381226, 1.1450881958007812, 1.2059619426727295, 1.2668355703353882, 1.3277091979980469, 1.3885829448699951, 1.4494565725326538, 1.510330319404602, 1.5712039470672607, 1.632077693939209, 1.6929513216018677, 1.7538249492645264, 1.814698576927185, 1.8755723237991333, 1.936445951461792, 1.9973196983337402, 2.0581934452056885, 2.1190669536590576, 2.179940700531006, 2.240814447402954]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 5.0, 11.0, 19.0, 16.0, 20.0, 30.0, 25.0, 32.0, 32.0, 48.0, 33.0, 54.0, 48.0, 45.0, 47.0, 60.0, 55.0, 46.0, 49.0, 46.0, 40.0, 39.0, 32.0, 34.0, 24.0, 17.0, 22.0, 22.0, 13.0, 10.0, 8.0, 4.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8964429497718811, -0.8708083629608154, -0.8451738357543945, -0.8195392489433289, -0.7939046621322632, -0.7682700753211975, -0.7426354885101318, -0.7170009613037109, -0.6913663744926453, -0.6657317876815796, -0.6400972604751587, -0.614462673664093, -0.5888280868530273, -0.5631935000419617, -0.537558913230896, -0.5119243860244751, -0.4862897992134094, -0.46065521240234375, -0.43502065539360046, -0.4093860983848572, -0.3837515115737915, -0.35811692476272583, -0.33248236775398254, -0.30684781074523926, -0.2812132239341736, -0.2555786371231079, -0.22994408011436462, -0.20430950820446014, -0.17867493629455566, -0.15304036438465118, -0.1274057924747467, -0.10177122056484222, -0.07613670825958252, -0.05050213634967804, -0.02486756443977356, 0.0007670074701309204, 0.0264015793800354, 0.05203615128993988, 0.07767072319984436, 0.10330529510974884, 0.12893986701965332, 0.1545744389295578, 0.18020901083946228, 0.20584358274936676, 0.23147815465927124, 0.2571127414703369, 0.2827472984790802, 0.3083818554878235, 0.33401644229888916, 0.35965102910995483, 0.3852855861186981, 0.4109201431274414, 0.4365547299385071, 0.46218931674957275, 0.48782387375831604, 0.5134584307670593, 0.539093017578125, 0.5647276043891907, 0.5903621912002563, 0.6159967184066772, 0.6416313052177429, 0.6672658920288086, 0.6929004192352295, 0.7185350060462952, 0.7441695928573608]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 9.0, 8.0, 12.0, 27.0, 51.0, 128.0, 262.0, 673.0, 1964.0, 6355.0, 27249.0, 411300.0, 557252.0, 32813.0, 6928.0, 2166.0, 781.0, 311.0, 125.0, 66.0, 21.0, 11.0, 11.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.416748046875, -0.4018898010253906, -0.38703155517578125, -0.3721733093261719, -0.3573150634765625, -0.3424568176269531, -0.32759857177734375, -0.3127403259277344, -0.297882080078125, -0.2830238342285156, -0.26816558837890625, -0.2533073425292969, -0.2384490966796875, -0.22359085083007812, -0.20873260498046875, -0.19387435913085938, -0.17901611328125, -0.16415786743164062, -0.14929962158203125, -0.13444137573242188, -0.1195831298828125, -0.10472488403320312, -0.08986663818359375, -0.07500839233398438, -0.060150146484375, -0.045291900634765625, -0.03043365478515625, -0.015575408935546875, -0.0007171630859375, 0.014141082763671875, 0.02899932861328125, 0.043857574462890625, 0.0587158203125, 0.07357406616210938, 0.08843231201171875, 0.10329055786132812, 0.1181488037109375, 0.13300704956054688, 0.14786529541015625, 0.16272354125976562, 0.177581787109375, 0.19244003295898438, 0.20729827880859375, 0.22215652465820312, 0.2370147705078125, 0.2518730163574219, 0.26673126220703125, 0.2815895080566406, 0.29644775390625, 0.3113059997558594, 0.32616424560546875, 0.3410224914550781, 0.3558807373046875, 0.3707389831542969, 0.38559722900390625, 0.4004554748535156, 0.415313720703125, 0.4301719665527344, 0.44503021240234375, 0.4598884582519531, 0.4747467041015625, 0.4896049499511719, 0.5044631958007812, 0.5193214416503906, 0.5341796875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 11.0, 15.0, 23.0, 21.0, 34.0, 36.0, 41.0, 51.0, 68.0, 63.0, 65.0, 63.0, 65.0, 72.0, 60.0, 53.0, 49.0, 43.0, 37.0, 28.0, 26.0, 19.0, 8.0, 12.0, 12.0, 11.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.67822265625, -0.6562957763671875, -0.634368896484375, -0.6124420166015625, -0.59051513671875, -0.5685882568359375, -0.546661376953125, -0.5247344970703125, -0.5028076171875, -0.4808807373046875, -0.458953857421875, -0.4370269775390625, -0.41510009765625, -0.3931732177734375, -0.371246337890625, -0.3493194580078125, -0.327392578125, -0.3054656982421875, -0.283538818359375, -0.2616119384765625, -0.23968505859375, -0.2177581787109375, -0.195831298828125, -0.1739044189453125, -0.1519775390625, -0.1300506591796875, -0.108123779296875, -0.0861968994140625, -0.06427001953125, -0.0423431396484375, -0.020416259765625, 0.0015106201171875, 0.0234375, 0.0453643798828125, 0.067291259765625, 0.0892181396484375, 0.11114501953125, 0.1330718994140625, 0.154998779296875, 0.1769256591796875, 0.1988525390625, 0.2207794189453125, 0.242706298828125, 0.2646331787109375, 0.28656005859375, 0.3084869384765625, 0.330413818359375, 0.3523406982421875, 0.374267578125, 0.3961944580078125, 0.418121337890625, 0.4400482177734375, 0.46197509765625, 0.4839019775390625, 0.505828857421875, 0.5277557373046875, 0.5496826171875, 0.5716094970703125, 0.593536376953125, 0.6154632568359375, 0.63739013671875, 0.6593170166015625, 0.681243896484375, 0.7031707763671875, 0.72509765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 1.0, 8.0, 10.0, 10.0, 12.0, 23.0, 28.0, 31.0, 46.0, 101.0, 184.0, 337.0, 662.0, 1776.0, 5959.0, 31064.0, 640695.0, 340536.0, 20052.0, 4389.0, 1370.0, 580.0, 291.0, 127.0, 70.0, 60.0, 29.0, 22.0, 20.0, 11.0, 13.0, 8.0, 6.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40087890625, -0.3886909484863281, -0.37650299072265625, -0.3643150329589844, -0.3521270751953125, -0.3399391174316406, -0.32775115966796875, -0.3155632019042969, -0.303375244140625, -0.2911872863769531, -0.27899932861328125, -0.2668113708496094, -0.2546234130859375, -0.24243545532226562, -0.23024749755859375, -0.21805953979492188, -0.20587158203125, -0.19368362426757812, -0.18149566650390625, -0.16930770874023438, -0.1571197509765625, -0.14493179321289062, -0.13274383544921875, -0.12055587768554688, -0.108367919921875, -0.09617996215820312, -0.08399200439453125, -0.07180404663085938, -0.0596160888671875, -0.047428131103515625, -0.03524017333984375, -0.023052215576171875, -0.0108642578125, 0.001323699951171875, 0.01351165771484375, 0.025699615478515625, 0.0378875732421875, 0.050075531005859375, 0.06226348876953125, 0.07445144653320312, 0.086639404296875, 0.09882736206054688, 0.11101531982421875, 0.12320327758789062, 0.1353912353515625, 0.14757919311523438, 0.15976715087890625, 0.17195510864257812, 0.18414306640625, 0.19633102416992188, 0.20851898193359375, 0.22070693969726562, 0.2328948974609375, 0.24508285522460938, 0.25727081298828125, 0.2694587707519531, 0.281646728515625, 0.2938346862792969, 0.30602264404296875, 0.3182106018066406, 0.3303985595703125, 0.3425865173339844, 0.35477447509765625, 0.3669624328613281, 0.379150390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 1.0, 6.0, 7.0, 16.0, 10.0, 17.0, 18.0, 25.0, 23.0, 30.0, 27.0, 28.0, 29.0, 43.0, 38.0, 42.0, 46.0, 44.0, 38.0, 49.0, 52.0, 41.0, 38.0, 35.0, 34.0, 39.0, 20.0, 30.0, 35.0, 27.0, 19.0, 14.0, 11.0, 7.0, 13.0, 12.0, 6.0, 6.0, 6.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9990234375, -0.969482421875, -0.93994140625, -0.910400390625, -0.880859375, -0.851318359375, -0.82177734375, -0.792236328125, -0.7626953125, -0.733154296875, -0.70361328125, -0.674072265625, -0.64453125, -0.614990234375, -0.58544921875, -0.555908203125, -0.5263671875, -0.496826171875, -0.46728515625, -0.437744140625, -0.408203125, -0.378662109375, -0.34912109375, -0.319580078125, -0.2900390625, -0.260498046875, -0.23095703125, -0.201416015625, -0.171875, -0.142333984375, -0.11279296875, -0.083251953125, -0.0537109375, -0.024169921875, 0.00537109375, 0.034912109375, 0.064453125, 0.093994140625, 0.12353515625, 0.153076171875, 0.1826171875, 0.212158203125, 0.24169921875, 0.271240234375, 0.30078125, 0.330322265625, 0.35986328125, 0.389404296875, 0.4189453125, 0.448486328125, 0.47802734375, 0.507568359375, 0.537109375, 0.566650390625, 0.59619140625, 0.625732421875, 0.6552734375, 0.684814453125, 0.71435546875, 0.743896484375, 0.7734375, 0.802978515625, 0.83251953125, 0.862060546875, 0.8916015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 11.0, 28.0, 42.0, 69.0, 127.0, 198.0, 443.0, 968.0, 2672.0, 8654.0, 40235.0, 575711.0, 377198.0, 31174.0, 7111.0, 2204.0, 850.0, 379.0, 187.0, 102.0, 61.0, 42.0, 20.0, 28.0, 8.0, 13.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.142822265625, -0.13820457458496094, -0.13358688354492188, -0.1289691925048828, -0.12435150146484375, -0.11973381042480469, -0.11511611938476562, -0.11049842834472656, -0.1058807373046875, -0.10126304626464844, -0.09664535522460938, -0.09202766418457031, -0.08740997314453125, -0.08279228210449219, -0.07817459106445312, -0.07355690002441406, -0.068939208984375, -0.06432151794433594, -0.059703826904296875, -0.05508613586425781, -0.05046844482421875, -0.04585075378417969, -0.041233062744140625, -0.03661537170410156, -0.0319976806640625, -0.027379989624023438, -0.022762298583984375, -0.018144607543945312, -0.01352691650390625, -0.008909225463867188, -0.004291534423828125, 0.0003261566162109375, 0.00494384765625, 0.009561538696289062, 0.014179229736328125, 0.018796920776367188, 0.02341461181640625, 0.028032302856445312, 0.032649993896484375, 0.03726768493652344, 0.0418853759765625, 0.04650306701660156, 0.051120758056640625, 0.05573844909667969, 0.06035614013671875, 0.06497383117675781, 0.06959152221679688, 0.07420921325683594, 0.078826904296875, 0.08344459533691406, 0.08806228637695312, 0.09267997741699219, 0.09729766845703125, 0.10191535949707031, 0.10653305053710938, 0.11115074157714844, 0.1157684326171875, 0.12038612365722656, 0.12500381469726562, 0.1296215057373047, 0.13423919677734375, 0.1388568878173828, 0.14347457885742188, 0.14809226989746094, 0.1527099609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 2.0, 0.0, 2.0, 7.0, 4.0, 3.0, 4.0, 4.0, 15.0, 19.0, 16.0, 22.0, 34.0, 59.0, 91.0, 114.0, 153.0, 123.0, 94.0, 73.0, 53.0, 33.0, 24.0, 12.0, 10.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.358457565307617e-05, -5.171261727809906e-05, -4.984065890312195e-05, -4.7968700528144836e-05, -4.6096742153167725e-05, -4.422478377819061e-05, -4.23528254032135e-05, -4.048086702823639e-05, -3.860890865325928e-05, -3.6736950278282166e-05, -3.4864991903305054e-05, -3.299303352832794e-05, -3.112107515335083e-05, -2.9249116778373718e-05, -2.7377158403396606e-05, -2.5505200028419495e-05, -2.3633241653442383e-05, -2.176128327846527e-05, -1.988932490348816e-05, -1.8017366528511047e-05, -1.6145408153533936e-05, -1.4273449778556824e-05, -1.2401491403579712e-05, -1.05295330286026e-05, -8.657574653625488e-06, -6.7856162786483765e-06, -4.913657903671265e-06, -3.041699528694153e-06, -1.169741153717041e-06, 7.022172212600708e-07, 2.5741755962371826e-06, 4.4461339712142944e-06, 6.318092346191406e-06, 8.190050721168518e-06, 1.006200909614563e-05, 1.1933967471122742e-05, 1.3805925846099854e-05, 1.5677884221076965e-05, 1.7549842596054077e-05, 1.942180097103119e-05, 2.12937593460083e-05, 2.3165717720985413e-05, 2.5037676095962524e-05, 2.6909634470939636e-05, 2.8781592845916748e-05, 3.065355122089386e-05, 3.252550959587097e-05, 3.4397467970848083e-05, 3.6269426345825195e-05, 3.814138472080231e-05, 4.001334309577942e-05, 4.188530147075653e-05, 4.375725984573364e-05, 4.5629218220710754e-05, 4.7501176595687866e-05, 4.937313497066498e-05, 5.124509334564209e-05, 5.31170517206192e-05, 5.4989010095596313e-05, 5.6860968470573425e-05, 5.873292684555054e-05, 6.060488522052765e-05, 6.247684359550476e-05, 6.434880197048187e-05, 6.622076034545898e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 6.0, 7.0, 4.0, 9.0, 14.0, 25.0, 23.0, 33.0, 71.0, 117.0, 242.0, 411.0, 889.0, 2038.0, 5288.0, 15315.0, 60124.0, 477761.0, 409142.0, 54244.0, 14311.0, 4795.0, 1860.0, 865.0, 422.0, 228.0, 99.0, 62.0, 34.0, 26.0, 20.0, 16.0, 8.0, 10.0, 11.0, 3.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.12237548828125, -0.11877250671386719, -0.11516952514648438, -0.11156654357910156, -0.10796356201171875, -0.10436058044433594, -0.10075759887695312, -0.09715461730957031, -0.0935516357421875, -0.08994865417480469, -0.08634567260742188, -0.08274269104003906, -0.07913970947265625, -0.07553672790527344, -0.07193374633789062, -0.06833076477050781, -0.064727783203125, -0.06112480163574219, -0.057521820068359375, -0.05391883850097656, -0.05031585693359375, -0.04671287536621094, -0.043109893798828125, -0.03950691223144531, -0.0359039306640625, -0.03230094909667969, -0.028697967529296875, -0.025094985961914062, -0.02149200439453125, -0.017889022827148438, -0.014286041259765625, -0.010683059692382812, -0.007080078125, -0.0034770965576171875, 0.000125885009765625, 0.0037288665771484375, 0.00733184814453125, 0.010934829711914062, 0.014537811279296875, 0.018140792846679688, 0.0217437744140625, 0.025346755981445312, 0.028949737548828125, 0.03255271911621094, 0.03615570068359375, 0.03975868225097656, 0.043361663818359375, 0.04696464538574219, 0.050567626953125, 0.05417060852050781, 0.057773590087890625, 0.06137657165527344, 0.06497955322265625, 0.06858253479003906, 0.07218551635742188, 0.07578849792480469, 0.0793914794921875, 0.08299446105957031, 0.08659744262695312, 0.09020042419433594, 0.09380340576171875, 0.09740638732910156, 0.10100936889648438, 0.10461235046386719, 0.10821533203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 4.0, 11.0, 14.0, 14.0, 16.0, 21.0, 27.0, 43.0, 51.0, 50.0, 90.0, 139.0, 123.0, 97.0, 71.0, 49.0, 29.0, 22.0, 25.0, 11.0, 13.0, 9.0, 7.0, 10.0, 9.0, 5.0, 9.0, 2.0, 4.0, 6.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0254669189453125, -0.02469325065612793, -0.02391958236694336, -0.02314591407775879, -0.02237224578857422, -0.02159857749938965, -0.020824909210205078, -0.020051240921020508, -0.019277572631835938, -0.018503904342651367, -0.017730236053466797, -0.016956567764282227, -0.016182899475097656, -0.015409231185913086, -0.014635562896728516, -0.013861894607543945, -0.013088226318359375, -0.012314558029174805, -0.011540889739990234, -0.010767221450805664, -0.009993553161621094, -0.009219884872436523, -0.008446216583251953, -0.007672548294067383, -0.0068988800048828125, -0.006125211715698242, -0.005351543426513672, -0.0045778751373291016, -0.0038042068481445312, -0.003030538558959961, -0.0022568702697753906, -0.0014832019805908203, -0.00070953369140625, 6.413459777832031e-05, 0.0008378028869628906, 0.001611471176147461, 0.0023851394653320312, 0.0031588077545166016, 0.003932476043701172, 0.004706144332885742, 0.0054798126220703125, 0.006253480911254883, 0.007027149200439453, 0.0078008174896240234, 0.008574485778808594, 0.009348154067993164, 0.010121822357177734, 0.010895490646362305, 0.011669158935546875, 0.012442827224731445, 0.013216495513916016, 0.013990163803100586, 0.014763832092285156, 0.015537500381469727, 0.016311168670654297, 0.017084836959838867, 0.017858505249023438, 0.018632173538208008, 0.019405841827392578, 0.02017951011657715, 0.02095317840576172, 0.02172684669494629, 0.02250051498413086, 0.02327418327331543, 0.0240478515625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 12.0, 24.0, 29.0, 59.0, 118.0, 183.0, 209.0, 163.0, 90.0, 48.0, 18.0, 16.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9354134202003479, -0.8895204067230225, -0.843627393245697, -0.7977343797683716, -0.7518413066864014, -0.7059483528137207, -0.6600552797317505, -0.614162266254425, -0.5682692527770996, -0.5223762392997742, -0.47648322582244873, -0.4305901825428009, -0.38469716906547546, -0.33880415558815, -0.2929111123085022, -0.24701809883117676, -0.20112508535385132, -0.15523207187652588, -0.10933904349803925, -0.06344601511955261, -0.017553001642227173, 0.028340011835098267, 0.0742330551147461, 0.12012606859207153, 0.16601908206939697, 0.2119120955467224, 0.25780510902404785, 0.3036981523036957, 0.3495911657810211, 0.39548417925834656, 0.4413772225379944, 0.4872702360153198, 0.53316330909729, 0.5790563225746155, 0.6249493360519409, 0.6708424091339111, 0.7167353630065918, 0.762628436088562, 0.8085214495658875, 0.8544144630432129, 0.9003074765205383, 0.9462004899978638, 0.9920935034751892, 1.0379865169525146, 1.0838795900344849, 1.1297725439071655, 1.1756656169891357, 1.2215585708618164, 1.2674516439437866, 1.3133447170257568, 1.3592376708984375, 1.4051307439804077, 1.4510236978530884, 1.4969167709350586, 1.5428097248077393, 1.5887027978897095, 1.6345958709716797, 1.68048894405365, 1.7263818979263306, 1.7722749710083008, 1.8181679248809814, 1.8640609979629517, 1.9099540710449219, 1.9558470249176025, 2.001739978790283]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 7.0, 9.0, 6.0, 19.0, 31.0, 22.0, 34.0, 55.0, 55.0, 66.0, 58.0, 72.0, 85.0, 75.0, 74.0, 51.0, 64.0, 48.0, 40.0, 31.0, 23.0, 26.0, 16.0, 14.0, 9.0, 2.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5885597467422485, -0.5658830404281616, -0.5432063341140747, -0.5205296277999878, -0.4978529214859009, -0.47517621517181396, -0.45249950885772705, -0.42982280254364014, -0.4071460962295532, -0.3844693899154663, -0.3617926836013794, -0.3391159772872925, -0.31643927097320557, -0.29376256465911865, -0.27108585834503174, -0.24840915203094482, -0.2257324457168579, -0.203055739402771, -0.18037903308868408, -0.15770232677459717, -0.13502562046051025, -0.11234891414642334, -0.08967220783233643, -0.06699550151824951, -0.0443187952041626, -0.021642088890075684, 0.0010346174240112305, 0.023711323738098145, 0.04638803005218506, 0.06906473636627197, 0.09174144268035889, 0.1144181489944458, 0.1370949149131775, 0.1597716212272644, 0.18244832754135132, 0.20512503385543823, 0.22780174016952515, 0.25047844648361206, 0.273155152797699, 0.2958318591117859, 0.3185085654258728, 0.3411852717399597, 0.36386197805404663, 0.38653868436813354, 0.40921539068222046, 0.4318920969963074, 0.4545688033103943, 0.4772455096244812, 0.4999222159385681, 0.522598922252655, 0.5452756285667419, 0.5679523348808289, 0.5906290411949158, 0.6133057475090027, 0.6359824538230896, 0.6586591601371765, 0.6813358664512634, 0.7040125727653503, 0.7266892790794373, 0.7493659853935242, 0.7720426917076111, 0.794719398021698, 0.8173961043357849, 0.8400728106498718, 0.8627495169639587]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 6.0, 2.0, 5.0, 7.0, 17.0, 22.0, 58.0, 222.0, 3990.0, 880481.0, 161945.0, 1538.0, 133.0, 31.0, 24.0, 16.0, 13.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.3828125, -4.27001953125, -4.1572265625, -4.04443359375, -3.931640625, -3.81884765625, -3.7060546875, -3.59326171875, -3.48046875, -3.36767578125, -3.2548828125, -3.14208984375, -3.029296875, -2.91650390625, -2.8037109375, -2.69091796875, -2.578125, -2.46533203125, -2.3525390625, -2.23974609375, -2.126953125, -2.01416015625, -1.9013671875, -1.78857421875, -1.67578125, -1.56298828125, -1.4501953125, -1.33740234375, -1.224609375, -1.11181640625, -0.9990234375, -0.88623046875, -0.7734375, -0.66064453125, -0.5478515625, -0.43505859375, -0.322265625, -0.20947265625, -0.0966796875, 0.01611328125, 0.12890625, 0.24169921875, 0.3544921875, 0.46728515625, 0.580078125, 0.69287109375, 0.8056640625, 0.91845703125, 1.03125, 1.14404296875, 1.2568359375, 1.36962890625, 1.482421875, 1.59521484375, 1.7080078125, 1.82080078125, 1.93359375, 2.04638671875, 2.1591796875, 2.27197265625, 2.384765625, 2.49755859375, 2.6103515625, 2.72314453125, 2.8359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 11.0, 14.0, 32.0, 45.0, 73.0, 118.0, 124.0, 154.0, 129.0, 109.0, 72.0, 48.0, 33.0, 16.0, 15.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2294921875, -1.1385650634765625, -1.047637939453125, -0.9567108154296875, -0.86578369140625, -0.7748565673828125, -0.683929443359375, -0.5930023193359375, -0.5020751953125, -0.4111480712890625, -0.320220947265625, -0.2292938232421875, -0.13836669921875, -0.0474395751953125, 0.043487548828125, 0.1344146728515625, 0.225341796875, 0.3162689208984375, 0.407196044921875, 0.4981231689453125, 0.58905029296875, 0.6799774169921875, 0.770904541015625, 0.8618316650390625, 0.9527587890625, 1.0436859130859375, 1.134613037109375, 1.2255401611328125, 1.31646728515625, 1.4073944091796875, 1.498321533203125, 1.5892486572265625, 1.68017578125, 1.7711029052734375, 1.862030029296875, 1.9529571533203125, 2.04388427734375, 2.1348114013671875, 2.225738525390625, 2.3166656494140625, 2.4075927734375, 2.4985198974609375, 2.589447021484375, 2.6803741455078125, 2.77130126953125, 2.8622283935546875, 2.953155517578125, 3.0440826416015625, 3.135009765625, 3.2259368896484375, 3.316864013671875, 3.4077911376953125, 3.49871826171875, 3.5896453857421875, 3.680572509765625, 3.7714996337890625, 3.8624267578125, 3.9533538818359375, 4.044281005859375, 4.1352081298828125, 4.22613525390625, 4.3170623779296875, 4.407989501953125, 4.4989166259765625, 4.58984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 10.0, 17.0, 16.0, 37.0, 40.0, 56.0, 88.0, 152.0, 248.0, 395.0, 758.0, 1722.0, 4809.0, 17141.0, 86461.0, 563080.0, 310559.0, 46302.0, 10601.0, 3283.0, 1286.0, 596.0, 335.0, 181.0, 121.0, 75.0, 36.0, 40.0, 33.0, 18.0, 19.0, 10.0, 11.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55615234375, -0.536163330078125, -0.51617431640625, -0.496185302734375, -0.4761962890625, -0.456207275390625, -0.43621826171875, -0.416229248046875, -0.396240234375, -0.376251220703125, -0.35626220703125, -0.336273193359375, -0.3162841796875, -0.296295166015625, -0.27630615234375, -0.256317138671875, -0.236328125, -0.216339111328125, -0.19635009765625, -0.176361083984375, -0.1563720703125, -0.136383056640625, -0.11639404296875, -0.096405029296875, -0.076416015625, -0.056427001953125, -0.03643798828125, -0.016448974609375, 0.0035400390625, 0.023529052734375, 0.04351806640625, 0.063507080078125, 0.08349609375, 0.103485107421875, 0.12347412109375, 0.143463134765625, 0.1634521484375, 0.183441162109375, 0.20343017578125, 0.223419189453125, 0.243408203125, 0.263397216796875, 0.28338623046875, 0.303375244140625, 0.3233642578125, 0.343353271484375, 0.36334228515625, 0.383331298828125, 0.4033203125, 0.423309326171875, 0.44329833984375, 0.463287353515625, 0.4832763671875, 0.503265380859375, 0.52325439453125, 0.543243408203125, 0.563232421875, 0.583221435546875, 0.60321044921875, 0.623199462890625, 0.6431884765625, 0.663177490234375, 0.68316650390625, 0.703155517578125, 0.72314453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 3.0, 5.0, 4.0, 11.0, 11.0, 7.0, 22.0, 16.0, 30.0, 19.0, 27.0, 29.0, 30.0, 35.0, 39.0, 44.0, 41.0, 46.0, 38.0, 38.0, 45.0, 45.0, 38.0, 36.0, 42.0, 48.0, 31.0, 31.0, 20.0, 29.0, 24.0, 26.0, 22.0, 12.0, 12.0, 7.0, 8.0, 3.0, 4.0, 5.0, 5.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0001678466796875, -0.964202880859375, -0.9282379150390625, -0.89227294921875, -0.8563079833984375, -0.820343017578125, -0.7843780517578125, -0.7484130859375, -0.7124481201171875, -0.676483154296875, -0.6405181884765625, -0.60455322265625, -0.5685882568359375, -0.532623291015625, -0.4966583251953125, -0.460693359375, -0.4247283935546875, -0.388763427734375, -0.3527984619140625, -0.31683349609375, -0.2808685302734375, -0.244903564453125, -0.2089385986328125, -0.1729736328125, -0.1370086669921875, -0.101043701171875, -0.0650787353515625, -0.02911376953125, 0.0068511962890625, 0.042816162109375, 0.0787811279296875, 0.11474609375, 0.1507110595703125, 0.186676025390625, 0.2226409912109375, 0.25860595703125, 0.2945709228515625, 0.330535888671875, 0.3665008544921875, 0.4024658203125, 0.4384307861328125, 0.474395751953125, 0.5103607177734375, 0.54632568359375, 0.5822906494140625, 0.618255615234375, 0.6542205810546875, 0.690185546875, 0.7261505126953125, 0.762115478515625, 0.7980804443359375, 0.83404541015625, 0.8700103759765625, 0.905975341796875, 0.9419403076171875, 0.9779052734375, 1.0138702392578125, 1.049835205078125, 1.0858001708984375, 1.12176513671875, 1.1577301025390625, 1.193695068359375, 1.2296600341796875, 1.265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 9.0, 12.0, 13.0, 21.0, 28.0, 39.0, 63.0, 73.0, 126.0, 233.0, 373.0, 742.0, 1468.0, 3622.0, 10289.0, 35938.0, 151478.0, 539637.0, 229608.0, 52121.0, 13986.0, 4720.0, 1853.0, 871.0, 464.0, 269.0, 150.0, 113.0, 64.0, 46.0, 30.0, 24.0, 18.0, 11.0, 11.0, 7.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1795654296875, -0.1742267608642578, -0.16888809204101562, -0.16354942321777344, -0.15821075439453125, -0.15287208557128906, -0.14753341674804688, -0.1421947479248047, -0.1368560791015625, -0.1315174102783203, -0.12617874145507812, -0.12084007263183594, -0.11550140380859375, -0.11016273498535156, -0.10482406616210938, -0.09948539733886719, -0.094146728515625, -0.08880805969238281, -0.08346939086914062, -0.07813072204589844, -0.07279205322265625, -0.06745338439941406, -0.062114715576171875, -0.05677604675292969, -0.0514373779296875, -0.04609870910644531, -0.040760040283203125, -0.03542137145996094, -0.03008270263671875, -0.024744033813476562, -0.019405364990234375, -0.014066696166992188, -0.00872802734375, -0.0033893585205078125, 0.001949310302734375, 0.0072879791259765625, 0.01262664794921875, 0.017965316772460938, 0.023303985595703125, 0.028642654418945312, 0.0339813232421875, 0.03931999206542969, 0.044658660888671875, 0.04999732971191406, 0.05533599853515625, 0.06067466735839844, 0.06601333618164062, 0.07135200500488281, 0.076690673828125, 0.08202934265136719, 0.08736801147460938, 0.09270668029785156, 0.09804534912109375, 0.10338401794433594, 0.10872268676757812, 0.11406135559082031, 0.1194000244140625, 0.12473869323730469, 0.13007736206054688, 0.13541603088378906, 0.14075469970703125, 0.14609336853027344, 0.15143203735351562, 0.1567707061767578, 0.162109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 2.0, 7.0, 6.0, 3.0, 9.0, 17.0, 14.0, 20.0, 28.0, 39.0, 44.0, 53.0, 77.0, 98.0, 98.0, 102.0, 92.0, 64.0, 68.0, 33.0, 25.0, 23.0, 14.0, 14.0, 12.0, 12.0, 6.0, 3.0, 2.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0279159545898438e-05, -2.9224902391433716e-05, -2.8170645236968994e-05, -2.7116388082504272e-05, -2.606213092803955e-05, -2.500787377357483e-05, -2.3953616619110107e-05, -2.2899359464645386e-05, -2.1845102310180664e-05, -2.0790845155715942e-05, -1.973658800125122e-05, -1.86823308467865e-05, -1.7628073692321777e-05, -1.6573816537857056e-05, -1.5519559383392334e-05, -1.4465302228927612e-05, -1.341104507446289e-05, -1.2356787919998169e-05, -1.1302530765533447e-05, -1.0248273611068726e-05, -9.194016456604004e-06, -8.139759302139282e-06, -7.0855021476745605e-06, -6.031244993209839e-06, -4.976987838745117e-06, -3.9227306842803955e-06, -2.868473529815674e-06, -1.8142163753509521e-06, -7.599592208862305e-07, 2.942979335784912e-07, 1.3485550880432129e-06, 2.4028122425079346e-06, 3.4570693969726562e-06, 4.511326551437378e-06, 5.5655837059021e-06, 6.619840860366821e-06, 7.674098014831543e-06, 8.728355169296265e-06, 9.782612323760986e-06, 1.0836869478225708e-05, 1.189112663269043e-05, 1.2945383787155151e-05, 1.3999640941619873e-05, 1.5053898096084595e-05, 1.6108155250549316e-05, 1.7162412405014038e-05, 1.821666955947876e-05, 1.927092671394348e-05, 2.0325183868408203e-05, 2.1379441022872925e-05, 2.2433698177337646e-05, 2.3487955331802368e-05, 2.454221248626709e-05, 2.559646964073181e-05, 2.6650726795196533e-05, 2.7704983949661255e-05, 2.8759241104125977e-05, 2.9813498258590698e-05, 3.086775541305542e-05, 3.192201256752014e-05, 3.297626972198486e-05, 3.4030526876449585e-05, 3.508478403091431e-05, 3.613904118537903e-05, 3.719329833984375e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 19.0, 16.0, 25.0, 53.0, 89.0, 146.0, 306.0, 623.0, 1410.0, 3930.0, 11993.0, 51415.0, 302579.0, 547699.0, 98082.0, 20465.0, 5880.0, 1999.0, 918.0, 399.0, 220.0, 120.0, 58.0, 32.0, 18.0, 16.0, 11.0, 4.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1329345703125, -0.12635231018066406, -0.11977005004882812, -0.11318778991699219, -0.10660552978515625, -0.10002326965332031, -0.09344100952148438, -0.08685874938964844, -0.0802764892578125, -0.07369422912597656, -0.06711196899414062, -0.06052970886230469, -0.05394744873046875, -0.04736518859863281, -0.040782928466796875, -0.03420066833496094, -0.027618408203125, -0.021036148071289062, -0.014453887939453125, -0.007871627807617188, -0.00128936767578125, 0.0052928924560546875, 0.011875152587890625, 0.018457412719726562, 0.0250396728515625, 0.03162193298339844, 0.038204193115234375, 0.04478645324707031, 0.05136871337890625, 0.05795097351074219, 0.06453323364257812, 0.07111549377441406, 0.07769775390625, 0.08428001403808594, 0.09086227416992188, 0.09744453430175781, 0.10402679443359375, 0.11060905456542969, 0.11719131469726562, 0.12377357482910156, 0.1303558349609375, 0.13693809509277344, 0.14352035522460938, 0.1501026153564453, 0.15668487548828125, 0.1632671356201172, 0.16984939575195312, 0.17643165588378906, 0.183013916015625, 0.18959617614746094, 0.19617843627929688, 0.2027606964111328, 0.20934295654296875, 0.2159252166748047, 0.22250747680664062, 0.22908973693847656, 0.2356719970703125, 0.24225425720214844, 0.24883651733398438, 0.2554187774658203, 0.26200103759765625, 0.2685832977294922, 0.2751655578613281, 0.28174781799316406, 0.288330078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 12.0, 11.0, 19.0, 15.0, 35.0, 49.0, 75.0, 103.0, 92.0, 104.0, 120.0, 85.0, 70.0, 65.0, 42.0, 34.0, 22.0, 12.0, 13.0, 9.0, 4.0, 4.0, 5.0, 7.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.171142578125, -0.1673288345336914, -0.1635150909423828, -0.15970134735107422, -0.15588760375976562, -0.15207386016845703, -0.14826011657714844, -0.14444637298583984, -0.14063262939453125, -0.13681888580322266, -0.13300514221191406, -0.12919139862060547, -0.12537765502929688, -0.12156391143798828, -0.11775016784667969, -0.1139364242553711, -0.1101226806640625, -0.1063089370727539, -0.10249519348144531, -0.09868144989013672, -0.09486770629882812, -0.09105396270751953, -0.08724021911621094, -0.08342647552490234, -0.07961273193359375, -0.07579898834228516, -0.07198524475097656, -0.06817150115966797, -0.06435775756835938, -0.06054401397705078, -0.05673027038574219, -0.052916526794433594, -0.049102783203125, -0.045289039611816406, -0.04147529602050781, -0.03766155242919922, -0.033847808837890625, -0.03003406524658203, -0.026220321655273438, -0.022406578063964844, -0.01859283447265625, -0.014779090881347656, -0.010965347290039062, -0.007151603698730469, -0.003337860107421875, 0.00047588348388671875, 0.0042896270751953125, 0.008103370666503906, 0.0119171142578125, 0.015730857849121094, 0.019544601440429688, 0.02335834503173828, 0.027172088623046875, 0.03098583221435547, 0.03479957580566406, 0.038613319396972656, 0.04242706298828125, 0.046240806579589844, 0.05005455017089844, 0.05386829376220703, 0.057682037353515625, 0.06149578094482422, 0.06530952453613281, 0.0691232681274414, 0.07293701171875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 16.0, 32.0, 161.0, 422.0, 278.0, 69.0, 17.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.370660781860352, -10.166275024414062, -9.96189022064209, -9.7575044631958, -9.553119659423828, -9.348733901977539, -9.14434814453125, -8.939963340759277, -8.735577583312988, -8.5311918258667, -8.326807022094727, -8.122421264648438, -7.918035984039307, -7.713650703430176, -7.509264945983887, -7.304879665374756, -7.100494384765625, -6.896109104156494, -6.691723823547363, -6.487338066101074, -6.282952785491943, -6.0785675048828125, -5.874181747436523, -5.669796466827393, -5.465411186218262, -5.261025905609131, -5.056640625, -4.852254867553711, -4.64786958694458, -4.443484306335449, -4.23909854888916, -4.034713268280029, -3.8303277492523193, -3.6259422302246094, -3.4215569496154785, -3.2171716690063477, -3.0127861499786377, -2.8084006309509277, -2.604015350341797, -2.399630069732666, -2.195244550704956, -1.9908591508865356, -1.7864737510681152, -1.5820883512496948, -1.3777029514312744, -1.173317551612854, -0.9689321517944336, -0.7645467519760132, -0.5601613521575928, -0.35577595233917236, -0.15139055252075195, 0.05299484729766846, 0.25738024711608887, 0.4617656469345093, 0.6661510467529297, 0.8705364465713501, 1.0749218463897705, 1.279307246208191, 1.4836926460266113, 1.6880780458450317, 1.8924634456634521, 2.096848964691162, 2.301234245300293, 2.505619525909424, 2.710005044937134]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 12.0, 10.0, 18.0, 25.0, 27.0, 33.0, 42.0, 48.0, 56.0, 66.0, 69.0, 66.0, 81.0, 70.0, 68.0, 53.0, 43.0, 45.0, 38.0, 38.0, 31.0, 13.0, 19.0, 8.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1095077991485596, -2.005922794342041, -1.9023380279541016, -1.798753023147583, -1.6951682567596436, -1.591583251953125, -1.487998366355896, -1.384413480758667, -1.280828595161438, -1.177243709564209, -1.07365882396698, -0.9700738787651062, -0.8664889931678772, -0.7629041075706482, -0.6593191623687744, -0.5557342767715454, -0.4521493911743164, -0.3485645055770874, -0.244979590177536, -0.14139467477798462, -0.037809789180755615, 0.06577509641647339, 0.16936004161834717, 0.27294492721557617, 0.3765298128128052, 0.4801146984100342, 0.5836995840072632, 0.687284529209137, 0.790869414806366, 0.894454300403595, 0.9980392456054688, 1.1016241312026978, 1.2052087783813477, 1.3087936639785767, 1.4123785495758057, 1.5159635543823242, 1.6195483207702637, 1.7231333255767822, 1.8267182111740112, 1.9303030967712402, 2.0338878631591797, 2.1374728679656982, 2.2410576343536377, 2.3446426391601562, 2.4482274055480957, 2.5518124103546143, 2.655397415161133, 2.7589821815490723, 2.862567186355591, 2.9661521911621094, 3.069736957550049, 3.1733219623565674, 3.276906728744507, 3.3804917335510254, 3.484076499938965, 3.5876615047454834, 3.691246509552002, 3.7948315143585205, 3.89841628074646, 4.0020012855529785, 4.105586051940918, 4.209170818328857, 4.312756061553955, 4.4163408279418945, 4.519925594329834]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 14.0, 13.0, 18.0, 14.0, 29.0, 46.0, 59.0, 105.0, 122.0, 192.0, 296.0, 465.0, 687.0, 1091.0, 1835.0, 3123.0, 6047.0, 12901.0, 32278.0, 101987.0, 484432.0, 2428309.0, 889300.0, 154763.0, 43005.0, 16478.0, 7379.0, 3730.0, 2000.0, 1289.0, 749.0, 480.0, 339.0, 196.0, 150.0, 102.0, 70.0, 61.0, 31.0, 30.0, 26.0, 9.0, 6.0, 10.0, 5.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.6435546875, -0.6238479614257812, -0.6041412353515625, -0.5844345092773438, -0.564727783203125, -0.5450210571289062, -0.5253143310546875, -0.5056076049804688, -0.48590087890625, -0.46619415283203125, -0.4464874267578125, -0.42678070068359375, -0.407073974609375, -0.38736724853515625, -0.3676605224609375, -0.34795379638671875, -0.3282470703125, -0.30854034423828125, -0.2888336181640625, -0.26912689208984375, -0.249420166015625, -0.22971343994140625, -0.2100067138671875, -0.19029998779296875, -0.17059326171875, -0.15088653564453125, -0.1311798095703125, -0.11147308349609375, -0.091766357421875, -0.07205963134765625, -0.0523529052734375, -0.03264617919921875, -0.012939453125, 0.00676727294921875, 0.0264739990234375, 0.04618072509765625, 0.065887451171875, 0.08559417724609375, 0.1053009033203125, 0.12500762939453125, 0.14471435546875, 0.16442108154296875, 0.1841278076171875, 0.20383453369140625, 0.223541259765625, 0.24324798583984375, 0.2629547119140625, 0.28266143798828125, 0.3023681640625, 0.32207489013671875, 0.3417816162109375, 0.36148834228515625, 0.381195068359375, 0.40090179443359375, 0.4206085205078125, 0.44031524658203125, 0.46002197265625, 0.47972869873046875, 0.4994354248046875, 0.5191421508789062, 0.538848876953125, 0.5585556030273438, 0.5782623291015625, 0.5979690551757812, 0.61767578125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 8.0, 5.0, 9.0, 9.0, 10.0, 20.0, 25.0, 20.0, 27.0, 30.0, 28.0, 43.0, 44.0, 41.0, 50.0, 53.0, 53.0, 67.0, 55.0, 54.0, 48.0, 43.0, 36.0, 34.0, 26.0, 29.0, 14.0, 20.0, 18.0, 17.0, 11.0, 8.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0], "bins": [-0.70947265625, -0.6903076171875, -0.671142578125, -0.6519775390625, -0.6328125, -0.6136474609375, -0.594482421875, -0.5753173828125, -0.55615234375, -0.5369873046875, -0.517822265625, -0.4986572265625, -0.4794921875, -0.4603271484375, -0.441162109375, -0.4219970703125, -0.40283203125, -0.3836669921875, -0.364501953125, -0.3453369140625, -0.326171875, -0.3070068359375, -0.287841796875, -0.2686767578125, -0.24951171875, -0.2303466796875, -0.211181640625, -0.1920166015625, -0.1728515625, -0.1536865234375, -0.134521484375, -0.1153564453125, -0.09619140625, -0.0770263671875, -0.057861328125, -0.0386962890625, -0.01953125, -0.0003662109375, 0.018798828125, 0.0379638671875, 0.05712890625, 0.0762939453125, 0.095458984375, 0.1146240234375, 0.1337890625, 0.1529541015625, 0.172119140625, 0.1912841796875, 0.21044921875, 0.2296142578125, 0.248779296875, 0.2679443359375, 0.287109375, 0.3062744140625, 0.325439453125, 0.3446044921875, 0.36376953125, 0.3829345703125, 0.402099609375, 0.4212646484375, 0.4404296875, 0.4595947265625, 0.478759765625, 0.4979248046875, 0.51708984375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 6.0, 4.0, 8.0, 10.0, 17.0, 25.0, 21.0, 64.0, 81.0, 147.0, 258.0, 492.0, 1277.0, 4009.0, 17436.0, 148394.0, 3596031.0, 387590.0, 29508.0, 5838.0, 1737.0, 640.0, 273.0, 162.0, 102.0, 46.0, 35.0, 28.0, 17.0, 12.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.0197601318359375, -0.982879638671875, -0.9459991455078125, -0.90911865234375, -0.8722381591796875, -0.835357666015625, -0.7984771728515625, -0.7615966796875, -0.7247161865234375, -0.687835693359375, -0.6509552001953125, -0.61407470703125, -0.5771942138671875, -0.540313720703125, -0.5034332275390625, -0.466552734375, -0.4296722412109375, -0.392791748046875, -0.3559112548828125, -0.31903076171875, -0.2821502685546875, -0.245269775390625, -0.2083892822265625, -0.1715087890625, -0.1346282958984375, -0.097747802734375, -0.0608673095703125, -0.02398681640625, 0.0128936767578125, 0.049774169921875, 0.0866546630859375, 0.12353515625, 0.1604156494140625, 0.197296142578125, 0.2341766357421875, 0.27105712890625, 0.3079376220703125, 0.344818115234375, 0.3816986083984375, 0.4185791015625, 0.4554595947265625, 0.492340087890625, 0.5292205810546875, 0.56610107421875, 0.6029815673828125, 0.639862060546875, 0.6767425537109375, 0.713623046875, 0.7505035400390625, 0.787384033203125, 0.8242645263671875, 0.86114501953125, 0.8980255126953125, 0.934906005859375, 0.9717864990234375, 1.0086669921875, 1.0455474853515625, 1.082427978515625, 1.1193084716796875, 1.15618896484375, 1.1930694580078125, 1.229949951171875, 1.2668304443359375, 1.3037109375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 4.0, 9.0, 23.0, 13.0, 19.0, 43.0, 54.0, 63.0, 89.0, 148.0, 247.0, 408.0, 639.0, 794.0, 553.0, 300.0, 216.0, 125.0, 80.0, 68.0, 46.0, 28.0, 27.0, 17.0, 13.0, 14.0, 6.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.260986328125, -0.25316429138183594, -0.24534225463867188, -0.2375202178955078, -0.22969818115234375, -0.2218761444091797, -0.21405410766601562, -0.20623207092285156, -0.1984100341796875, -0.19058799743652344, -0.18276596069335938, -0.1749439239501953, -0.16712188720703125, -0.1592998504638672, -0.15147781372070312, -0.14365577697753906, -0.135833740234375, -0.12801170349121094, -0.12018966674804688, -0.11236763000488281, -0.10454559326171875, -0.09672355651855469, -0.08890151977539062, -0.08107948303222656, -0.0732574462890625, -0.06543540954589844, -0.057613372802734375, -0.04979133605957031, -0.04196929931640625, -0.03414726257324219, -0.026325225830078125, -0.018503189086914062, -0.01068115234375, -0.0028591156005859375, 0.004962921142578125, 0.012784957885742188, 0.02060699462890625, 0.028429031372070312, 0.036251068115234375, 0.04407310485839844, 0.0518951416015625, 0.05971717834472656, 0.06753921508789062, 0.07536125183105469, 0.08318328857421875, 0.09100532531738281, 0.09882736206054688, 0.10664939880371094, 0.114471435546875, 0.12229347229003906, 0.13011550903320312, 0.1379375457763672, 0.14575958251953125, 0.1535816192626953, 0.16140365600585938, 0.16922569274902344, 0.1770477294921875, 0.18486976623535156, 0.19269180297851562, 0.2005138397216797, 0.20833587646484375, 0.2161579132080078, 0.22397994995117188, 0.23180198669433594, 0.2396240234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 6.0, 8.0, 14.0, 10.0, 20.0, 26.0, 36.0, 77.0, 104.0, 125.0, 123.0, 133.0, 100.0, 80.0, 44.0, 28.0, 15.0, 20.0, 9.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8860098719596863, -0.843083918094635, -0.8001580238342285, -0.7572320699691772, -0.714306116104126, -0.6713801622390747, -0.6284542083740234, -0.5855283141136169, -0.5426023602485657, -0.4996764063835144, -0.4567504823207855, -0.41382455825805664, -0.37089860439300537, -0.3279726505279541, -0.2850467264652252, -0.24212080240249634, -0.19919484853744507, -0.156268909573555, -0.11334297060966492, -0.07041703164577484, -0.027491092681884766, 0.01543484628200531, 0.058360785245895386, 0.10128670930862427, 0.14421266317367554, 0.1871386021375656, 0.2300645411014557, 0.27299046516418457, 0.31591641902923584, 0.3588423728942871, 0.401768296957016, 0.4446942210197449, 0.4876202344894409, 0.5305461883544922, 0.5734721422195435, 0.61639803647995, 0.6593239903450012, 0.7022499442100525, 0.745175838470459, 0.7881017923355103, 0.8310277462005615, 0.8739537000656128, 0.9168796539306641, 0.9598055481910706, 1.0027315616607666, 1.0456573963165283, 1.0885833501815796, 1.1315093040466309, 1.1744352579116821, 1.2173612117767334, 1.2602871656417847, 1.303213119506836, 1.3461389541625977, 1.389064908027649, 1.4319908618927002, 1.4749168157577515, 1.5178427696228027, 1.560768723487854, 1.6036946773529053, 1.6466206312179565, 1.6895465850830078, 1.7324724197387695, 1.7753983736038208, 1.818324327468872, 1.8612502813339233]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 15.0, 9.0, 12.0, 22.0, 24.0, 18.0, 18.0, 26.0, 20.0, 40.0, 39.0, 47.0, 54.0, 52.0, 49.0, 49.0, 48.0, 65.0, 53.0, 44.0, 50.0, 39.0, 29.0, 28.0, 27.0, 23.0, 16.0, 19.0, 15.0, 9.0, 15.0, 7.0, 5.0, 1.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9039857387542725, -0.8814032673835754, -0.8588207960128784, -0.8362383842468262, -0.8136559128761292, -0.7910734415054321, -0.7684909701347351, -0.7459084987640381, -0.7233260869979858, -0.7007436156272888, -0.6781611442565918, -0.6555787324905396, -0.6329962611198425, -0.6104137897491455, -0.5878313183784485, -0.5652488470077515, -0.5426663756370544, -0.5200839042663574, -0.4975014626979828, -0.47491899132728577, -0.45233654975891113, -0.4297540783882141, -0.4071716070175171, -0.38458913564682007, -0.36200669407844543, -0.3394242227077484, -0.3168417811393738, -0.29425930976867676, -0.27167683839797974, -0.2490943968296051, -0.22651192545890808, -0.20392946898937225, -0.1813470721244812, -0.15876461565494537, -0.13618215918540955, -0.11359968781471252, -0.0910172313451767, -0.06843477487564087, -0.04585230350494385, -0.02326984703540802, -0.0006873905658721924, 0.021895069628953934, 0.04447752982378006, 0.06705999374389648, 0.08964245021343231, 0.11222490668296814, 0.13480737805366516, 0.157389834523201, 0.17997229099273682, 0.20255474746227264, 0.22513720393180847, 0.2477196753025055, 0.2703021168708801, 0.29288458824157715, 0.31546705961227417, 0.3380495309829712, 0.3606319725513458, 0.38321444392204285, 0.4057968854904175, 0.4283793568611145, 0.4509618282318115, 0.47354426980018616, 0.4961267411708832, 0.5187091827392578, 0.5412916541099548]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 9.0, 9.0, 17.0, 21.0, 22.0, 31.0, 70.0, 85.0, 166.0, 251.0, 419.0, 740.0, 1343.0, 2510.0, 5117.0, 11311.0, 27852.0, 81408.0, 264230.0, 407541.0, 160155.0, 50514.0, 18773.0, 7989.0, 3684.0, 1843.0, 948.0, 582.0, 349.0, 201.0, 124.0, 77.0, 55.0, 36.0, 29.0, 12.0, 16.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10748291015625, -0.10425376892089844, -0.10102462768554688, -0.09779548645019531, -0.09456634521484375, -0.09133720397949219, -0.08810806274414062, -0.08487892150878906, -0.0816497802734375, -0.07842063903808594, -0.07519149780273438, -0.07196235656738281, -0.06873321533203125, -0.06550407409667969, -0.062274932861328125, -0.05904579162597656, -0.055816650390625, -0.05258750915527344, -0.049358367919921875, -0.04612922668457031, -0.04290008544921875, -0.03967094421386719, -0.036441802978515625, -0.03321266174316406, -0.0299835205078125, -0.026754379272460938, -0.023525238037109375, -0.020296096801757812, -0.01706695556640625, -0.013837814331054688, -0.010608673095703125, -0.0073795318603515625, -0.004150390625, -0.0009212493896484375, 0.002307891845703125, 0.0055370330810546875, 0.00876617431640625, 0.011995315551757812, 0.015224456787109375, 0.018453598022460938, 0.0216827392578125, 0.024911880493164062, 0.028141021728515625, 0.03137016296386719, 0.03459930419921875, 0.03782844543457031, 0.041057586669921875, 0.04428672790527344, 0.047515869140625, 0.05074501037597656, 0.053974151611328125, 0.05720329284667969, 0.06043243408203125, 0.06366157531738281, 0.06689071655273438, 0.07011985778808594, 0.0733489990234375, 0.07657814025878906, 0.07980728149414062, 0.08303642272949219, 0.08626556396484375, 0.08949470520019531, 0.09272384643554688, 0.09595298767089844, 0.09918212890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 3.0, 11.0, 8.0, 8.0, 14.0, 26.0, 24.0, 28.0, 22.0, 34.0, 40.0, 49.0, 43.0, 59.0, 59.0, 57.0, 61.0, 67.0, 54.0, 50.0, 61.0, 38.0, 35.0, 27.0, 16.0, 18.0, 17.0, 17.0, 7.0, 14.0, 8.0, 3.0, 8.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54833984375, -0.5322074890136719, -0.5160751342773438, -0.4999427795410156, -0.4838104248046875, -0.4676780700683594, -0.45154571533203125, -0.4354133605957031, -0.419281005859375, -0.4031486511230469, -0.38701629638671875, -0.3708839416503906, -0.3547515869140625, -0.3386192321777344, -0.32248687744140625, -0.3063545227050781, -0.29022216796875, -0.2740898132324219, -0.25795745849609375, -0.24182510375976562, -0.2256927490234375, -0.20956039428710938, -0.19342803955078125, -0.17729568481445312, -0.161163330078125, -0.14503097534179688, -0.12889862060546875, -0.11276626586914062, -0.0966339111328125, -0.08050155639648438, -0.06436920166015625, -0.048236846923828125, -0.0321044921875, -0.015972137451171875, 0.00016021728515625, 0.016292572021484375, 0.0324249267578125, 0.048557281494140625, 0.06468963623046875, 0.08082199096679688, 0.096954345703125, 0.11308670043945312, 0.12921905517578125, 0.14535140991210938, 0.1614837646484375, 0.17761611938476562, 0.19374847412109375, 0.20988082885742188, 0.22601318359375, 0.24214553833007812, 0.25827789306640625, 0.2744102478027344, 0.2905426025390625, 0.3066749572753906, 0.32280731201171875, 0.3389396667480469, 0.355072021484375, 0.3712043762207031, 0.38733673095703125, 0.4034690856933594, 0.4196014404296875, 0.4357337951660156, 0.45186614990234375, 0.4679985046386719, 0.484130859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 10.0, 17.0, 17.0, 19.0, 33.0, 75.0, 98.0, 162.0, 289.0, 643.0, 1536.0, 5321.0, 35770.0, 468095.0, 489949.0, 37930.0, 5710.0, 1526.0, 570.0, 306.0, 168.0, 96.0, 63.0, 36.0, 21.0, 21.0, 18.0, 8.0, 11.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.163818359375, -0.15752029418945312, -0.15122222900390625, -0.14492416381835938, -0.1386260986328125, -0.13232803344726562, -0.12602996826171875, -0.11973190307617188, -0.113433837890625, -0.10713577270507812, -0.10083770751953125, -0.09453964233398438, -0.0882415771484375, -0.08194351196289062, -0.07564544677734375, -0.06934738159179688, -0.06304931640625, -0.056751251220703125, -0.05045318603515625, -0.044155120849609375, -0.0378570556640625, -0.031558990478515625, -0.02526092529296875, -0.018962860107421875, -0.012664794921875, -0.006366729736328125, -6.866455078125e-05, 0.006229400634765625, 0.0125274658203125, 0.018825531005859375, 0.02512359619140625, 0.031421661376953125, 0.0377197265625, 0.044017791748046875, 0.05031585693359375, 0.056613922119140625, 0.0629119873046875, 0.06921005249023438, 0.07550811767578125, 0.08180618286132812, 0.088104248046875, 0.09440231323242188, 0.10070037841796875, 0.10699844360351562, 0.1132965087890625, 0.11959457397460938, 0.12589263916015625, 0.13219070434570312, 0.13848876953125, 0.14478683471679688, 0.15108489990234375, 0.15738296508789062, 0.1636810302734375, 0.16997909545898438, 0.17627716064453125, 0.18257522583007812, 0.188873291015625, 0.19517135620117188, 0.20146942138671875, 0.20776748657226562, 0.2140655517578125, 0.22036361694335938, 0.22666168212890625, 0.23295974731445312, 0.2392578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 3.0, 6.0, 6.0, 14.0, 17.0, 12.0, 18.0, 32.0, 31.0, 40.0, 36.0, 38.0, 43.0, 37.0, 46.0, 44.0, 47.0, 43.0, 57.0, 35.0, 52.0, 37.0, 45.0, 36.0, 27.0, 28.0, 23.0, 33.0, 19.0, 7.0, 18.0, 13.0, 11.0, 8.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.9208984375, -0.8939971923828125, -0.867095947265625, -0.8401947021484375, -0.81329345703125, -0.7863922119140625, -0.759490966796875, -0.7325897216796875, -0.7056884765625, -0.6787872314453125, -0.651885986328125, -0.6249847412109375, -0.59808349609375, -0.5711822509765625, -0.544281005859375, -0.5173797607421875, -0.490478515625, -0.4635772705078125, -0.436676025390625, -0.4097747802734375, -0.38287353515625, -0.3559722900390625, -0.329071044921875, -0.3021697998046875, -0.2752685546875, -0.2483673095703125, -0.221466064453125, -0.1945648193359375, -0.16766357421875, -0.1407623291015625, -0.113861083984375, -0.0869598388671875, -0.06005859375, -0.0331573486328125, -0.006256103515625, 0.0206451416015625, 0.04754638671875, 0.0744476318359375, 0.101348876953125, 0.1282501220703125, 0.1551513671875, 0.1820526123046875, 0.208953857421875, 0.2358551025390625, 0.26275634765625, 0.2896575927734375, 0.316558837890625, 0.3434600830078125, 0.370361328125, 0.3972625732421875, 0.424163818359375, 0.4510650634765625, 0.47796630859375, 0.5048675537109375, 0.531768798828125, 0.5586700439453125, 0.5855712890625, 0.6124725341796875, 0.639373779296875, 0.6662750244140625, 0.69317626953125, 0.7200775146484375, 0.746978759765625, 0.7738800048828125, 0.80078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 6.0, 6.0, 7.0, 8.0, 16.0, 17.0, 28.0, 43.0, 62.0, 107.0, 162.0, 355.0, 902.0, 2403.0, 8876.0, 68929.0, 810579.0, 137165.0, 13348.0, 3291.0, 1184.0, 466.0, 235.0, 128.0, 92.0, 43.0, 24.0, 22.0, 10.0, 9.0, 3.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10394287109375, -0.10085105895996094, -0.09775924682617188, -0.09466743469238281, -0.09157562255859375, -0.08848381042480469, -0.08539199829101562, -0.08230018615722656, -0.0792083740234375, -0.07611656188964844, -0.07302474975585938, -0.06993293762207031, -0.06684112548828125, -0.06374931335449219, -0.060657501220703125, -0.05756568908691406, -0.054473876953125, -0.05138206481933594, -0.048290252685546875, -0.04519844055175781, -0.04210662841796875, -0.03901481628417969, -0.035923004150390625, -0.03283119201660156, -0.0297393798828125, -0.026647567749023438, -0.023555755615234375, -0.020463943481445312, -0.01737213134765625, -0.014280319213867188, -0.011188507080078125, -0.008096694946289062, -0.0050048828125, -0.0019130706787109375, 0.001178741455078125, 0.0042705535888671875, 0.00736236572265625, 0.010454177856445312, 0.013545989990234375, 0.016637802124023438, 0.0197296142578125, 0.022821426391601562, 0.025913238525390625, 0.029005050659179688, 0.03209686279296875, 0.03518867492675781, 0.038280487060546875, 0.04137229919433594, 0.044464111328125, 0.04755592346191406, 0.050647735595703125, 0.05373954772949219, 0.05683135986328125, 0.05992317199707031, 0.06301498413085938, 0.06610679626464844, 0.0691986083984375, 0.07229042053222656, 0.07538223266601562, 0.07847404479980469, 0.08156585693359375, 0.08465766906738281, 0.08774948120117188, 0.09084129333496094, 0.09393310546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 11.0, 11.0, 17.0, 20.0, 31.0, 36.0, 73.0, 82.0, 126.0, 131.0, 119.0, 85.0, 67.0, 64.0, 25.0, 27.0, 17.0, 17.0, 15.0, 7.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3451786041259766e-05, -4.238169640302658e-05, -4.1311606764793396e-05, -4.024151712656021e-05, -3.9171427488327026e-05, -3.810133785009384e-05, -3.703124821186066e-05, -3.596115857362747e-05, -3.489106893539429e-05, -3.38209792971611e-05, -3.275088965892792e-05, -3.168080002069473e-05, -3.061071038246155e-05, -2.9540620744228363e-05, -2.8470531105995178e-05, -2.7400441467761993e-05, -2.633035182952881e-05, -2.5260262191295624e-05, -2.419017255306244e-05, -2.3120082914829254e-05, -2.204999327659607e-05, -2.0979903638362885e-05, -1.99098140001297e-05, -1.8839724361896515e-05, -1.776963472366333e-05, -1.6699545085430145e-05, -1.562945544719696e-05, -1.4559365808963776e-05, -1.348927617073059e-05, -1.2419186532497406e-05, -1.1349096894264221e-05, -1.0279007256031036e-05, -9.208917617797852e-06, -8.138827979564667e-06, -7.068738341331482e-06, -5.998648703098297e-06, -4.928559064865112e-06, -3.8584694266319275e-06, -2.7883797883987427e-06, -1.7182901501655579e-06, -6.48200511932373e-07, 4.2188912630081177e-07, 1.4919787645339966e-06, 2.5620684027671814e-06, 3.632158041000366e-06, 4.702247679233551e-06, 5.772337317466736e-06, 6.842426955699921e-06, 7.912516593933105e-06, 8.98260623216629e-06, 1.0052695870399475e-05, 1.112278550863266e-05, 1.2192875146865845e-05, 1.326296478509903e-05, 1.4333054423332214e-05, 1.54031440615654e-05, 1.6473233699798584e-05, 1.754332333803177e-05, 1.8613412976264954e-05, 1.968350261449814e-05, 2.0753592252731323e-05, 2.1823681890964508e-05, 2.2893771529197693e-05, 2.3963861167430878e-05, 2.5033950805664062e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 7.0, 7.0, 7.0, 9.0, 18.0, 19.0, 31.0, 62.0, 66.0, 108.0, 184.0, 352.0, 654.0, 1445.0, 3332.0, 8925.0, 30741.0, 140740.0, 565824.0, 230767.0, 45052.0, 12373.0, 4175.0, 1701.0, 843.0, 456.0, 234.0, 137.0, 93.0, 59.0, 33.0, 22.0, 14.0, 14.0, 11.0, 7.0, 5.0, 5.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.06866455078125, -0.06668233871459961, -0.06470012664794922, -0.06271791458129883, -0.06073570251464844, -0.05875349044799805, -0.056771278381347656, -0.054789066314697266, -0.052806854248046875, -0.050824642181396484, -0.048842430114746094, -0.0468602180480957, -0.04487800598144531, -0.04289579391479492, -0.04091358184814453, -0.03893136978149414, -0.03694915771484375, -0.03496694564819336, -0.03298473358154297, -0.031002521514892578, -0.029020309448242188, -0.027038097381591797, -0.025055885314941406, -0.023073673248291016, -0.021091461181640625, -0.019109249114990234, -0.017127037048339844, -0.015144824981689453, -0.013162612915039062, -0.011180400848388672, -0.009198188781738281, -0.007215976715087891, -0.0052337646484375, -0.0032515525817871094, -0.0012693405151367188, 0.0007128715515136719, 0.0026950836181640625, 0.004677295684814453, 0.006659507751464844, 0.008641719818115234, 0.010623931884765625, 0.012606143951416016, 0.014588356018066406, 0.016570568084716797, 0.018552780151367188, 0.020534992218017578, 0.02251720428466797, 0.02449941635131836, 0.02648162841796875, 0.02846384048461914, 0.03044605255126953, 0.03242826461791992, 0.03441047668457031, 0.0363926887512207, 0.038374900817871094, 0.040357112884521484, 0.042339324951171875, 0.044321537017822266, 0.046303749084472656, 0.04828596115112305, 0.05026817321777344, 0.05225038528442383, 0.05423259735107422, 0.05621480941772461, 0.058197021484375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 10.0, 8.0, 9.0, 17.0, 14.0, 36.0, 17.0, 39.0, 47.0, 71.0, 81.0, 99.0, 106.0, 94.0, 78.0, 66.0, 49.0, 35.0, 25.0, 17.0, 12.0, 11.0, 6.0, 14.0, 4.0, 4.0, 3.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01366424560546875, -0.01316845417022705, -0.012672662734985352, -0.012176871299743652, -0.011681079864501953, -0.011185288429260254, -0.010689496994018555, -0.010193705558776855, -0.009697914123535156, -0.009202122688293457, -0.008706331253051758, -0.008210539817810059, -0.007714748382568359, -0.00721895694732666, -0.006723165512084961, -0.006227374076843262, -0.0057315826416015625, -0.005235791206359863, -0.004739999771118164, -0.004244208335876465, -0.0037484169006347656, -0.0032526254653930664, -0.002756834030151367, -0.002261042594909668, -0.0017652511596679688, -0.0012694597244262695, -0.0007736682891845703, -0.0002778768539428711, 0.00021791458129882812, 0.0007137060165405273, 0.0012094974517822266, 0.0017052888870239258, 0.002201080322265625, 0.0026968717575073242, 0.0031926631927490234, 0.0036884546279907227, 0.004184246063232422, 0.004680037498474121, 0.00517582893371582, 0.0056716203689575195, 0.006167411804199219, 0.006663203239440918, 0.007158994674682617, 0.007654786109924316, 0.008150577545166016, 0.008646368980407715, 0.009142160415649414, 0.009637951850891113, 0.010133743286132812, 0.010629534721374512, 0.011125326156616211, 0.01162111759185791, 0.01211690902709961, 0.012612700462341309, 0.013108491897583008, 0.013604283332824707, 0.014100074768066406, 0.014595866203308105, 0.015091657638549805, 0.015587449073791504, 0.016083240509033203, 0.016579031944274902, 0.0170748233795166, 0.0175706148147583, 0.01806640625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 12.0, 14.0, 17.0, 28.0, 57.0, 130.0, 178.0, 207.0, 157.0, 81.0, 52.0, 26.0, 9.0, 11.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7911644577980042, -0.7521772384643555, -0.713189959526062, -0.6742027401924133, -0.6352155208587646, -0.5962282419204712, -0.5572410225868225, -0.5182538032531738, -0.47926652431488037, -0.4402792751789093, -0.40129202604293823, -0.36230480670928955, -0.3233175575733185, -0.2843303084373474, -0.24534307420253754, -0.20635583996772766, -0.1673685908317566, -0.12838134169578552, -0.08939410746097565, -0.050406865775585175, -0.011419624090194702, 0.027567625045776367, 0.06655485928058624, 0.10554209351539612, 0.1445293426513672, 0.18351659178733826, 0.22250382602214813, 0.261491060256958, 0.3004783093929291, 0.33946555852890015, 0.37845277786254883, 0.4174400269985199, 0.45642733573913574, 0.4954145848751068, 0.5344018340110779, 0.5733890533447266, 0.61237633228302, 0.6513635516166687, 0.6903507709503174, 0.7293380498886108, 0.7683252692222595, 0.8073124885559082, 0.8462997674942017, 0.8852869868278503, 0.924274206161499, 0.9632614850997925, 1.002248764038086, 1.0412359237670898, 1.0802232027053833, 1.1192104816436768, 1.1581976413726807, 1.1971849203109741, 1.2361721992492676, 1.2751593589782715, 1.314146637916565, 1.3531339168548584, 1.3921210765838623, 1.4311083555221558, 1.4700955152511597, 1.5090827941894531, 1.5480700731277466, 1.58705735206604, 1.626044511795044, 1.6650317907333374, 1.7040190696716309]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 4.0, 6.0, 8.0, 13.0, 20.0, 16.0, 21.0, 19.0, 36.0, 26.0, 24.0, 41.0, 58.0, 54.0, 60.0, 61.0, 51.0, 68.0, 57.0, 64.0, 44.0, 38.0, 36.0, 29.0, 30.0, 23.0, 17.0, 18.0, 10.0, 11.0, 11.0, 6.0, 9.0, 1.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5933377742767334, -0.5779872536659241, -0.56263667345047, -0.5472861528396606, -0.5319355726242065, -0.5165850520133972, -0.5012345314025879, -0.4858839511871338, -0.47053343057632446, -0.45518288016319275, -0.43983232975006104, -0.4244818091392517, -0.40913125872612, -0.3937807083129883, -0.37843015789985657, -0.36307960748672485, -0.3477290868759155, -0.3323785364627838, -0.3170279860496521, -0.3016774654388428, -0.28632691502571106, -0.27097636461257935, -0.25562581419944763, -0.2402752786874771, -0.2249247133731842, -0.2095741629600525, -0.19422362744808197, -0.17887307703495026, -0.16352254152297974, -0.14817199110984802, -0.1328214406967163, -0.11747090518474579, -0.10212036967277527, -0.08676982671022415, -0.07141928374767303, -0.05606873705983162, -0.0407181940972805, -0.025367647409439087, -0.01001710444688797, 0.005333438515663147, 0.020683981478214264, 0.03603452444076538, 0.0513850674033165, 0.06673561036586761, 0.08208616077899933, 0.09743670374155045, 0.11278724670410156, 0.12813779711723328, 0.1434883326292038, 0.1588388830423355, 0.17418941855430603, 0.18953996896743774, 0.20489050447940826, 0.22024105489253998, 0.2355915904045105, 0.2509421408176422, 0.2662926912307739, 0.28164324164390564, 0.29699379205703735, 0.3123443126678467, 0.3276948630809784, 0.3430454134941101, 0.3583959639072418, 0.37374651432037354, 0.38909703493118286]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 23.0, 12.0, 16.0, 20.0, 35.0, 42.0, 80.0, 118.0, 168.0, 258.0, 393.0, 613.0, 1003.0, 1658.0, 2810.0, 4896.0, 9337.0, 17930.0, 38255.0, 88841.0, 220180.0, 339254.0, 182477.0, 73402.0, 32054.0, 15627.0, 8066.0, 4411.0, 2534.0, 1423.0, 966.0, 569.0, 381.0, 258.0, 135.0, 90.0, 64.0, 49.0, 29.0, 18.0, 11.0, 10.0, 11.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.31298828125, -0.3036155700683594, -0.29424285888671875, -0.2848701477050781, -0.2754974365234375, -0.2661247253417969, -0.25675201416015625, -0.24737930297851562, -0.238006591796875, -0.22863388061523438, -0.21926116943359375, -0.20988845825195312, -0.2005157470703125, -0.19114303588867188, -0.18177032470703125, -0.17239761352539062, -0.16302490234375, -0.15365219116210938, -0.14427947998046875, -0.13490676879882812, -0.1255340576171875, -0.11616134643554688, -0.10678863525390625, -0.09741592407226562, -0.088043212890625, -0.07867050170898438, -0.06929779052734375, -0.059925079345703125, -0.0505523681640625, -0.041179656982421875, -0.03180694580078125, -0.022434234619140625, -0.0130615234375, -0.003688812255859375, 0.00568389892578125, 0.015056610107421875, 0.0244293212890625, 0.033802032470703125, 0.04317474365234375, 0.052547454833984375, 0.061920166015625, 0.07129287719726562, 0.08066558837890625, 0.09003829956054688, 0.0994110107421875, 0.10878372192382812, 0.11815643310546875, 0.12752914428710938, 0.13690185546875, 0.14627456665039062, 0.15564727783203125, 0.16501998901367188, 0.1743927001953125, 0.18376541137695312, 0.19313812255859375, 0.20251083374023438, 0.211883544921875, 0.22125625610351562, 0.23062896728515625, 0.24000167846679688, 0.2493743896484375, 0.2587471008300781, 0.26811981201171875, 0.2774925231933594, 0.286865234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 6.0, 9.0, 5.0, 11.0, 15.0, 17.0, 22.0, 28.0, 21.0, 39.0, 35.0, 35.0, 46.0, 50.0, 59.0, 65.0, 59.0, 63.0, 49.0, 56.0, 57.0, 41.0, 28.0, 33.0, 26.0, 21.0, 19.0, 14.0, 12.0, 14.0, 12.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2294921875, -1.1947250366210938, -1.1599578857421875, -1.1251907348632812, -1.090423583984375, -1.0556564331054688, -1.0208892822265625, -0.9861221313476562, -0.95135498046875, -0.9165878295898438, -0.8818206787109375, -0.8470535278320312, -0.812286376953125, -0.7775192260742188, -0.7427520751953125, -0.7079849243164062, -0.6732177734375, -0.6384506225585938, -0.6036834716796875, -0.5689163208007812, -0.534149169921875, -0.49938201904296875, -0.4646148681640625, -0.42984771728515625, -0.39508056640625, -0.36031341552734375, -0.3255462646484375, -0.29077911376953125, -0.256011962890625, -0.22124481201171875, -0.1864776611328125, -0.15171051025390625, -0.116943359375, -0.08217620849609375, -0.0474090576171875, -0.01264190673828125, 0.022125244140625, 0.05689239501953125, 0.0916595458984375, 0.12642669677734375, 0.16119384765625, 0.19596099853515625, 0.2307281494140625, 0.26549530029296875, 0.300262451171875, 0.33502960205078125, 0.3697967529296875, 0.40456390380859375, 0.4393310546875, 0.47409820556640625, 0.5088653564453125, 0.5436325073242188, 0.578399658203125, 0.6131668090820312, 0.6479339599609375, 0.6827011108398438, 0.71746826171875, 0.7522354125976562, 0.7870025634765625, 0.8217697143554688, 0.856536865234375, 0.8913040161132812, 0.9260711669921875, 0.9608383178710938, 0.99560546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 4.0, 6.0, 11.0, 8.0, 9.0, 15.0, 26.0, 44.0, 35.0, 57.0, 65.0, 94.0, 142.0, 199.0, 321.0, 580.0, 1099.0, 2438.0, 6784.0, 24411.0, 118822.0, 527343.0, 292211.0, 53518.0, 12613.0, 4037.0, 1567.0, 758.0, 409.0, 262.0, 176.0, 121.0, 96.0, 73.0, 42.0, 41.0, 23.0, 30.0, 19.0, 16.0, 8.0, 3.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.420166015625, -0.4069366455078125, -0.393707275390625, -0.3804779052734375, -0.36724853515625, -0.3540191650390625, -0.340789794921875, -0.3275604248046875, -0.3143310546875, -0.3011016845703125, -0.287872314453125, -0.2746429443359375, -0.26141357421875, -0.2481842041015625, -0.234954833984375, -0.2217254638671875, -0.20849609375, -0.1952667236328125, -0.182037353515625, -0.1688079833984375, -0.15557861328125, -0.1423492431640625, -0.129119873046875, -0.1158905029296875, -0.1026611328125, -0.0894317626953125, -0.076202392578125, -0.0629730224609375, -0.04974365234375, -0.0365142822265625, -0.023284912109375, -0.0100555419921875, 0.003173828125, 0.0164031982421875, 0.029632568359375, 0.0428619384765625, 0.05609130859375, 0.0693206787109375, 0.082550048828125, 0.0957794189453125, 0.1090087890625, 0.1222381591796875, 0.135467529296875, 0.1486968994140625, 0.16192626953125, 0.1751556396484375, 0.188385009765625, 0.2016143798828125, 0.21484375, 0.2280731201171875, 0.241302490234375, 0.2545318603515625, 0.26776123046875, 0.2809906005859375, 0.294219970703125, 0.3074493408203125, 0.3206787109375, 0.3339080810546875, 0.347137451171875, 0.3603668212890625, 0.37359619140625, 0.3868255615234375, 0.400054931640625, 0.4132843017578125, 0.426513671875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 9.0, 7.0, 13.0, 15.0, 19.0, 13.0, 19.0, 22.0, 20.0, 14.0, 29.0, 32.0, 41.0, 35.0, 46.0, 48.0, 39.0, 40.0, 52.0, 39.0, 31.0, 43.0, 39.0, 44.0, 35.0, 36.0, 35.0, 24.0, 22.0, 20.0, 21.0, 16.0, 17.0, 12.0, 12.0, 11.0, 5.0, 6.0, 6.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1435546875, -1.1095428466796875, -1.075531005859375, -1.0415191650390625, -1.00750732421875, -0.9734954833984375, -0.939483642578125, -0.9054718017578125, -0.8714599609375, -0.8374481201171875, -0.803436279296875, -0.7694244384765625, -0.73541259765625, -0.7014007568359375, -0.667388916015625, -0.6333770751953125, -0.599365234375, -0.5653533935546875, -0.531341552734375, -0.4973297119140625, -0.46331787109375, -0.4293060302734375, -0.395294189453125, -0.3612823486328125, -0.3272705078125, -0.2932586669921875, -0.259246826171875, -0.2252349853515625, -0.19122314453125, -0.1572113037109375, -0.123199462890625, -0.0891876220703125, -0.05517578125, -0.0211639404296875, 0.012847900390625, 0.0468597412109375, 0.08087158203125, 0.1148834228515625, 0.148895263671875, 0.1829071044921875, 0.2169189453125, 0.2509307861328125, 0.284942626953125, 0.3189544677734375, 0.35296630859375, 0.3869781494140625, 0.420989990234375, 0.4550018310546875, 0.489013671875, 0.5230255126953125, 0.557037353515625, 0.5910491943359375, 0.62506103515625, 0.6590728759765625, 0.693084716796875, 0.7270965576171875, 0.7611083984375, 0.7951202392578125, 0.829132080078125, 0.8631439208984375, 0.89715576171875, 0.9311676025390625, 0.965179443359375, 0.9991912841796875, 1.033203125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 4.0, 6.0, 3.0, 4.0, 3.0, 5.0, 13.0, 15.0, 19.0, 26.0, 28.0, 60.0, 61.0, 105.0, 189.0, 283.0, 473.0, 884.0, 1771.0, 3954.0, 10861.0, 37722.0, 180372.0, 561803.0, 190749.0, 39861.0, 11062.0, 4141.0, 1852.0, 914.0, 506.0, 273.0, 180.0, 102.0, 79.0, 51.0, 38.0, 30.0, 13.0, 21.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1732177734375, -0.16834068298339844, -0.16346359252929688, -0.1585865020751953, -0.15370941162109375, -0.1488323211669922, -0.14395523071289062, -0.13907814025878906, -0.1342010498046875, -0.12932395935058594, -0.12444686889648438, -0.11956977844238281, -0.11469268798828125, -0.10981559753417969, -0.10493850708007812, -0.10006141662597656, -0.095184326171875, -0.09030723571777344, -0.08543014526367188, -0.08055305480957031, -0.07567596435546875, -0.07079887390136719, -0.06592178344726562, -0.06104469299316406, -0.0561676025390625, -0.05129051208496094, -0.046413421630859375, -0.04153633117675781, -0.03665924072265625, -0.03178215026855469, -0.026905059814453125, -0.022027969360351562, -0.01715087890625, -0.012273788452148438, -0.007396697998046875, -0.0025196075439453125, 0.00235748291015625, 0.0072345733642578125, 0.012111663818359375, 0.016988754272460938, 0.0218658447265625, 0.026742935180664062, 0.031620025634765625, 0.03649711608886719, 0.04137420654296875, 0.04625129699707031, 0.051128387451171875, 0.05600547790527344, 0.060882568359375, 0.06575965881347656, 0.07063674926757812, 0.07551383972167969, 0.08039093017578125, 0.08526802062988281, 0.09014511108398438, 0.09502220153808594, 0.0998992919921875, 0.10477638244628906, 0.10965347290039062, 0.11453056335449219, 0.11940765380859375, 0.12428474426269531, 0.12916183471679688, 0.13403892517089844, 0.138916015625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 10.0, 8.0, 13.0, 11.0, 20.0, 26.0, 29.0, 39.0, 50.0, 51.0, 48.0, 52.0, 61.0, 90.0, 58.0, 66.0, 66.0, 49.0, 52.0, 42.0, 30.0, 22.0, 19.0, 21.0, 9.0, 9.0, 7.0, 4.0, 10.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.895427703857422e-05, -1.8215738236904144e-05, -1.747719943523407e-05, -1.6738660633563995e-05, -1.600012183189392e-05, -1.5261583030223846e-05, -1.4523044228553772e-05, -1.3784505426883698e-05, -1.3045966625213623e-05, -1.2307427823543549e-05, -1.1568889021873474e-05, -1.08303502202034e-05, -1.0091811418533325e-05, -9.35327261686325e-06, -8.614733815193176e-06, -7.876195013523102e-06, -7.137656211853027e-06, -6.399117410182953e-06, -5.660578608512878e-06, -4.922039806842804e-06, -4.1835010051727295e-06, -3.444962203502655e-06, -2.7064234018325806e-06, -1.967884600162506e-06, -1.2293457984924316e-06, -4.908069968223572e-07, 2.477318048477173e-07, 9.862706065177917e-07, 1.7248094081878662e-06, 2.4633482098579407e-06, 3.201887011528015e-06, 3.94042581319809e-06, 4.678964614868164e-06, 5.4175034165382385e-06, 6.156042218208313e-06, 6.8945810198783875e-06, 7.633119821548462e-06, 8.371658623218536e-06, 9.11019742488861e-06, 9.848736226558685e-06, 1.058727502822876e-05, 1.1325813829898834e-05, 1.2064352631568909e-05, 1.2802891433238983e-05, 1.3541430234909058e-05, 1.4279969036579132e-05, 1.5018507838249207e-05, 1.575704663991928e-05, 1.6495585441589355e-05, 1.723412424325943e-05, 1.7972663044929504e-05, 1.871120184659958e-05, 1.9449740648269653e-05, 2.0188279449939728e-05, 2.0926818251609802e-05, 2.1665357053279877e-05, 2.240389585494995e-05, 2.3142434656620026e-05, 2.38809734582901e-05, 2.4619512259960175e-05, 2.535805106163025e-05, 2.6096589863300323e-05, 2.6835128664970398e-05, 2.7573667466640472e-05, 2.8312206268310547e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 2.0, 7.0, 4.0, 11.0, 15.0, 11.0, 14.0, 23.0, 35.0, 56.0, 75.0, 129.0, 167.0, 302.0, 501.0, 998.0, 2068.0, 4870.0, 13568.0, 48396.0, 208303.0, 523880.0, 181268.0, 42910.0, 12393.0, 4427.0, 1958.0, 891.0, 505.0, 270.0, 168.0, 110.0, 74.0, 50.0, 29.0, 17.0, 9.0, 15.0, 5.0, 2.0, 5.0, 2.0, 5.0, 1.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1341552734375, -0.12960052490234375, -0.1250457763671875, -0.12049102783203125, -0.115936279296875, -0.11138153076171875, -0.1068267822265625, -0.10227203369140625, -0.09771728515625, -0.09316253662109375, -0.0886077880859375, -0.08405303955078125, -0.079498291015625, -0.07494354248046875, -0.0703887939453125, -0.06583404541015625, -0.061279296875, -0.05672454833984375, -0.0521697998046875, -0.04761505126953125, -0.043060302734375, -0.03850555419921875, -0.0339508056640625, -0.02939605712890625, -0.02484130859375, -0.02028656005859375, -0.0157318115234375, -0.01117706298828125, -0.006622314453125, -0.00206756591796875, 0.0024871826171875, 0.00704193115234375, 0.0115966796875, 0.01615142822265625, 0.0207061767578125, 0.02526092529296875, 0.029815673828125, 0.03437042236328125, 0.0389251708984375, 0.04347991943359375, 0.04803466796875, 0.05258941650390625, 0.0571441650390625, 0.06169891357421875, 0.066253662109375, 0.07080841064453125, 0.0753631591796875, 0.07991790771484375, 0.08447265625, 0.08902740478515625, 0.0935821533203125, 0.09813690185546875, 0.102691650390625, 0.10724639892578125, 0.1118011474609375, 0.11635589599609375, 0.12091064453125, 0.12546539306640625, 0.1300201416015625, 0.13457489013671875, 0.139129638671875, 0.14368438720703125, 0.1482391357421875, 0.15279388427734375, 0.1573486328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 6.0, 6.0, 6.0, 11.0, 12.0, 16.0, 21.0, 25.0, 33.0, 42.0, 48.0, 49.0, 57.0, 47.0, 72.0, 75.0, 65.0, 58.0, 64.0, 59.0, 47.0, 31.0, 26.0, 32.0, 15.0, 16.0, 14.0, 6.0, 8.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.072021484375, -0.06992053985595703, -0.06781959533691406, -0.0657186508178711, -0.06361770629882812, -0.061516761779785156, -0.05941581726074219, -0.05731487274169922, -0.05521392822265625, -0.05311298370361328, -0.05101203918457031, -0.048911094665527344, -0.046810150146484375, -0.044709205627441406, -0.04260826110839844, -0.04050731658935547, -0.0384063720703125, -0.03630542755126953, -0.03420448303222656, -0.032103538513183594, -0.030002593994140625, -0.027901649475097656, -0.025800704956054688, -0.02369976043701172, -0.02159881591796875, -0.01949787139892578, -0.017396926879882812, -0.015295982360839844, -0.013195037841796875, -0.011094093322753906, -0.008993148803710938, -0.006892204284667969, -0.004791259765625, -0.0026903152465820312, -0.0005893707275390625, 0.0015115737915039062, 0.003612518310546875, 0.005713462829589844, 0.007814407348632812, 0.009915351867675781, 0.01201629638671875, 0.014117240905761719, 0.016218185424804688, 0.018319129943847656, 0.020420074462890625, 0.022521018981933594, 0.024621963500976562, 0.02672290802001953, 0.0288238525390625, 0.03092479705810547, 0.03302574157714844, 0.035126686096191406, 0.037227630615234375, 0.039328575134277344, 0.04142951965332031, 0.04353046417236328, 0.04563140869140625, 0.04773235321044922, 0.04983329772949219, 0.051934242248535156, 0.054035186767578125, 0.056136131286621094, 0.05823707580566406, 0.06033802032470703, 0.06243896484375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 9.0, 26.0, 84.0, 344.0, 421.0, 86.0, 21.0, 10.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4405770301818848, -1.237849473953247, -1.0351219177246094, -0.8323944807052612, -0.6296669244766235, -0.42693936824798584, -0.2242119312286377, -0.021484375, 0.1812431812286377, 0.383970707654953, 0.5866982340812683, 0.7894257307052612, 0.9921532869338989, 1.1948808431625366, 1.3976082801818848, 1.6003358364105225, 1.8030633926391602, 2.005790948867798, 2.2085185050964355, 2.411245822906494, 2.613973617553711, 2.8167009353637695, 3.0194284915924072, 3.222156047821045, 3.4248836040496826, 3.6276111602783203, 3.830338716506958, 4.033066272735596, 4.235793590545654, 4.438521385192871, 4.64124870300293, 4.843976020812988, 5.046703338623047, 5.2494306564331055, 5.452158451080322, 5.654885768890381, 5.857613563537598, 6.060340881347656, 6.263068199157715, 6.465795993804932, 6.668523788452148, 6.871251106262207, 7.073978900909424, 7.276706218719482, 7.479434013366699, 7.682161331176758, 7.884888648986816, 8.087615966796875, 8.29034423828125, 8.493071556091309, 8.695798873901367, 8.898527145385742, 9.1012544631958, 9.30398178100586, 9.506709098815918, 9.709436416625977, 9.912163734436035, 10.114891052246094, 10.317618370056152, 10.520346641540527, 10.723073959350586, 10.925801277160645, 11.128528594970703, 11.331256866455078, 11.533984184265137]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 9.0, 3.0, 9.0, 7.0, 7.0, 13.0, 10.0, 12.0, 19.0, 14.0, 16.0, 23.0, 24.0, 33.0, 23.0, 25.0, 23.0, 34.0, 32.0, 50.0, 40.0, 40.0, 41.0, 28.0, 43.0, 29.0, 44.0, 28.0, 27.0, 28.0, 38.0, 32.0, 28.0, 21.0, 18.0, 18.0, 21.0, 15.0, 15.0, 7.0, 11.0, 9.0, 9.0, 3.0, 2.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-1.9083850383758545, -1.853682041168213, -1.7989789247512817, -1.7442758083343506, -1.689572811126709, -1.6348698139190674, -1.5801666975021362, -1.525463581085205, -1.4707605838775635, -1.4160575866699219, -1.3613544702529907, -1.3066513538360596, -1.251948356628418, -1.1972453594207764, -1.1425422430038452, -1.087839126586914, -1.0331361293792725, -0.9784330725669861, -0.9237300157546997, -0.8690269589424133, -0.814323902130127, -0.7596208453178406, -0.7049177885055542, -0.6502147316932678, -0.5955116748809814, -0.5408086180686951, -0.4861055612564087, -0.4314025044441223, -0.37669944763183594, -0.32199639081954956, -0.2672933340072632, -0.2125902771949768, -0.15788722038269043, -0.10318416357040405, -0.048481106758117676, 0.006221950054168701, 0.06092500686645508, 0.11562806367874146, 0.17033112049102783, 0.2250341773033142, 0.2797372341156006, 0.33444029092788696, 0.38914334774017334, 0.4438464045524597, 0.4985494613647461, 0.5532525181770325, 0.6079555749893188, 0.6626586318016052, 0.7173616886138916, 0.772064745426178, 0.8267678022384644, 0.8814708590507507, 0.9361739158630371, 0.9908769726753235, 1.0455800294876099, 1.100283145904541, 1.1549861431121826, 1.2096891403198242, 1.2643922567367554, 1.3190953731536865, 1.3737983703613281, 1.4285013675689697, 1.4832044839859009, 1.537907600402832, 1.5926105976104736]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 5.0, 8.0, 11.0, 9.0, 25.0, 33.0, 40.0, 62.0, 99.0, 152.0, 267.0, 441.0, 781.0, 1503.0, 3010.0, 6768.0, 18099.0, 68254.0, 488569.0, 3001380.0, 505377.0, 68496.0, 17936.0, 6596.0, 2958.0, 1489.0, 724.0, 443.0, 273.0, 163.0, 101.0, 61.0, 41.0, 38.0, 19.0, 17.0, 9.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.724609375, -0.7000503540039062, -0.6754913330078125, -0.6509323120117188, -0.626373291015625, -0.6018142700195312, -0.5772552490234375, -0.5526962280273438, -0.52813720703125, -0.5035781860351562, -0.4790191650390625, -0.45446014404296875, -0.429901123046875, -0.40534210205078125, -0.3807830810546875, -0.35622406005859375, -0.3316650390625, -0.30710601806640625, -0.2825469970703125, -0.25798797607421875, -0.233428955078125, -0.20886993408203125, -0.1843109130859375, -0.15975189208984375, -0.13519287109375, -0.11063385009765625, -0.0860748291015625, -0.06151580810546875, -0.036956787109375, -0.01239776611328125, 0.0121612548828125, 0.03672027587890625, 0.061279296875, 0.08583831787109375, 0.1103973388671875, 0.13495635986328125, 0.159515380859375, 0.18407440185546875, 0.2086334228515625, 0.23319244384765625, 0.25775146484375, 0.28231048583984375, 0.3068695068359375, 0.33142852783203125, 0.355987548828125, 0.38054656982421875, 0.4051055908203125, 0.42966461181640625, 0.4542236328125, 0.47878265380859375, 0.5033416748046875, 0.5279006958007812, 0.552459716796875, 0.5770187377929688, 0.6015777587890625, 0.6261367797851562, 0.65069580078125, 0.6752548217773438, 0.6998138427734375, 0.7243728637695312, 0.748931884765625, 0.7734909057617188, 0.7980499267578125, 0.8226089477539062, 0.84716796875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 5.0, 3.0, 6.0, 15.0, 10.0, 19.0, 16.0, 20.0, 21.0, 33.0, 36.0, 45.0, 51.0, 74.0, 68.0, 55.0, 82.0, 73.0, 58.0, 49.0, 44.0, 38.0, 37.0, 35.0, 26.0, 18.0, 17.0, 8.0, 7.0, 7.0, 6.0, 4.0, 11.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.84716796875, -0.8255615234375, -0.803955078125, -0.7823486328125, -0.7607421875, -0.7391357421875, -0.717529296875, -0.6959228515625, -0.67431640625, -0.6527099609375, -0.631103515625, -0.6094970703125, -0.587890625, -0.5662841796875, -0.544677734375, -0.5230712890625, -0.50146484375, -0.4798583984375, -0.458251953125, -0.4366455078125, -0.4150390625, -0.3934326171875, -0.371826171875, -0.3502197265625, -0.32861328125, -0.3070068359375, -0.285400390625, -0.2637939453125, -0.2421875, -0.2205810546875, -0.198974609375, -0.1773681640625, -0.15576171875, -0.1341552734375, -0.112548828125, -0.0909423828125, -0.0693359375, -0.0477294921875, -0.026123046875, -0.0045166015625, 0.01708984375, 0.0386962890625, 0.060302734375, 0.0819091796875, 0.103515625, 0.1251220703125, 0.146728515625, 0.1683349609375, 0.18994140625, 0.2115478515625, 0.233154296875, 0.2547607421875, 0.2763671875, 0.2979736328125, 0.319580078125, 0.3411865234375, 0.36279296875, 0.3843994140625, 0.406005859375, 0.4276123046875, 0.44921875, 0.4708251953125, 0.492431640625, 0.5140380859375, 0.53564453125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 5.0, 9.0, 8.0, 19.0, 19.0, 36.0, 39.0, 61.0, 112.0, 164.0, 273.0, 451.0, 926.0, 1971.0, 4869.0, 14080.0, 57095.0, 452818.0, 3310145.0, 288779.0, 43170.0, 11607.0, 4004.0, 1653.0, 810.0, 422.0, 255.0, 157.0, 82.0, 82.0, 44.0, 31.0, 23.0, 25.0, 15.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.947265625, -0.9232330322265625, -0.899200439453125, -0.8751678466796875, -0.85113525390625, -0.8271026611328125, -0.803070068359375, -0.7790374755859375, -0.7550048828125, -0.7309722900390625, -0.706939697265625, -0.6829071044921875, -0.65887451171875, -0.6348419189453125, -0.610809326171875, -0.5867767333984375, -0.562744140625, -0.5387115478515625, -0.514678955078125, -0.4906463623046875, -0.46661376953125, -0.4425811767578125, -0.418548583984375, -0.3945159912109375, -0.3704833984375, -0.3464508056640625, -0.322418212890625, -0.2983856201171875, -0.27435302734375, -0.2503204345703125, -0.226287841796875, -0.2022552490234375, -0.17822265625, -0.1541900634765625, -0.130157470703125, -0.1061248779296875, -0.08209228515625, -0.0580596923828125, -0.034027099609375, -0.0099945068359375, 0.0140380859375, 0.0380706787109375, 0.062103271484375, 0.0861358642578125, 0.11016845703125, 0.1342010498046875, 0.158233642578125, 0.1822662353515625, 0.206298828125, 0.2303314208984375, 0.254364013671875, 0.2783966064453125, 0.30242919921875, 0.3264617919921875, 0.350494384765625, 0.3745269775390625, 0.3985595703125, 0.4225921630859375, 0.446624755859375, 0.4706573486328125, 0.49468994140625, 0.5187225341796875, 0.542755126953125, 0.5667877197265625, 0.5908203125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 10.0, 9.0, 19.0, 16.0, 32.0, 43.0, 45.0, 67.0, 109.0, 164.0, 279.0, 508.0, 736.0, 714.0, 477.0, 274.0, 201.0, 114.0, 68.0, 53.0, 41.0, 28.0, 13.0, 12.0, 10.0, 9.0, 5.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2427978515625, -0.23520851135253906, -0.22761917114257812, -0.2200298309326172, -0.21244049072265625, -0.2048511505126953, -0.19726181030273438, -0.18967247009277344, -0.1820831298828125, -0.17449378967285156, -0.16690444946289062, -0.1593151092529297, -0.15172576904296875, -0.1441364288330078, -0.13654708862304688, -0.12895774841308594, -0.121368408203125, -0.11377906799316406, -0.10618972778320312, -0.09860038757324219, -0.09101104736328125, -0.08342170715332031, -0.07583236694335938, -0.06824302673339844, -0.0606536865234375, -0.05306434631347656, -0.045475006103515625, -0.03788566589355469, -0.03029632568359375, -0.022706985473632812, -0.015117645263671875, -0.0075283050537109375, 6.103515625e-05, 0.0076503753662109375, 0.015239715576171875, 0.022829055786132812, 0.03041839599609375, 0.03800773620605469, 0.045597076416015625, 0.05318641662597656, 0.0607757568359375, 0.06836509704589844, 0.07595443725585938, 0.08354377746582031, 0.09113311767578125, 0.09872245788574219, 0.10631179809570312, 0.11390113830566406, 0.121490478515625, 0.12907981872558594, 0.13666915893554688, 0.1442584991455078, 0.15184783935546875, 0.1594371795654297, 0.16702651977539062, 0.17461585998535156, 0.1822052001953125, 0.18979454040527344, 0.19738388061523438, 0.2049732208251953, 0.21256256103515625, 0.2201519012451172, 0.22774124145507812, 0.23533058166503906, 0.242919921875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 4.0, 13.0, 15.0, 32.0, 42.0, 101.0, 111.0, 134.0, 170.0, 151.0, 101.0, 46.0, 38.0, 12.0, 8.0, 2.0, 3.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.150179386138916, -1.1009091138839722, -1.0516388416290283, -1.0023685693740845, -0.9530983567237854, -0.9038280844688416, -0.8545578122138977, -0.8052875995635986, -0.7560173273086548, -0.7067470550537109, -0.6574767827987671, -0.6082065105438232, -0.5589362978935242, -0.5096660256385803, -0.4603957533836365, -0.411125510931015, -0.3618552088737488, -0.31258493661880493, -0.26331469416618347, -0.21404442191123962, -0.16477416455745697, -0.11550390720367432, -0.06623363494873047, -0.01696339249610901, 0.03230687975883484, 0.08157713711261749, 0.13084739446640015, 0.180117666721344, 0.22938792407512665, 0.2786581814289093, 0.32792845368385315, 0.3771986961364746, 0.42646896839141846, 0.4757392406463623, 0.5250095129013062, 0.57427978515625, 0.6235499978065491, 0.6728202700614929, 0.7220905423164368, 0.7713607549667358, 0.8206310272216797, 0.8699012994766235, 0.9191715717315674, 0.9684418439865112, 1.017712116241455, 1.0669822692871094, 1.1162526607513428, 1.165522813796997, 1.2147932052612305, 1.2640634775161743, 1.3133337497711182, 1.362604022026062, 1.4118742942810059, 1.4611444473266602, 1.5104148387908936, 1.5596849918365479, 1.6089552640914917, 1.6582255363464355, 1.7074958086013794, 1.7567660808563232, 1.806036353111267, 1.855306625366211, 1.9045767784118652, 1.953847050666809, 2.003117322921753]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 16.0, 18.0, 22.0, 28.0, 27.0, 22.0, 44.0, 46.0, 53.0, 45.0, 54.0, 51.0, 63.0, 51.0, 64.0, 58.0, 57.0, 48.0, 41.0, 45.0, 26.0, 31.0, 18.0, 18.0, 5.0, 7.0, 6.0, 8.0, 8.0, 5.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9268340468406677, -0.9035760760307312, -0.8803180456161499, -0.8570600748062134, -0.8338020443916321, -0.8105440735816956, -0.7872860431671143, -0.7640280723571777, -0.7407701015472412, -0.7175121307373047, -0.6942541003227234, -0.6709961295127869, -0.6477380990982056, -0.624480128288269, -0.6012221574783325, -0.5779641270637512, -0.5547060966491699, -0.5314481258392334, -0.5081900954246521, -0.4849321246147156, -0.4616740942001343, -0.43841612339019775, -0.41515812277793884, -0.39190012216567993, -0.368642121553421, -0.3453841209411621, -0.3221261203289032, -0.2988681197166443, -0.27561014890670776, -0.25235211849212646, -0.22909414768218994, -0.20583614706993103, -0.18257814645767212, -0.1593201458454132, -0.1360621452331543, -0.11280415952205658, -0.08954615890979767, -0.06628815829753876, -0.04303017258644104, -0.01977217197418213, 0.0034858286380767822, 0.026743825525045395, 0.05000182241201401, 0.07325981557369232, 0.09651781618595123, 0.11977581679821014, 0.14303380250930786, 0.16629180312156677, 0.18954980373382568, 0.2128078043460846, 0.2360658049583435, 0.25932377576828003, 0.28258180618286133, 0.30583977699279785, 0.32909777760505676, 0.3523557782173157, 0.3756137788295746, 0.3988717794418335, 0.4221297800540924, 0.4453877806663513, 0.46864575147628784, 0.49190378189086914, 0.5151617527008057, 0.5384197235107422, 0.5616777539253235]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 5.0, 6.0, 10.0, 13.0, 16.0, 22.0, 47.0, 61.0, 104.0, 132.0, 231.0, 447.0, 812.0, 1659.0, 3766.0, 9739.0, 30555.0, 145575.0, 556677.0, 233360.0, 43434.0, 12668.0, 4769.0, 2177.0, 1030.0, 532.0, 271.0, 169.0, 84.0, 64.0, 43.0, 24.0, 16.0, 12.0, 7.0, 4.0, 2.0, 3.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1309814453125, -0.12684059143066406, -0.12269973754882812, -0.11855888366699219, -0.11441802978515625, -0.11027717590332031, -0.10613632202148438, -0.10199546813964844, -0.0978546142578125, -0.09371376037597656, -0.08957290649414062, -0.08543205261230469, -0.08129119873046875, -0.07715034484863281, -0.07300949096679688, -0.06886863708496094, -0.064727783203125, -0.06058692932128906, -0.056446075439453125, -0.05230522155761719, -0.04816436767578125, -0.04402351379394531, -0.039882659912109375, -0.03574180603027344, -0.0316009521484375, -0.027460098266601562, -0.023319244384765625, -0.019178390502929688, -0.01503753662109375, -0.010896682739257812, -0.006755828857421875, -0.0026149749755859375, 0.00152587890625, 0.0056667327880859375, 0.009807586669921875, 0.013948440551757812, 0.01808929443359375, 0.022230148315429688, 0.026371002197265625, 0.030511856079101562, 0.0346527099609375, 0.03879356384277344, 0.042934417724609375, 0.04707527160644531, 0.05121612548828125, 0.05535697937011719, 0.059497833251953125, 0.06363868713378906, 0.067779541015625, 0.07192039489746094, 0.07606124877929688, 0.08020210266113281, 0.08434295654296875, 0.08848381042480469, 0.09262466430664062, 0.09676551818847656, 0.1009063720703125, 0.10504722595214844, 0.10918807983398438, 0.11332893371582031, 0.11746978759765625, 0.12161064147949219, 0.12575149536132812, 0.12989234924316406, 0.134033203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 7.0, 6.0, 5.0, 10.0, 28.0, 23.0, 28.0, 27.0, 32.0, 63.0, 50.0, 46.0, 57.0, 67.0, 82.0, 71.0, 66.0, 66.0, 62.0, 47.0, 34.0, 29.0, 29.0, 21.0, 9.0, 9.0, 5.0, 10.0, 6.0, 4.0, 8.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66455078125, -0.6459274291992188, -0.6273040771484375, -0.6086807250976562, -0.590057373046875, -0.5714340209960938, -0.5528106689453125, -0.5341873168945312, -0.51556396484375, -0.49694061279296875, -0.4783172607421875, -0.45969390869140625, -0.441070556640625, -0.42244720458984375, -0.4038238525390625, -0.38520050048828125, -0.3665771484375, -0.34795379638671875, -0.3293304443359375, -0.31070709228515625, -0.292083740234375, -0.27346038818359375, -0.2548370361328125, -0.23621368408203125, -0.21759033203125, -0.19896697998046875, -0.1803436279296875, -0.16172027587890625, -0.143096923828125, -0.12447357177734375, -0.1058502197265625, -0.08722686767578125, -0.068603515625, -0.04998016357421875, -0.0313568115234375, -0.01273345947265625, 0.005889892578125, 0.02451324462890625, 0.0431365966796875, 0.06175994873046875, 0.08038330078125, 0.09900665283203125, 0.1176300048828125, 0.13625335693359375, 0.154876708984375, 0.17350006103515625, 0.1921234130859375, 0.21074676513671875, 0.2293701171875, 0.24799346923828125, 0.2666168212890625, 0.28524017333984375, 0.303863525390625, 0.32248687744140625, 0.3411102294921875, 0.35973358154296875, 0.37835693359375, 0.39698028564453125, 0.4156036376953125, 0.43422698974609375, 0.452850341796875, 0.47147369384765625, 0.4900970458984375, 0.5087203979492188, 0.52734375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 9.0, 8.0, 16.0, 34.0, 50.0, 60.0, 121.0, 166.0, 405.0, 900.0, 2645.0, 11586.0, 115911.0, 746123.0, 152074.0, 13596.0, 2934.0, 1003.0, 403.0, 212.0, 106.0, 65.0, 34.0, 16.0, 12.0, 15.0, 14.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1942138671875, -0.188751220703125, -0.18328857421875, -0.177825927734375, -0.17236328125, -0.166900634765625, -0.16143798828125, -0.155975341796875, -0.1505126953125, -0.145050048828125, -0.13958740234375, -0.134124755859375, -0.128662109375, -0.123199462890625, -0.11773681640625, -0.112274169921875, -0.1068115234375, -0.101348876953125, -0.09588623046875, -0.090423583984375, -0.0849609375, -0.079498291015625, -0.07403564453125, -0.068572998046875, -0.0631103515625, -0.057647705078125, -0.05218505859375, -0.046722412109375, -0.041259765625, -0.035797119140625, -0.03033447265625, -0.024871826171875, -0.0194091796875, -0.013946533203125, -0.00848388671875, -0.003021240234375, 0.00244140625, 0.007904052734375, 0.01336669921875, 0.018829345703125, 0.0242919921875, 0.029754638671875, 0.03521728515625, 0.040679931640625, 0.046142578125, 0.051605224609375, 0.05706787109375, 0.062530517578125, 0.0679931640625, 0.073455810546875, 0.07891845703125, 0.084381103515625, 0.08984375, 0.095306396484375, 0.10076904296875, 0.106231689453125, 0.1116943359375, 0.117156982421875, 0.12261962890625, 0.128082275390625, 0.133544921875, 0.139007568359375, 0.14447021484375, 0.149932861328125, 0.1553955078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 2.0, 0.0, 7.0, 4.0, 6.0, 3.0, 9.0, 12.0, 17.0, 17.0, 19.0, 21.0, 25.0, 30.0, 26.0, 38.0, 44.0, 30.0, 41.0, 42.0, 43.0, 50.0, 43.0, 47.0, 40.0, 44.0, 28.0, 36.0, 35.0, 25.0, 48.0, 29.0, 18.0, 25.0, 24.0, 21.0, 15.0, 5.0, 12.0, 6.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.728515625, -0.7033615112304688, -0.6782073974609375, -0.6530532836914062, -0.627899169921875, -0.6027450561523438, -0.5775909423828125, -0.5524368286132812, -0.52728271484375, -0.5021286010742188, -0.4769744873046875, -0.45182037353515625, -0.426666259765625, -0.40151214599609375, -0.3763580322265625, -0.35120391845703125, -0.3260498046875, -0.30089569091796875, -0.2757415771484375, -0.25058746337890625, -0.225433349609375, -0.20027923583984375, -0.1751251220703125, -0.14997100830078125, -0.12481689453125, -0.09966278076171875, -0.0745086669921875, -0.04935455322265625, -0.024200439453125, 0.00095367431640625, 0.0261077880859375, 0.05126190185546875, 0.076416015625, 0.10157012939453125, 0.1267242431640625, 0.15187835693359375, 0.177032470703125, 0.20218658447265625, 0.2273406982421875, 0.25249481201171875, 0.27764892578125, 0.30280303955078125, 0.3279571533203125, 0.35311126708984375, 0.378265380859375, 0.40341949462890625, 0.4285736083984375, 0.45372772216796875, 0.4788818359375, 0.5040359497070312, 0.5291900634765625, 0.5543441772460938, 0.579498291015625, 0.6046524047851562, 0.6298065185546875, 0.6549606323242188, 0.68011474609375, 0.7052688598632812, 0.7304229736328125, 0.7555770874023438, 0.780731201171875, 0.8058853149414062, 0.8310394287109375, 0.8561935424804688, 0.88134765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 8.0, 14.0, 8.0, 18.0, 26.0, 58.0, 96.0, 237.0, 578.0, 1698.0, 7714.0, 110704.0, 854485.0, 64921.0, 5758.0, 1324.0, 476.0, 204.0, 87.0, 56.0, 35.0, 21.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07965087890625, -0.07694339752197266, -0.07423591613769531, -0.07152843475341797, -0.06882095336914062, -0.06611347198486328, -0.06340599060058594, -0.060698509216308594, -0.05799102783203125, -0.055283546447753906, -0.05257606506347656, -0.04986858367919922, -0.047161102294921875, -0.04445362091064453, -0.04174613952636719, -0.039038658142089844, -0.0363311767578125, -0.033623695373535156, -0.030916213989257812, -0.02820873260498047, -0.025501251220703125, -0.02279376983642578, -0.020086288452148438, -0.017378807067871094, -0.01467132568359375, -0.011963844299316406, -0.009256362915039062, -0.006548881530761719, -0.003841400146484375, -0.0011339187622070312, 0.0015735626220703125, 0.004281044006347656, 0.006988525390625, 0.009696006774902344, 0.012403488159179688, 0.015110969543457031, 0.017818450927734375, 0.02052593231201172, 0.023233413696289062, 0.025940895080566406, 0.02864837646484375, 0.031355857849121094, 0.03406333923339844, 0.03677082061767578, 0.039478302001953125, 0.04218578338623047, 0.04489326477050781, 0.047600746154785156, 0.0503082275390625, 0.053015708923339844, 0.05572319030761719, 0.05843067169189453, 0.061138153076171875, 0.06384563446044922, 0.06655311584472656, 0.0692605972290039, 0.07196807861328125, 0.0746755599975586, 0.07738304138183594, 0.08009052276611328, 0.08279800415039062, 0.08550548553466797, 0.08821296691894531, 0.09092044830322266, 0.0936279296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 8.0, 8.0, 6.0, 11.0, 14.0, 22.0, 31.0, 46.0, 44.0, 55.0, 73.0, 93.0, 84.0, 104.0, 70.0, 84.0, 70.0, 36.0, 43.0, 29.0, 16.0, 15.0, 9.0, 5.0, 9.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.811981201171875e-05, -1.742597669363022e-05, -1.6732141375541687e-05, -1.6038306057453156e-05, -1.5344470739364624e-05, -1.4650635421276093e-05, -1.3956800103187561e-05, -1.326296478509903e-05, -1.2569129467010498e-05, -1.1875294148921967e-05, -1.1181458830833435e-05, -1.0487623512744904e-05, -9.793788194656372e-06, -9.09995287656784e-06, -8.406117558479309e-06, -7.712282240390778e-06, -7.018446922302246e-06, -6.324611604213715e-06, -5.630776286125183e-06, -4.936940968036652e-06, -4.24310564994812e-06, -3.5492703318595886e-06, -2.855435013771057e-06, -2.1615996956825256e-06, -1.4677643775939941e-06, -7.739290595054626e-07, -8.009374141693115e-08, 6.137415766716003e-07, 1.3075768947601318e-06, 2.0014122128486633e-06, 2.695247530937195e-06, 3.3890828490257263e-06, 4.082918167114258e-06, 4.776753485202789e-06, 5.470588803291321e-06, 6.164424121379852e-06, 6.858259439468384e-06, 7.552094757556915e-06, 8.245930075645447e-06, 8.939765393733978e-06, 9.63360071182251e-06, 1.0327436029911041e-05, 1.1021271347999573e-05, 1.1715106666088104e-05, 1.2408941984176636e-05, 1.3102777302265167e-05, 1.3796612620353699e-05, 1.449044793844223e-05, 1.5184283256530762e-05, 1.5878118574619293e-05, 1.6571953892707825e-05, 1.7265789210796356e-05, 1.7959624528884888e-05, 1.865345984697342e-05, 1.934729516506195e-05, 2.0041130483150482e-05, 2.0734965801239014e-05, 2.1428801119327545e-05, 2.2122636437416077e-05, 2.2816471755504608e-05, 2.351030707359314e-05, 2.420414239168167e-05, 2.4897977709770203e-05, 2.5591813027858734e-05, 2.6285648345947266e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 2.0, 10.0, 29.0, 20.0, 22.0, 40.0, 67.0, 89.0, 147.0, 217.0, 361.0, 684.0, 1394.0, 3467.0, 10411.0, 37575.0, 174091.0, 540624.0, 214667.0, 44810.0, 12167.0, 4086.0, 1701.0, 798.0, 400.0, 224.0, 142.0, 88.0, 60.0, 39.0, 26.0, 23.0, 16.0, 13.0, 5.0, 7.0, 10.0, 5.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.04315185546875, -0.041826725006103516, -0.04050159454345703, -0.03917646408081055, -0.03785133361816406, -0.03652620315551758, -0.035201072692871094, -0.03387594223022461, -0.032550811767578125, -0.03122568130493164, -0.029900550842285156, -0.028575420379638672, -0.027250289916992188, -0.025925159454345703, -0.02460002899169922, -0.023274898529052734, -0.02194976806640625, -0.020624637603759766, -0.01929950714111328, -0.017974376678466797, -0.016649246215820312, -0.015324115753173828, -0.013998985290527344, -0.01267385482788086, -0.011348724365234375, -0.01002359390258789, -0.008698463439941406, -0.007373332977294922, -0.0060482025146484375, -0.004723072052001953, -0.0033979415893554688, -0.0020728111267089844, -0.0007476806640625, 0.0005774497985839844, 0.0019025802612304688, 0.003227710723876953, 0.0045528411865234375, 0.005877971649169922, 0.007203102111816406, 0.00852823257446289, 0.009853363037109375, 0.01117849349975586, 0.012503623962402344, 0.013828754425048828, 0.015153884887695312, 0.016479015350341797, 0.01780414581298828, 0.019129276275634766, 0.02045440673828125, 0.021779537200927734, 0.02310466766357422, 0.024429798126220703, 0.025754928588867188, 0.027080059051513672, 0.028405189514160156, 0.02973031997680664, 0.031055450439453125, 0.03238058090209961, 0.033705711364746094, 0.03503084182739258, 0.03635597229003906, 0.03768110275268555, 0.03900623321533203, 0.040331363677978516, 0.041656494140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 11.0, 15.0, 27.0, 24.0, 40.0, 56.0, 78.0, 98.0, 126.0, 110.0, 91.0, 92.0, 69.0, 37.0, 25.0, 27.0, 15.0, 12.0, 7.0, 6.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.019439697265625, -0.018941283226013184, -0.018442869186401367, -0.01794445514678955, -0.017446041107177734, -0.016947627067565918, -0.0164492130279541, -0.015950798988342285, -0.015452384948730469, -0.014953970909118652, -0.014455556869506836, -0.01395714282989502, -0.013458728790283203, -0.012960314750671387, -0.01246190071105957, -0.011963486671447754, -0.011465072631835938, -0.010966658592224121, -0.010468244552612305, -0.009969830513000488, -0.009471416473388672, -0.008973002433776855, -0.008474588394165039, -0.007976174354553223, -0.007477760314941406, -0.00697934627532959, -0.0064809322357177734, -0.005982518196105957, -0.005484104156494141, -0.004985690116882324, -0.004487276077270508, -0.003988862037658691, -0.003490447998046875, -0.0029920339584350586, -0.002493619918823242, -0.0019952058792114258, -0.0014967918395996094, -0.000998377799987793, -0.0004999637603759766, -1.5497207641601562e-06, 0.0004968643188476562, 0.0009952783584594727, 0.001493692398071289, 0.0019921064376831055, 0.002490520477294922, 0.0029889345169067383, 0.0034873485565185547, 0.003985762596130371, 0.0044841766357421875, 0.004982590675354004, 0.00548100471496582, 0.005979418754577637, 0.006477832794189453, 0.0069762468338012695, 0.007474660873413086, 0.007973074913024902, 0.008471488952636719, 0.008969902992248535, 0.009468317031860352, 0.009966731071472168, 0.010465145111083984, 0.0109635591506958, 0.011461973190307617, 0.011960387229919434, 0.01245880126953125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 4.0, 6.0, 11.0, 18.0, 23.0, 53.0, 99.0, 143.0, 165.0, 191.0, 123.0, 74.0, 34.0, 26.0, 4.0, 6.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7739453315734863, -0.7385914325714111, -0.7032375335693359, -0.6678836345672607, -0.6325297355651855, -0.5971758365631104, -0.5618219971656799, -0.5264680981636047, -0.49111419916152954, -0.45576030015945435, -0.42040640115737915, -0.38505253195762634, -0.34969863295555115, -0.31434473395347595, -0.27899086475372314, -0.24363696575164795, -0.20828306674957275, -0.17292916774749756, -0.13757528364658356, -0.10222139209508896, -0.06686750054359436, -0.031513601541519165, 0.0038402825593948364, 0.03919416666030884, 0.07454806566238403, 0.10990195721387863, 0.14525584876537323, 0.18060973286628723, 0.21596363186836243, 0.2513175308704376, 0.28667140007019043, 0.3220252990722656, 0.35737931728363037, 0.39273321628570557, 0.42808711528778076, 0.46344098448753357, 0.49879488348960876, 0.5341488122940063, 0.5695026516914368, 0.604856550693512, 0.6402104496955872, 0.6755643486976624, 0.7109182476997375, 0.7462721467018127, 0.7816259860992432, 0.8169798851013184, 0.8523337841033936, 0.8876876831054688, 0.923041582107544, 0.9583954811096191, 0.9937493801116943, 1.0291032791137695, 1.0644571781158447, 1.09981107711792, 1.1351649761199951, 1.1705188751220703, 1.2058727741241455, 1.2412266731262207, 1.276580572128296, 1.311934471130371, 1.3472883701324463, 1.3826422691345215, 1.4179961681365967, 1.4533500671386719, 1.4887038469314575]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 9.0, 19.0, 18.0, 15.0, 30.0, 28.0, 29.0, 52.0, 57.0, 53.0, 42.0, 66.0, 59.0, 63.0, 74.0, 61.0, 64.0, 47.0, 34.0, 51.0, 24.0, 27.0, 19.0, 8.0, 8.0, 6.0, 8.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.6286386847496033, -0.6116711497306824, -0.5947036147117615, -0.5777360796928406, -0.5607685446739197, -0.543800950050354, -0.5268334150314331, -0.5098658800125122, -0.4928983449935913, -0.4759308099746704, -0.4589632749557495, -0.4419957399368286, -0.4250281751155853, -0.40806064009666443, -0.39109310507774353, -0.37412557005882263, -0.35715803503990173, -0.34019050002098083, -0.32322296500205994, -0.30625540018081665, -0.28928786516189575, -0.27232033014297485, -0.25535279512405396, -0.23838526010513306, -0.22141771018505096, -0.20445017516613007, -0.18748262524604797, -0.17051509022712708, -0.15354755520820618, -0.13658000528812408, -0.11961247026920319, -0.10264492779970169, -0.08567735552787781, -0.06870981305837631, -0.051742274314165115, -0.03477473556995392, -0.017807193100452423, -0.0008396506309509277, 0.01612788438796997, 0.033095426857471466, 0.05006296932697296, 0.06703051179647446, 0.08399805426597595, 0.10096558928489685, 0.11793313175439835, 0.13490067422389984, 0.15186820924282074, 0.16883575916290283, 0.18580329418182373, 0.20277082920074463, 0.21973837912082672, 0.23670591413974762, 0.2536734640598297, 0.2706409990787506, 0.2876085340976715, 0.3045760691165924, 0.3215436339378357, 0.3385111689567566, 0.3554787039756775, 0.3724462389945984, 0.3894138038158417, 0.4063813388347626, 0.42334887385368347, 0.44031640887260437, 0.45728394389152527]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 8.0, 13.0, 15.0, 18.0, 27.0, 26.0, 52.0, 65.0, 97.0, 152.0, 240.0, 371.0, 542.0, 984.0, 1742.0, 3274.0, 6292.0, 14167.0, 38506.0, 148930.0, 630759.0, 138168.0, 36640.0, 14022.0, 6118.0, 3119.0, 1621.0, 931.0, 556.0, 372.0, 224.0, 156.0, 98.0, 61.0, 53.0, 42.0, 25.0, 15.0, 12.0, 9.0, 9.0, 3.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.3858642578125, -0.372314453125, -0.3587646484375, -0.34521484375, -0.3316650390625, -0.318115234375, -0.3045654296875, -0.291015625, -0.2774658203125, -0.263916015625, -0.2503662109375, -0.23681640625, -0.2232666015625, -0.209716796875, -0.1961669921875, -0.1826171875, -0.1690673828125, -0.155517578125, -0.1419677734375, -0.12841796875, -0.1148681640625, -0.101318359375, -0.0877685546875, -0.07421875, -0.0606689453125, -0.047119140625, -0.0335693359375, -0.02001953125, -0.0064697265625, 0.007080078125, 0.0206298828125, 0.0341796875, 0.0477294921875, 0.061279296875, 0.0748291015625, 0.08837890625, 0.1019287109375, 0.115478515625, 0.1290283203125, 0.142578125, 0.1561279296875, 0.169677734375, 0.1832275390625, 0.19677734375, 0.2103271484375, 0.223876953125, 0.2374267578125, 0.2509765625, 0.2645263671875, 0.278076171875, 0.2916259765625, 0.30517578125, 0.3187255859375, 0.332275390625, 0.3458251953125, 0.359375, 0.3729248046875, 0.386474609375, 0.4000244140625, 0.41357421875, 0.4271240234375, 0.440673828125, 0.4542236328125, 0.4677734375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 4.0, 8.0, 13.0, 17.0, 18.0, 22.0, 26.0, 37.0, 42.0, 47.0, 54.0, 57.0, 50.0, 66.0, 64.0, 64.0, 76.0, 70.0, 67.0, 33.0, 37.0, 38.0, 13.0, 20.0, 7.0, 4.0, 8.0, 10.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2230072021484375, -1.187225341796875, -1.1514434814453125, -1.11566162109375, -1.0798797607421875, -1.044097900390625, -1.0083160400390625, -0.9725341796875, -0.9367523193359375, -0.900970458984375, -0.8651885986328125, -0.82940673828125, -0.7936248779296875, -0.757843017578125, -0.7220611572265625, -0.686279296875, -0.6504974365234375, -0.614715576171875, -0.5789337158203125, -0.54315185546875, -0.5073699951171875, -0.471588134765625, -0.4358062744140625, -0.4000244140625, -0.3642425537109375, -0.328460693359375, -0.2926788330078125, -0.25689697265625, -0.2211151123046875, -0.185333251953125, -0.1495513916015625, -0.11376953125, -0.0779876708984375, -0.042205810546875, -0.0064239501953125, 0.02935791015625, 0.0651397705078125, 0.100921630859375, 0.1367034912109375, 0.1724853515625, 0.2082672119140625, 0.244049072265625, 0.2798309326171875, 0.31561279296875, 0.3513946533203125, 0.387176513671875, 0.4229583740234375, 0.458740234375, 0.4945220947265625, 0.530303955078125, 0.5660858154296875, 0.60186767578125, 0.6376495361328125, 0.673431396484375, 0.7092132568359375, 0.7449951171875, 0.7807769775390625, 0.816558837890625, 0.8523406982421875, 0.88812255859375, 0.9239044189453125, 0.959686279296875, 0.9954681396484375, 1.03125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 8.0, 2.0, 13.0, 14.0, 24.0, 22.0, 25.0, 35.0, 67.0, 101.0, 114.0, 233.0, 333.0, 663.0, 1576.0, 4367.0, 15221.0, 77891.0, 755247.0, 158287.0, 23947.0, 6281.0, 2123.0, 854.0, 386.0, 257.0, 128.0, 104.0, 61.0, 43.0, 40.0, 22.0, 13.0, 12.0, 8.0, 9.0, 9.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.5458984375, -0.5291824340820312, -0.5124664306640625, -0.49575042724609375, -0.479034423828125, -0.46231842041015625, -0.4456024169921875, -0.42888641357421875, -0.41217041015625, -0.39545440673828125, -0.3787384033203125, -0.36202239990234375, -0.345306396484375, -0.32859039306640625, -0.3118743896484375, -0.29515838623046875, -0.2784423828125, -0.26172637939453125, -0.2450103759765625, -0.22829437255859375, -0.211578369140625, -0.19486236572265625, -0.1781463623046875, -0.16143035888671875, -0.14471435546875, -0.12799835205078125, -0.1112823486328125, -0.09456634521484375, -0.077850341796875, -0.06113433837890625, -0.0444183349609375, -0.02770233154296875, -0.010986328125, 0.00572967529296875, 0.0224456787109375, 0.03916168212890625, 0.055877685546875, 0.07259368896484375, 0.0893096923828125, 0.10602569580078125, 0.12274169921875, 0.13945770263671875, 0.1561737060546875, 0.17288970947265625, 0.189605712890625, 0.20632171630859375, 0.2230377197265625, 0.23975372314453125, 0.2564697265625, 0.27318572998046875, 0.2899017333984375, 0.30661773681640625, 0.323333740234375, 0.34004974365234375, 0.3567657470703125, 0.37348175048828125, 0.39019775390625, 0.40691375732421875, 0.4236297607421875, 0.44034576416015625, 0.457061767578125, 0.47377777099609375, 0.4904937744140625, 0.5072097778320312, 0.52392578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 3.0, 5.0, 9.0, 9.0, 13.0, 14.0, 15.0, 14.0, 28.0, 31.0, 39.0, 43.0, 45.0, 48.0, 43.0, 44.0, 53.0, 53.0, 65.0, 55.0, 46.0, 47.0, 33.0, 31.0, 46.0, 27.0, 27.0, 25.0, 20.0, 15.0, 8.0, 13.0, 8.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.2158203125, -1.1785430908203125, -1.141265869140625, -1.1039886474609375, -1.06671142578125, -1.0294342041015625, -0.992156982421875, -0.9548797607421875, -0.9176025390625, -0.8803253173828125, -0.843048095703125, -0.8057708740234375, -0.76849365234375, -0.7312164306640625, -0.693939208984375, -0.6566619873046875, -0.619384765625, -0.5821075439453125, -0.544830322265625, -0.5075531005859375, -0.47027587890625, -0.4329986572265625, -0.395721435546875, -0.3584442138671875, -0.3211669921875, -0.2838897705078125, -0.246612548828125, -0.2093353271484375, -0.17205810546875, -0.1347808837890625, -0.097503662109375, -0.0602264404296875, -0.02294921875, 0.0143280029296875, 0.051605224609375, 0.0888824462890625, 0.12615966796875, 0.1634368896484375, 0.200714111328125, 0.2379913330078125, 0.2752685546875, 0.3125457763671875, 0.349822998046875, 0.3871002197265625, 0.42437744140625, 0.4616546630859375, 0.498931884765625, 0.5362091064453125, 0.573486328125, 0.6107635498046875, 0.648040771484375, 0.6853179931640625, 0.72259521484375, 0.7598724365234375, 0.797149658203125, 0.8344268798828125, 0.8717041015625, 0.9089813232421875, 0.946258544921875, 0.9835357666015625, 1.02081298828125, 1.0580902099609375, 1.095367431640625, 1.1326446533203125, 1.169921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 11.0, 15.0, 11.0, 21.0, 20.0, 32.0, 49.0, 63.0, 102.0, 140.0, 201.0, 343.0, 612.0, 1042.0, 2182.0, 4737.0, 13996.0, 64539.0, 662850.0, 245559.0, 35455.0, 9209.0, 3427.0, 1600.0, 874.0, 466.0, 306.0, 224.0, 130.0, 91.0, 57.0, 51.0, 36.0, 26.0, 14.0, 14.0, 14.0, 5.0, 3.0, 2.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.166259765625, -0.160491943359375, -0.15472412109375, -0.148956298828125, -0.1431884765625, -0.137420654296875, -0.13165283203125, -0.125885009765625, -0.1201171875, -0.114349365234375, -0.10858154296875, -0.102813720703125, -0.0970458984375, -0.091278076171875, -0.08551025390625, -0.079742431640625, -0.073974609375, -0.068206787109375, -0.06243896484375, -0.056671142578125, -0.0509033203125, -0.045135498046875, -0.03936767578125, -0.033599853515625, -0.02783203125, -0.022064208984375, -0.01629638671875, -0.010528564453125, -0.0047607421875, 0.001007080078125, 0.00677490234375, 0.012542724609375, 0.018310546875, 0.024078369140625, 0.02984619140625, 0.035614013671875, 0.0413818359375, 0.047149658203125, 0.05291748046875, 0.058685302734375, 0.064453125, 0.070220947265625, 0.07598876953125, 0.081756591796875, 0.0875244140625, 0.093292236328125, 0.09906005859375, 0.104827880859375, 0.110595703125, 0.116363525390625, 0.12213134765625, 0.127899169921875, 0.1336669921875, 0.139434814453125, 0.14520263671875, 0.150970458984375, 0.15673828125, 0.162506103515625, 0.16827392578125, 0.174041748046875, 0.1798095703125, 0.185577392578125, 0.19134521484375, 0.197113037109375, 0.202880859375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 9.0, 8.0, 6.0, 6.0, 14.0, 18.0, 25.0, 29.0, 35.0, 55.0, 80.0, 132.0, 211.0, 94.0, 54.0, 57.0, 34.0, 32.0, 24.0, 9.0, 17.0, 9.0, 12.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.314018249511719e-05, -3.2316893339157104e-05, -3.149360418319702e-05, -3.067031502723694e-05, -2.9847025871276855e-05, -2.9023736715316772e-05, -2.820044755935669e-05, -2.7377158403396606e-05, -2.6553869247436523e-05, -2.573058009147644e-05, -2.4907290935516357e-05, -2.4084001779556274e-05, -2.326071262359619e-05, -2.243742346763611e-05, -2.1614134311676025e-05, -2.0790845155715942e-05, -1.996755599975586e-05, -1.9144266843795776e-05, -1.8320977687835693e-05, -1.749768853187561e-05, -1.6674399375915527e-05, -1.5851110219955444e-05, -1.5027821063995361e-05, -1.4204531908035278e-05, -1.3381242752075195e-05, -1.2557953596115112e-05, -1.173466444015503e-05, -1.0911375284194946e-05, -1.0088086128234863e-05, -9.26479697227478e-06, -8.441507816314697e-06, -7.618218660354614e-06, -6.794929504394531e-06, -5.971640348434448e-06, -5.148351192474365e-06, -4.325062036514282e-06, -3.5017728805541992e-06, -2.678483724594116e-06, -1.8551945686340332e-06, -1.0319054126739502e-06, -2.086162567138672e-07, 6.146728992462158e-07, 1.4379620552062988e-06, 2.261251211166382e-06, 3.084540367126465e-06, 3.907829523086548e-06, 4.731118679046631e-06, 5.554407835006714e-06, 6.377696990966797e-06, 7.20098614692688e-06, 8.024275302886963e-06, 8.847564458847046e-06, 9.670853614807129e-06, 1.0494142770767212e-05, 1.1317431926727295e-05, 1.2140721082687378e-05, 1.2964010238647461e-05, 1.3787299394607544e-05, 1.4610588550567627e-05, 1.543387770652771e-05, 1.6257166862487793e-05, 1.7080456018447876e-05, 1.790374517440796e-05, 1.8727034330368042e-05, 1.9550323486328125e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 9.0, 0.0, 8.0, 10.0, 24.0, 14.0, 27.0, 32.0, 57.0, 68.0, 80.0, 142.0, 185.0, 300.0, 439.0, 690.0, 1126.0, 2047.0, 3835.0, 8750.0, 25453.0, 109678.0, 685609.0, 155891.0, 33171.0, 10479.0, 4510.0, 2264.0, 1265.0, 829.0, 489.0, 329.0, 207.0, 171.0, 77.0, 67.0, 63.0, 41.0, 28.0, 26.0, 21.0, 13.0, 6.0, 9.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.1522216796875, -0.1470794677734375, -0.141937255859375, -0.1367950439453125, -0.13165283203125, -0.1265106201171875, -0.121368408203125, -0.1162261962890625, -0.111083984375, -0.1059417724609375, -0.100799560546875, -0.0956573486328125, -0.09051513671875, -0.0853729248046875, -0.080230712890625, -0.0750885009765625, -0.0699462890625, -0.0648040771484375, -0.059661865234375, -0.0545196533203125, -0.04937744140625, -0.0442352294921875, -0.039093017578125, -0.0339508056640625, -0.02880859375, -0.0236663818359375, -0.018524169921875, -0.0133819580078125, -0.00823974609375, -0.0030975341796875, 0.002044677734375, 0.0071868896484375, 0.0123291015625, 0.0174713134765625, 0.022613525390625, 0.0277557373046875, 0.03289794921875, 0.0380401611328125, 0.043182373046875, 0.0483245849609375, 0.053466796875, 0.0586090087890625, 0.063751220703125, 0.0688934326171875, 0.07403564453125, 0.0791778564453125, 0.084320068359375, 0.0894622802734375, 0.0946044921875, 0.0997467041015625, 0.104888916015625, 0.1100311279296875, 0.11517333984375, 0.1203155517578125, 0.125457763671875, 0.1305999755859375, 0.1357421875, 0.1408843994140625, 0.146026611328125, 0.1511688232421875, 0.15631103515625, 0.1614532470703125, 0.166595458984375, 0.1717376708984375, 0.1768798828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 5.0, 0.0, 5.0, 3.0, 7.0, 8.0, 8.0, 9.0, 6.0, 17.0, 15.0, 17.0, 39.0, 39.0, 65.0, 85.0, 289.0, 121.0, 62.0, 38.0, 31.0, 36.0, 21.0, 16.0, 14.0, 16.0, 9.0, 6.0, 4.0, 4.0, 1.0, 6.0, 0.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.11865234375, -0.11573410034179688, -0.11281585693359375, -0.10989761352539062, -0.1069793701171875, -0.10406112670898438, -0.10114288330078125, -0.09822463989257812, -0.095306396484375, -0.09238815307617188, -0.08946990966796875, -0.08655166625976562, -0.0836334228515625, -0.08071517944335938, -0.07779693603515625, -0.07487869262695312, -0.07196044921875, -0.06904220581054688, -0.06612396240234375, -0.06320571899414062, -0.0602874755859375, -0.057369232177734375, -0.05445098876953125, -0.051532745361328125, -0.048614501953125, -0.045696258544921875, -0.04277801513671875, -0.039859771728515625, -0.0369415283203125, -0.034023284912109375, -0.03110504150390625, -0.028186798095703125, -0.0252685546875, -0.022350311279296875, -0.01943206787109375, -0.016513824462890625, -0.0135955810546875, -0.010677337646484375, -0.00775909423828125, -0.004840850830078125, -0.001922607421875, 0.000995635986328125, 0.00391387939453125, 0.006832122802734375, 0.0097503662109375, 0.012668609619140625, 0.01558685302734375, 0.018505096435546875, 0.02142333984375, 0.024341583251953125, 0.02725982666015625, 0.030178070068359375, 0.0330963134765625, 0.036014556884765625, 0.03893280029296875, 0.041851043701171875, 0.044769287109375, 0.047687530517578125, 0.05060577392578125, 0.053524017333984375, 0.0564422607421875, 0.059360504150390625, 0.06227874755859375, 0.06519699096679688, 0.068115234375]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 8.0, 3.0, 10.0, 15.0, 36.0, 54.0, 100.0, 128.0, 187.0, 173.0, 105.0, 76.0, 42.0, 23.0, 12.0, 4.0, 3.0, 4.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.635367512702942, -1.566827654838562, -1.4982876777648926, -1.4297478199005127, -1.3612079620361328, -1.292668104171753, -1.2241281270980835, -1.1555882692337036, -1.0870482921600342, -1.0185084342956543, -0.9499685168266296, -0.881428599357605, -0.8128887414932251, -0.7443488240242004, -0.6758089065551758, -0.6072690486907959, -0.538729190826416, -0.47018930315971375, -0.4016494154930115, -0.3331094980239868, -0.26456961035728455, -0.19602972269058228, -0.12748980522155762, -0.05894991755485535, 0.009589970111846924, 0.07812986522912979, 0.14666976034641266, 0.21520966291427612, 0.2837495505809784, 0.35228943824768066, 0.4208293557167053, 0.4893692433834076, 0.5579092502593994, 0.6264491677284241, 0.694989025592804, 0.7635289430618286, 0.8320688009262085, 0.9006087183952332, 0.9691486358642578, 1.0376884937286377, 1.1062283515930176, 1.1747682094573975, 1.243308186531067, 1.3118480443954468, 1.3803879022598267, 1.448927879333496, 1.517467737197876, 1.5860075950622559, 1.6545475721359253, 1.7230874300003052, 1.7916274070739746, 1.8601672649383545, 1.9287071228027344, 1.9972469806671143, 2.065786838531494, 2.134326934814453, 2.202866792678833, 2.271406650543213, 2.3399465084075928, 2.4084863662719727, 2.4770264625549316, 2.5455663204193115, 2.6141061782836914, 2.6826460361480713, 2.751185894012451]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 1.0, 12.0, 4.0, 6.0, 10.0, 12.0, 15.0, 14.0, 16.0, 22.0, 24.0, 34.0, 26.0, 30.0, 26.0, 29.0, 40.0, 30.0, 29.0, 34.0, 41.0, 41.0, 49.0, 34.0, 42.0, 45.0, 31.0, 34.0, 24.0, 35.0, 20.0, 21.0, 22.0, 11.0, 20.0, 15.0, 15.0, 11.0, 19.0, 10.0, 9.0, 8.0, 3.0, 5.0, 9.0, 6.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4208166599273682, -1.3733447790145874, -1.325872778892517, -1.2784008979797363, -1.230928897857666, -1.1834570169448853, -1.135985016822815, -1.0885131359100342, -1.0410411357879639, -0.9935691952705383, -0.9460972547531128, -0.8986253142356873, -0.8511533737182617, -0.8036814332008362, -0.7562094926834106, -0.7087376117706299, -0.6612656712532043, -0.6137937307357788, -0.5663217902183533, -0.5188498497009277, -0.4713779091835022, -0.42390596866607666, -0.3764340579509735, -0.328962117433548, -0.28149017691612244, -0.2340182363986969, -0.18654629588127136, -0.13907437026500702, -0.09160242974758148, -0.044130489230155945, 0.0033414363861083984, 0.050813376903533936, 0.09828531742095947, 0.145757257938385, 0.19322919845581055, 0.2407011240720749, 0.2881730794906616, 0.33564502000808716, 0.3831169307231903, 0.43058887124061584, 0.4780608117580414, 0.5255327224731445, 0.5730046629905701, 0.6204766035079956, 0.6679485440254211, 0.7154204845428467, 0.7628924250602722, 0.8103643655776978, 0.8578363060951233, 0.9053082466125488, 0.9527801871299744, 1.0002521276474, 1.0477240085601807, 1.095196008682251, 1.1426678895950317, 1.190139889717102, 1.2376117706298828, 1.2850836515426636, 1.3325556516647339, 1.3800275325775146, 1.427499532699585, 1.4749714136123657, 1.522443413734436, 1.5699152946472168, 1.617387294769287]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 8.0, 12.0, 17.0, 17.0, 31.0, 32.0, 33.0, 55.0, 81.0, 101.0, 142.0, 202.0, 312.0, 498.0, 861.0, 1399.0, 2468.0, 4862.0, 11119.0, 29758.0, 109475.0, 736566.0, 2778230.0, 408661.0, 70746.0, 20875.0, 8452.0, 3989.0, 2100.0, 1094.0, 693.0, 407.0, 296.0, 196.0, 125.0, 92.0, 75.0, 46.0, 42.0, 28.0, 18.0, 15.0, 14.0, 14.0, 9.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60546875, -0.5841217041015625, -0.562774658203125, -0.5414276123046875, -0.52008056640625, -0.4987335205078125, -0.477386474609375, -0.4560394287109375, -0.4346923828125, -0.4133453369140625, -0.391998291015625, -0.3706512451171875, -0.34930419921875, -0.3279571533203125, -0.306610107421875, -0.2852630615234375, -0.263916015625, -0.2425689697265625, -0.221221923828125, -0.1998748779296875, -0.17852783203125, -0.1571807861328125, -0.135833740234375, -0.1144866943359375, -0.0931396484375, -0.0717926025390625, -0.050445556640625, -0.0290985107421875, -0.00775146484375, 0.0135955810546875, 0.034942626953125, 0.0562896728515625, 0.07763671875, 0.0989837646484375, 0.120330810546875, 0.1416778564453125, 0.16302490234375, 0.1843719482421875, 0.205718994140625, 0.2270660400390625, 0.2484130859375, 0.2697601318359375, 0.291107177734375, 0.3124542236328125, 0.33380126953125, 0.3551483154296875, 0.376495361328125, 0.3978424072265625, 0.419189453125, 0.4405364990234375, 0.461883544921875, 0.4832305908203125, 0.50457763671875, 0.5259246826171875, 0.547271728515625, 0.5686187744140625, 0.5899658203125, 0.6113128662109375, 0.632659912109375, 0.6540069580078125, 0.67535400390625, 0.6967010498046875, 0.718048095703125, 0.7393951416015625, 0.7607421875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 5.0, 14.0, 14.0, 21.0, 20.0, 33.0, 39.0, 63.0, 58.0, 78.0, 80.0, 67.0, 77.0, 70.0, 71.0, 57.0, 46.0, 39.0, 31.0, 29.0, 20.0, 18.0, 13.0, 8.0, 6.0, 2.0, 3.0, 3.0, 0.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.91796875, -0.8950424194335938, -0.8721160888671875, -0.8491897583007812, -0.826263427734375, -0.8033370971679688, -0.7804107666015625, -0.7574844360351562, -0.73455810546875, -0.7116317749023438, -0.6887054443359375, -0.6657791137695312, -0.642852783203125, -0.6199264526367188, -0.5970001220703125, -0.5740737915039062, -0.5511474609375, -0.5282211303710938, -0.5052947998046875, -0.48236846923828125, -0.459442138671875, -0.43651580810546875, -0.4135894775390625, -0.39066314697265625, -0.36773681640625, -0.34481048583984375, -0.3218841552734375, -0.29895782470703125, -0.276031494140625, -0.25310516357421875, -0.2301788330078125, -0.20725250244140625, -0.184326171875, -0.16139984130859375, -0.1384735107421875, -0.11554718017578125, -0.092620849609375, -0.06969451904296875, -0.0467681884765625, -0.02384185791015625, -0.00091552734375, 0.02201080322265625, 0.0449371337890625, 0.06786346435546875, 0.090789794921875, 0.11371612548828125, 0.1366424560546875, 0.15956878662109375, 0.1824951171875, 0.20542144775390625, 0.2283477783203125, 0.25127410888671875, 0.274200439453125, 0.29712677001953125, 0.3200531005859375, 0.34297943115234375, 0.36590576171875, 0.38883209228515625, 0.4117584228515625, 0.43468475341796875, 0.457611083984375, 0.48053741455078125, 0.5034637451171875, 0.5263900756835938, 0.54931640625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 13.0, 6.0, 8.0, 18.0, 29.0, 42.0, 70.0, 143.0, 217.0, 439.0, 817.0, 1982.0, 5299.0, 17995.0, 90076.0, 1489551.0, 2436977.0, 118445.0, 21597.0, 6341.0, 2202.0, 912.0, 464.0, 239.0, 145.0, 81.0, 51.0, 27.0, 31.0, 17.0, 7.0, 8.0, 8.0, 2.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75732421875, -0.7303390502929688, -0.7033538818359375, -0.6763687133789062, -0.649383544921875, -0.6223983764648438, -0.5954132080078125, -0.5684280395507812, -0.54144287109375, -0.5144577026367188, -0.4874725341796875, -0.46048736572265625, -0.433502197265625, -0.40651702880859375, -0.3795318603515625, -0.35254669189453125, -0.3255615234375, -0.29857635498046875, -0.2715911865234375, -0.24460601806640625, -0.217620849609375, -0.19063568115234375, -0.1636505126953125, -0.13666534423828125, -0.10968017578125, -0.08269500732421875, -0.0557098388671875, -0.02872467041015625, -0.001739501953125, 0.02524566650390625, 0.0522308349609375, 0.07921600341796875, 0.106201171875, 0.13318634033203125, 0.1601715087890625, 0.18715667724609375, 0.214141845703125, 0.24112701416015625, 0.2681121826171875, 0.29509735107421875, 0.32208251953125, 0.34906768798828125, 0.3760528564453125, 0.40303802490234375, 0.430023193359375, 0.45700836181640625, 0.4839935302734375, 0.5109786987304688, 0.5379638671875, 0.5649490356445312, 0.5919342041015625, 0.6189193725585938, 0.645904541015625, 0.6728897094726562, 0.6998748779296875, 0.7268600463867188, 0.75384521484375, 0.7808303833007812, 0.8078155517578125, 0.8348007202148438, 0.861785888671875, 0.8887710571289062, 0.9157562255859375, 0.9427413940429688, 0.9697265625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 10.0, 4.0, 9.0, 15.0, 11.0, 19.0, 22.0, 30.0, 37.0, 50.0, 78.0, 92.0, 186.0, 253.0, 397.0, 563.0, 695.0, 538.0, 366.0, 209.0, 139.0, 94.0, 58.0, 56.0, 41.0, 27.0, 16.0, 8.0, 9.0, 10.0, 2.0, 9.0, 9.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1898193359375, -0.18312835693359375, -0.1764373779296875, -0.16974639892578125, -0.163055419921875, -0.15636444091796875, -0.1496734619140625, -0.14298248291015625, -0.13629150390625, -0.12960052490234375, -0.1229095458984375, -0.11621856689453125, -0.109527587890625, -0.10283660888671875, -0.0961456298828125, -0.08945465087890625, -0.082763671875, -0.07607269287109375, -0.0693817138671875, -0.06269073486328125, -0.055999755859375, -0.04930877685546875, -0.0426177978515625, -0.03592681884765625, -0.02923583984375, -0.02254486083984375, -0.0158538818359375, -0.00916290283203125, -0.002471923828125, 0.00421905517578125, 0.0109100341796875, 0.01760101318359375, 0.0242919921875, 0.03098297119140625, 0.0376739501953125, 0.04436492919921875, 0.051055908203125, 0.05774688720703125, 0.0644378662109375, 0.07112884521484375, 0.07781982421875, 0.08451080322265625, 0.0912017822265625, 0.09789276123046875, 0.104583740234375, 0.11127471923828125, 0.1179656982421875, 0.12465667724609375, 0.13134765625, 0.13803863525390625, 0.1447296142578125, 0.15142059326171875, 0.158111572265625, 0.16480255126953125, 0.1714935302734375, 0.17818450927734375, 0.18487548828125, 0.19156646728515625, 0.1982574462890625, 0.20494842529296875, 0.211639404296875, 0.21833038330078125, 0.2250213623046875, 0.23171234130859375, 0.2384033203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 8.0, 20.0, 23.0, 46.0, 66.0, 91.0, 141.0, 150.0, 138.0, 116.0, 79.0, 38.0, 23.0, 11.0, 13.0, 6.0, 6.0, 3.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0598151683807373, -1.0149309635162354, -0.970046877861023, -0.9251627326011658, -0.8802785873413086, -0.8353944420814514, -0.7905102968215942, -0.7456261515617371, -0.7007420063018799, -0.6558578610420227, -0.6109737157821655, -0.5660895705223083, -0.5212054252624512, -0.476321280002594, -0.4314371347427368, -0.38655298948287964, -0.34166884422302246, -0.2967846989631653, -0.2519005537033081, -0.20701640844345093, -0.16213226318359375, -0.11724811792373657, -0.0723639726638794, -0.027479827404022217, 0.01740431785583496, 0.06228846311569214, 0.10717260837554932, 0.1520567536354065, 0.19694089889526367, 0.24182504415512085, 0.286709189414978, 0.3315933346748352, 0.3764774799346924, 0.42136162519454956, 0.46624577045440674, 0.5111299157142639, 0.5560140609741211, 0.6008982062339783, 0.6457823514938354, 0.6906664967536926, 0.7355506420135498, 0.780434787273407, 0.8253189325332642, 0.8702030777931213, 0.9150872230529785, 0.9599713683128357, 1.0048555135726929, 1.0497395992279053, 1.0946238040924072, 1.1395080089569092, 1.1843920946121216, 1.229276180267334, 1.274160385131836, 1.319044589996338, 1.3639286756515503, 1.4088127613067627, 1.4536969661712646, 1.4985811710357666, 1.543465256690979, 1.5883493423461914, 1.6332335472106934, 1.6781177520751953, 1.7230018377304077, 1.7678859233856201, 1.812770128250122]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 11.0, 11.0, 15.0, 17.0, 20.0, 32.0, 32.0, 43.0, 48.0, 45.0, 62.0, 64.0, 50.0, 40.0, 43.0, 57.0, 50.0, 44.0, 48.0, 49.0, 37.0, 32.0, 23.0, 17.0, 22.0, 15.0, 15.0, 9.0, 8.0, 10.0, 3.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.7947525978088379, -0.7748867273330688, -0.7550208568572998, -0.735154926776886, -0.7152890563011169, -0.6954231858253479, -0.6755573153495789, -0.6556914448738098, -0.635825514793396, -0.615959644317627, -0.5960937738418579, -0.5762278437614441, -0.556361973285675, -0.536496102809906, -0.516630232334137, -0.4967643618583679, -0.4768984913825989, -0.45703262090682983, -0.4371667206287384, -0.41730085015296936, -0.39743494987487793, -0.3775690793991089, -0.35770320892333984, -0.3378373384475708, -0.31797143816947937, -0.2981055676937103, -0.2782396674156189, -0.25837379693984985, -0.23850791156291962, -0.21864202618598938, -0.19877615571022034, -0.1789102703332901, -0.15904444456100464, -0.1391785591840744, -0.11931268125772476, -0.09944680333137512, -0.07958091795444489, -0.05971503257751465, -0.03984915465116501, -0.01998327672481537, -0.00011739134788513184, 0.019748490303754807, 0.039614371955394745, 0.05948025360703468, 0.07934613525867462, 0.09921202063560486, 0.1190778985619545, 0.13894377648830414, 0.15880966186523438, 0.1786755472421646, 0.19854143261909485, 0.2184073030948639, 0.23827318847179413, 0.25813907384872437, 0.2780049443244934, 0.29787081480026245, 0.3177367150783539, 0.3376025855541229, 0.35746848583221436, 0.3773343563079834, 0.39720022678375244, 0.41706612706184387, 0.4369319975376129, 0.45679789781570435, 0.4766637682914734]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 9.0, 7.0, 9.0, 20.0, 29.0, 57.0, 75.0, 130.0, 193.0, 344.0, 604.0, 1127.0, 2359.0, 4869.0, 12318.0, 41881.0, 232869.0, 564448.0, 141105.0, 28622.0, 9316.0, 3930.0, 1946.0, 996.0, 541.0, 296.0, 161.0, 101.0, 65.0, 42.0, 30.0, 17.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14635658264160156, -0.14183425903320312, -0.1373119354248047, -0.13278961181640625, -0.1282672882080078, -0.12374496459960938, -0.11922264099121094, -0.1147003173828125, -0.11017799377441406, -0.10565567016601562, -0.10113334655761719, -0.09661102294921875, -0.09208869934082031, -0.08756637573242188, -0.08304405212402344, -0.078521728515625, -0.07399940490722656, -0.06947708129882812, -0.06495475769042969, -0.06043243408203125, -0.05591011047363281, -0.051387786865234375, -0.04686546325683594, -0.0423431396484375, -0.03782081604003906, -0.033298492431640625, -0.028776168823242188, -0.02425384521484375, -0.019731521606445312, -0.015209197998046875, -0.010686874389648438, -0.00616455078125, -0.0016422271728515625, 0.002880096435546875, 0.0074024200439453125, 0.01192474365234375, 0.016447067260742188, 0.020969390869140625, 0.025491714477539062, 0.0300140380859375, 0.03453636169433594, 0.039058685302734375, 0.04358100891113281, 0.04810333251953125, 0.05262565612792969, 0.057147979736328125, 0.06167030334472656, 0.066192626953125, 0.07071495056152344, 0.07523727416992188, 0.07975959777832031, 0.08428192138671875, 0.08880424499511719, 0.09332656860351562, 0.09784889221191406, 0.1023712158203125, 0.10689353942871094, 0.11141586303710938, 0.11593818664550781, 0.12046051025390625, 0.12498283386230469, 0.12950515747070312, 0.13402748107910156, 0.1385498046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 14.0, 10.0, 10.0, 17.0, 26.0, 29.0, 36.0, 42.0, 55.0, 68.0, 84.0, 74.0, 79.0, 71.0, 58.0, 68.0, 58.0, 45.0, 38.0, 31.0, 21.0, 15.0, 14.0, 7.0, 11.0, 8.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.57666015625, -0.558929443359375, -0.54119873046875, -0.523468017578125, -0.5057373046875, -0.488006591796875, -0.47027587890625, -0.452545166015625, -0.434814453125, -0.417083740234375, -0.39935302734375, -0.381622314453125, -0.3638916015625, -0.346160888671875, -0.32843017578125, -0.310699462890625, -0.29296875, -0.275238037109375, -0.25750732421875, -0.239776611328125, -0.2220458984375, -0.204315185546875, -0.18658447265625, -0.168853759765625, -0.151123046875, -0.133392333984375, -0.11566162109375, -0.097930908203125, -0.0802001953125, -0.062469482421875, -0.04473876953125, -0.027008056640625, -0.00927734375, 0.008453369140625, 0.02618408203125, 0.043914794921875, 0.0616455078125, 0.079376220703125, 0.09710693359375, 0.114837646484375, 0.132568359375, 0.150299072265625, 0.16802978515625, 0.185760498046875, 0.2034912109375, 0.221221923828125, 0.23895263671875, 0.256683349609375, 0.2744140625, 0.292144775390625, 0.30987548828125, 0.327606201171875, 0.3453369140625, 0.363067626953125, 0.38079833984375, 0.398529052734375, 0.416259765625, 0.433990478515625, 0.45172119140625, 0.469451904296875, 0.4871826171875, 0.504913330078125, 0.52264404296875, 0.540374755859375, 0.55810546875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 7.0, 9.0, 20.0, 18.0, 32.0, 43.0, 54.0, 111.0, 171.0, 352.0, 590.0, 1224.0, 2660.0, 7148.0, 30185.0, 325138.0, 598905.0, 63870.0, 10868.0, 3647.0, 1596.0, 786.0, 437.0, 232.0, 152.0, 94.0, 57.0, 32.0, 31.0, 23.0, 20.0, 8.0, 5.0, 1.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.15576171875, -0.15092086791992188, -0.14608001708984375, -0.14123916625976562, -0.1363983154296875, -0.13155746459960938, -0.12671661376953125, -0.12187576293945312, -0.117034912109375, -0.11219406127929688, -0.10735321044921875, -0.10251235961914062, -0.0976715087890625, -0.09283065795898438, -0.08798980712890625, -0.08314895629882812, -0.07830810546875, -0.07346725463867188, -0.06862640380859375, -0.06378555297851562, -0.0589447021484375, -0.054103851318359375, -0.04926300048828125, -0.044422149658203125, -0.039581298828125, -0.034740447998046875, -0.02989959716796875, -0.025058746337890625, -0.0202178955078125, -0.015377044677734375, -0.01053619384765625, -0.005695343017578125, -0.0008544921875, 0.003986358642578125, 0.00882720947265625, 0.013668060302734375, 0.0185089111328125, 0.023349761962890625, 0.02819061279296875, 0.033031463623046875, 0.037872314453125, 0.042713165283203125, 0.04755401611328125, 0.052394866943359375, 0.0572357177734375, 0.062076568603515625, 0.06691741943359375, 0.07175827026367188, 0.07659912109375, 0.08143997192382812, 0.08628082275390625, 0.09112167358398438, 0.0959625244140625, 0.10080337524414062, 0.10564422607421875, 0.11048507690429688, 0.115325927734375, 0.12016677856445312, 0.12500762939453125, 0.12984848022460938, 0.1346893310546875, 0.13953018188476562, 0.14437103271484375, 0.14921188354492188, 0.154052734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 6.0, 10.0, 12.0, 13.0, 14.0, 16.0, 20.0, 15.0, 14.0, 29.0, 25.0, 32.0, 32.0, 30.0, 42.0, 37.0, 37.0, 40.0, 44.0, 41.0, 45.0, 45.0, 42.0, 29.0, 39.0, 41.0, 28.0, 27.0, 31.0, 22.0, 18.0, 13.0, 9.0, 17.0, 17.0, 14.0, 10.0, 8.0, 7.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.70263671875, -0.6811752319335938, -0.6597137451171875, -0.6382522583007812, -0.616790771484375, -0.5953292846679688, -0.5738677978515625, -0.5524063110351562, -0.53094482421875, -0.5094833374023438, -0.4880218505859375, -0.46656036376953125, -0.445098876953125, -0.42363739013671875, -0.4021759033203125, -0.38071441650390625, -0.3592529296875, -0.33779144287109375, -0.3163299560546875, -0.29486846923828125, -0.273406982421875, -0.25194549560546875, -0.2304840087890625, -0.20902252197265625, -0.18756103515625, -0.16609954833984375, -0.1446380615234375, -0.12317657470703125, -0.101715087890625, -0.08025360107421875, -0.0587921142578125, -0.03733062744140625, -0.015869140625, 0.00559234619140625, 0.0270538330078125, 0.04851531982421875, 0.069976806640625, 0.09143829345703125, 0.1128997802734375, 0.13436126708984375, 0.15582275390625, 0.17728424072265625, 0.1987457275390625, 0.22020721435546875, 0.241668701171875, 0.26313018798828125, 0.2845916748046875, 0.30605316162109375, 0.3275146484375, 0.34897613525390625, 0.3704376220703125, 0.39189910888671875, 0.413360595703125, 0.43482208251953125, 0.4562835693359375, 0.47774505615234375, 0.49920654296875, 0.5206680297851562, 0.5421295166015625, 0.5635910034179688, 0.585052490234375, 0.6065139770507812, 0.6279754638671875, 0.6494369506835938, 0.6708984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 19.0, 27.0, 44.0, 72.0, 130.0, 199.0, 352.0, 750.0, 1766.0, 4843.0, 17723.0, 244972.0, 728433.0, 37134.0, 7472.0, 2444.0, 1032.0, 485.0, 258.0, 147.0, 84.0, 57.0, 34.0, 19.0, 17.0, 6.0, 4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1334228515625, -0.13010311126708984, -0.1267833709716797, -0.12346363067626953, -0.12014389038085938, -0.11682415008544922, -0.11350440979003906, -0.1101846694946289, -0.10686492919921875, -0.1035451889038086, -0.10022544860839844, -0.09690570831298828, -0.09358596801757812, -0.09026622772216797, -0.08694648742675781, -0.08362674713134766, -0.0803070068359375, -0.07698726654052734, -0.07366752624511719, -0.07034778594970703, -0.06702804565429688, -0.06370830535888672, -0.06038856506347656, -0.057068824768066406, -0.05374908447265625, -0.050429344177246094, -0.04710960388183594, -0.04378986358642578, -0.040470123291015625, -0.03715038299560547, -0.03383064270019531, -0.030510902404785156, -0.027191162109375, -0.023871421813964844, -0.020551681518554688, -0.01723194122314453, -0.013912200927734375, -0.010592460632324219, -0.0072727203369140625, -0.003952980041503906, -0.00063323974609375, 0.0026865005493164062, 0.0060062408447265625, 0.009325981140136719, 0.012645721435546875, 0.01596546173095703, 0.019285202026367188, 0.022604942321777344, 0.0259246826171875, 0.029244422912597656, 0.03256416320800781, 0.03588390350341797, 0.039203643798828125, 0.04252338409423828, 0.04584312438964844, 0.049162864685058594, 0.05248260498046875, 0.055802345275878906, 0.05912208557128906, 0.06244182586669922, 0.06576156616210938, 0.06908130645751953, 0.07240104675292969, 0.07572078704833984, 0.07904052734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 10.0, 12.0, 28.0, 64.0, 144.0, 247.0, 236.0, 140.0, 60.0, 28.0, 9.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.823373794555664e-05, -5.590450018644333e-05, -5.357526242733002e-05, -5.1246024668216705e-05, -4.8916786909103394e-05, -4.658754914999008e-05, -4.425831139087677e-05, -4.192907363176346e-05, -3.9599835872650146e-05, -3.7270598113536835e-05, -3.494136035442352e-05, -3.261212259531021e-05, -3.02828848361969e-05, -2.7953647077083588e-05, -2.5624409317970276e-05, -2.3295171558856964e-05, -2.0965933799743652e-05, -1.863669604063034e-05, -1.630745828151703e-05, -1.3978220522403717e-05, -1.1648982763290405e-05, -9.319745004177094e-06, -6.990507245063782e-06, -4.66126948595047e-06, -2.332031726837158e-06, -2.7939677238464355e-09, 2.3264437913894653e-06, 4.655681550502777e-06, 6.984919309616089e-06, 9.3141570687294e-06, 1.1643394827842712e-05, 1.3972632586956024e-05, 1.6301870346069336e-05, 1.8631108105182648e-05, 2.096034586429596e-05, 2.328958362340927e-05, 2.5618821382522583e-05, 2.7948059141635895e-05, 3.0277296900749207e-05, 3.260653465986252e-05, 3.493577241897583e-05, 3.726501017808914e-05, 3.9594247937202454e-05, 4.1923485696315765e-05, 4.425272345542908e-05, 4.658196121454239e-05, 4.89111989736557e-05, 5.124043673276901e-05, 5.3569674491882324e-05, 5.5898912250995636e-05, 5.822815001010895e-05, 6.055738776922226e-05, 6.288662552833557e-05, 6.521586328744888e-05, 6.75451010465622e-05, 6.98743388056755e-05, 7.220357656478882e-05, 7.453281432390213e-05, 7.686205208301544e-05, 7.919128984212875e-05, 8.152052760124207e-05, 8.384976536035538e-05, 8.617900311946869e-05, 8.8508240878582e-05, 9.083747863769531e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 11.0, 20.0, 21.0, 32.0, 28.0, 74.0, 79.0, 124.0, 175.0, 306.0, 433.0, 803.0, 1334.0, 2337.0, 4465.0, 9277.0, 25771.0, 112494.0, 525678.0, 284047.0, 51739.0, 15302.0, 6316.0, 3139.0, 1822.0, 1066.0, 593.0, 353.0, 221.0, 154.0, 113.0, 65.0, 41.0, 23.0, 25.0, 21.0, 12.0, 9.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06390380859375, -0.061953067779541016, -0.06000232696533203, -0.05805158615112305, -0.05610084533691406, -0.05415010452270508, -0.052199363708496094, -0.05024862289428711, -0.048297882080078125, -0.04634714126586914, -0.044396400451660156, -0.04244565963745117, -0.04049491882324219, -0.0385441780090332, -0.03659343719482422, -0.034642696380615234, -0.03269195556640625, -0.030741214752197266, -0.02879047393798828, -0.026839733123779297, -0.024888992309570312, -0.022938251495361328, -0.020987510681152344, -0.01903676986694336, -0.017086029052734375, -0.01513528823852539, -0.013184547424316406, -0.011233806610107422, -0.009283065795898438, -0.007332324981689453, -0.005381584167480469, -0.0034308433532714844, -0.0014801025390625, 0.0004706382751464844, 0.0024213790893554688, 0.004372119903564453, 0.0063228607177734375, 0.008273601531982422, 0.010224342346191406, 0.01217508316040039, 0.014125823974609375, 0.01607656478881836, 0.018027305603027344, 0.019978046417236328, 0.021928787231445312, 0.023879528045654297, 0.02583026885986328, 0.027781009674072266, 0.02973175048828125, 0.031682491302490234, 0.03363323211669922, 0.0355839729309082, 0.03753471374511719, 0.03948545455932617, 0.041436195373535156, 0.04338693618774414, 0.045337677001953125, 0.04728841781616211, 0.049239158630371094, 0.05118989944458008, 0.05314064025878906, 0.05509138107299805, 0.05704212188720703, 0.058992862701416016, 0.060943603515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 6.0, 13.0, 24.0, 20.0, 26.0, 27.0, 56.0, 57.0, 88.0, 103.0, 105.0, 89.0, 93.0, 63.0, 53.0, 30.0, 26.0, 22.0, 13.0, 15.0, 10.0, 8.0, 4.0, 8.0, 6.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016693115234375, -0.0161287784576416, -0.015564441680908203, -0.015000104904174805, -0.014435768127441406, -0.013871431350708008, -0.01330709457397461, -0.012742757797241211, -0.012178421020507812, -0.011614084243774414, -0.011049747467041016, -0.010485410690307617, -0.009921073913574219, -0.00935673713684082, -0.008792400360107422, -0.008228063583374023, -0.007663726806640625, -0.0070993900299072266, -0.006535053253173828, -0.00597071647644043, -0.005406379699707031, -0.004842042922973633, -0.004277706146240234, -0.003713369369506836, -0.0031490325927734375, -0.002584695816040039, -0.0020203590393066406, -0.0014560222625732422, -0.0008916854858398438, -0.0003273487091064453, 0.00023698806762695312, 0.0008013248443603516, 0.00136566162109375, 0.0019299983978271484, 0.002494335174560547, 0.0030586719512939453, 0.0036230087280273438, 0.004187345504760742, 0.004751682281494141, 0.005316019058227539, 0.0058803558349609375, 0.006444692611694336, 0.007009029388427734, 0.007573366165161133, 0.008137702941894531, 0.00870203971862793, 0.009266376495361328, 0.009830713272094727, 0.010395050048828125, 0.010959386825561523, 0.011523723602294922, 0.01208806037902832, 0.012652397155761719, 0.013216733932495117, 0.013781070709228516, 0.014345407485961914, 0.014909744262695312, 0.015474081039428711, 0.01603841781616211, 0.016602754592895508, 0.017167091369628906, 0.017731428146362305, 0.018295764923095703, 0.0188601016998291, 0.0194244384765625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 11.0, 6.0, 11.0, 22.0, 28.0, 50.0, 81.0, 131.0, 187.0, 161.0, 136.0, 63.0, 53.0, 22.0, 9.0, 11.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7142701745033264, -0.6817948818206787, -0.649319589138031, -0.6168442964553833, -0.5843690633773804, -0.5518937110900879, -0.519418478012085, -0.48694318532943726, -0.45446789264678955, -0.42199259996414185, -0.38951730728149414, -0.3570420444011688, -0.3245667517185211, -0.2920914590358734, -0.2596161961555481, -0.2271409034729004, -0.19466561079025269, -0.16219031810760498, -0.12971504032611847, -0.09723975509405136, -0.06476446986198425, -0.03228917717933655, 0.00018610060214996338, 0.032661378383636475, 0.06513667106628418, 0.09761195629835129, 0.1300872415304184, 0.1625625193119049, 0.1950378119945526, 0.22751310467720032, 0.25998836755752563, 0.29246366024017334, 0.32493889331817627, 0.357414186000824, 0.3898894786834717, 0.422364741563797, 0.4548400342464447, 0.4873153269290924, 0.5197905898094177, 0.5522658824920654, 0.5847411751747131, 0.6172164678573608, 0.6496917605400085, 0.6821670532226562, 0.7146422863006592, 0.7471176385879517, 0.7795928716659546, 0.8120681643486023, 0.84454345703125, 0.8770187497138977, 0.9094940423965454, 0.9419693350791931, 0.9744446277618408, 1.0069198608398438, 1.0393952131271362, 1.0718704462051392, 1.1043457984924316, 1.1368210315704346, 1.169296383857727, 1.20177161693573, 1.2342469692230225, 1.2667222023010254, 1.2991975545883179, 1.3316727876663208, 1.3641480207443237]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 3.0, 3.0, 10.0, 17.0, 14.0, 12.0, 23.0, 29.0, 36.0, 44.0, 39.0, 68.0, 73.0, 74.0, 67.0, 34.0, 57.0, 63.0, 52.0, 57.0, 54.0, 33.0, 28.0, 26.0, 18.0, 19.0, 8.0, 12.0, 9.0, 7.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.5238039493560791, -0.50897616147995, -0.4941483438014984, -0.4793205261230469, -0.4644927382469177, -0.4496649205684662, -0.43483710289001465, -0.4200093150138855, -0.40518152713775635, -0.3903537094593048, -0.37552592158317566, -0.3606981039047241, -0.34587031602859497, -0.33104249835014343, -0.3162146806716919, -0.30138689279556274, -0.2865590751171112, -0.27173125743865967, -0.2569034695625305, -0.24207565188407898, -0.22724786400794983, -0.2124200463294983, -0.19759224355220795, -0.1827644407749176, -0.16793663799762726, -0.15310883522033691, -0.13828103244304657, -0.12345322221517563, -0.10862541943788528, -0.09379761666059494, -0.078969806432724, -0.06414200365543365, -0.0493142306804657, -0.034486427903175354, -0.01965862140059471, -0.004830814898014069, 0.009996987879276276, 0.02482479065656662, 0.03965260088443756, 0.054480403661727905, 0.06930820643901825, 0.0841360092163086, 0.09896381199359894, 0.11379162222146988, 0.12861943244934082, 0.14344722032546997, 0.1582750380039215, 0.17310284078121185, 0.1879306435585022, 0.20275844633579254, 0.21758624911308289, 0.23241406679153442, 0.24724185466766357, 0.2620696723461151, 0.27689749002456665, 0.2917252779006958, 0.30655306577682495, 0.3213808834552765, 0.33620867133140564, 0.3510364890098572, 0.36586427688598633, 0.38069209456443787, 0.3955199122428894, 0.41034770011901855, 0.4251755177974701]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 7.0, 12.0, 22.0, 22.0, 33.0, 32.0, 57.0, 97.0, 160.0, 218.0, 344.0, 578.0, 1012.0, 1853.0, 3962.0, 8435.0, 20297.0, 54946.0, 205963.0, 570509.0, 115488.0, 36955.0, 14713.0, 6242.0, 2882.0, 1593.0, 806.0, 470.0, 268.0, 181.0, 117.0, 61.0, 52.0, 31.0, 33.0, 27.0, 20.0, 17.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.35498046875, -0.344635009765625, -0.33428955078125, -0.323944091796875, -0.3135986328125, -0.303253173828125, -0.29290771484375, -0.282562255859375, -0.272216796875, -0.261871337890625, -0.25152587890625, -0.241180419921875, -0.2308349609375, -0.220489501953125, -0.21014404296875, -0.199798583984375, -0.189453125, -0.179107666015625, -0.16876220703125, -0.158416748046875, -0.1480712890625, -0.137725830078125, -0.12738037109375, -0.117034912109375, -0.106689453125, -0.096343994140625, -0.08599853515625, -0.075653076171875, -0.0653076171875, -0.054962158203125, -0.04461669921875, -0.034271240234375, -0.02392578125, -0.013580322265625, -0.00323486328125, 0.007110595703125, 0.0174560546875, 0.027801513671875, 0.03814697265625, 0.048492431640625, 0.058837890625, 0.069183349609375, 0.07952880859375, 0.089874267578125, 0.1002197265625, 0.110565185546875, 0.12091064453125, 0.131256103515625, 0.1416015625, 0.151947021484375, 0.16229248046875, 0.172637939453125, 0.1829833984375, 0.193328857421875, 0.20367431640625, 0.214019775390625, 0.224365234375, 0.234710693359375, 0.24505615234375, 0.255401611328125, 0.2657470703125, 0.276092529296875, 0.28643798828125, 0.296783447265625, 0.30712890625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 7.0, 6.0, 6.0, 10.0, 13.0, 11.0, 27.0, 18.0, 32.0, 29.0, 36.0, 44.0, 42.0, 56.0, 50.0, 53.0, 52.0, 52.0, 49.0, 57.0, 37.0, 37.0, 42.0, 29.0, 44.0, 25.0, 24.0, 15.0, 18.0, 14.0, 10.0, 10.0, 5.0, 8.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8671875, -0.8422927856445312, -0.8173980712890625, -0.7925033569335938, -0.767608642578125, -0.7427139282226562, -0.7178192138671875, -0.6929244995117188, -0.66802978515625, -0.6431350708007812, -0.6182403564453125, -0.5933456420898438, -0.568450927734375, -0.5435562133789062, -0.5186614990234375, -0.49376678466796875, -0.4688720703125, -0.44397735595703125, -0.4190826416015625, -0.39418792724609375, -0.369293212890625, -0.34439849853515625, -0.3195037841796875, -0.29460906982421875, -0.26971435546875, -0.24481964111328125, -0.2199249267578125, -0.19503021240234375, -0.170135498046875, -0.14524078369140625, -0.1203460693359375, -0.09545135498046875, -0.070556640625, -0.04566192626953125, -0.0207672119140625, 0.00412750244140625, 0.029022216796875, 0.05391693115234375, 0.0788116455078125, 0.10370635986328125, 0.12860107421875, 0.15349578857421875, 0.1783905029296875, 0.20328521728515625, 0.228179931640625, 0.25307464599609375, 0.2779693603515625, 0.30286407470703125, 0.3277587890625, 0.35265350341796875, 0.3775482177734375, 0.40244293212890625, 0.427337646484375, 0.45223236083984375, 0.4771270751953125, 0.5020217895507812, 0.52691650390625, 0.5518112182617188, 0.5767059326171875, 0.6016006469726562, 0.626495361328125, 0.6513900756835938, 0.6762847900390625, 0.7011795043945312, 0.72607421875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 6.0, 7.0, 7.0, 4.0, 13.0, 14.0, 14.0, 20.0, 29.0, 44.0, 48.0, 69.0, 88.0, 146.0, 256.0, 587.0, 1886.0, 12416.0, 165786.0, 821526.0, 38907.0, 4682.0, 1021.0, 380.0, 166.0, 119.0, 77.0, 49.0, 47.0, 32.0, 23.0, 19.0, 12.0, 10.0, 9.0, 5.0, 11.0, 7.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.80078125, -0.7766952514648438, -0.7526092529296875, -0.7285232543945312, -0.704437255859375, -0.6803512573242188, -0.6562652587890625, -0.6321792602539062, -0.60809326171875, -0.5840072631835938, -0.5599212646484375, -0.5358352661132812, -0.511749267578125, -0.48766326904296875, -0.4635772705078125, -0.43949127197265625, -0.4154052734375, -0.39131927490234375, -0.3672332763671875, -0.34314727783203125, -0.319061279296875, -0.29497528076171875, -0.2708892822265625, -0.24680328369140625, -0.22271728515625, -0.19863128662109375, -0.1745452880859375, -0.15045928955078125, -0.126373291015625, -0.10228729248046875, -0.0782012939453125, -0.05411529541015625, -0.030029296875, -0.00594329833984375, 0.0181427001953125, 0.04222869873046875, 0.066314697265625, 0.09040069580078125, 0.1144866943359375, 0.13857269287109375, 0.16265869140625, 0.18674468994140625, 0.2108306884765625, 0.23491668701171875, 0.259002685546875, 0.28308868408203125, 0.3071746826171875, 0.33126068115234375, 0.3553466796875, 0.37943267822265625, 0.4035186767578125, 0.42760467529296875, 0.451690673828125, 0.47577667236328125, 0.4998626708984375, 0.5239486694335938, 0.54803466796875, 0.5721206665039062, 0.5962066650390625, 0.6202926635742188, 0.644378662109375, 0.6684646606445312, 0.6925506591796875, 0.7166366577148438, 0.74072265625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 6.0, 9.0, 14.0, 9.0, 12.0, 23.0, 18.0, 22.0, 33.0, 34.0, 39.0, 35.0, 40.0, 42.0, 46.0, 56.0, 60.0, 36.0, 53.0, 48.0, 52.0, 47.0, 41.0, 21.0, 26.0, 19.0, 20.0, 20.0, 13.0, 19.0, 15.0, 12.0, 9.0, 10.0, 9.0, 1.0, 7.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.873046875, -0.84375, -0.814453125, -0.78515625, -0.755859375, -0.7265625, -0.697265625, -0.66796875, -0.638671875, -0.609375, -0.580078125, -0.55078125, -0.521484375, -0.4921875, -0.462890625, -0.43359375, -0.404296875, -0.375, -0.345703125, -0.31640625, -0.287109375, -0.2578125, -0.228515625, -0.19921875, -0.169921875, -0.140625, -0.111328125, -0.08203125, -0.052734375, -0.0234375, 0.005859375, 0.03515625, 0.064453125, 0.09375, 0.123046875, 0.15234375, 0.181640625, 0.2109375, 0.240234375, 0.26953125, 0.298828125, 0.328125, 0.357421875, 0.38671875, 0.416015625, 0.4453125, 0.474609375, 0.50390625, 0.533203125, 0.5625, 0.591796875, 0.62109375, 0.650390625, 0.6796875, 0.708984375, 0.73828125, 0.767578125, 0.796875, 0.826171875, 0.85546875, 0.884765625, 0.9140625, 0.943359375, 0.97265625, 1.001953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 11.0, 11.0, 15.0, 25.0, 40.0, 64.0, 116.0, 174.0, 293.0, 593.0, 1133.0, 3165.0, 12246.0, 77898.0, 788594.0, 138367.0, 18494.0, 4230.0, 1436.0, 734.0, 369.0, 178.0, 123.0, 86.0, 39.0, 35.0, 27.0, 12.0, 8.0, 11.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193359375, -0.18683242797851562, -0.18030548095703125, -0.17377853393554688, -0.1672515869140625, -0.16072463989257812, -0.15419769287109375, -0.14767074584960938, -0.141143798828125, -0.13461685180664062, -0.12808990478515625, -0.12156295776367188, -0.1150360107421875, -0.10850906372070312, -0.10198211669921875, -0.09545516967773438, -0.08892822265625, -0.08240127563476562, -0.07587432861328125, -0.06934738159179688, -0.0628204345703125, -0.056293487548828125, -0.04976654052734375, -0.043239593505859375, -0.036712646484375, -0.030185699462890625, -0.02365875244140625, -0.017131805419921875, -0.0106048583984375, -0.004077911376953125, 0.00244903564453125, 0.008975982666015625, 0.0155029296875, 0.022029876708984375, 0.02855682373046875, 0.035083770751953125, 0.0416107177734375, 0.048137664794921875, 0.05466461181640625, 0.061191558837890625, 0.067718505859375, 0.07424545288085938, 0.08077239990234375, 0.08729934692382812, 0.0938262939453125, 0.10035324096679688, 0.10688018798828125, 0.11340713500976562, 0.11993408203125, 0.12646102905273438, 0.13298797607421875, 0.13951492309570312, 0.1460418701171875, 0.15256881713867188, 0.15909576416015625, 0.16562271118164062, 0.172149658203125, 0.17867660522460938, 0.18520355224609375, 0.19173049926757812, 0.1982574462890625, 0.20478439331054688, 0.21131134033203125, 0.21783828735351562, 0.224365234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 5.0, 6.0, 6.0, 12.0, 11.0, 19.0, 23.0, 29.0, 43.0, 64.0, 88.0, 157.0, 180.0, 88.0, 61.0, 52.0, 32.0, 29.0, 21.0, 20.0, 8.0, 9.0, 10.0, 10.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.5093555450439453e-05, -2.4335458874702454e-05, -2.3577362298965454e-05, -2.2819265723228455e-05, -2.2061169147491455e-05, -2.1303072571754456e-05, -2.0544975996017456e-05, -1.9786879420280457e-05, -1.9028782844543457e-05, -1.8270686268806458e-05, -1.7512589693069458e-05, -1.675449311733246e-05, -1.599639654159546e-05, -1.523829996585846e-05, -1.448020339012146e-05, -1.372210681438446e-05, -1.2964010238647461e-05, -1.2205913662910461e-05, -1.1447817087173462e-05, -1.0689720511436462e-05, -9.931623935699463e-06, -9.173527359962463e-06, -8.415430784225464e-06, -7.657334208488464e-06, -6.899237632751465e-06, -6.141141057014465e-06, -5.383044481277466e-06, -4.624947905540466e-06, -3.866851329803467e-06, -3.1087547540664673e-06, -2.3506581783294678e-06, -1.5925616025924683e-06, -8.344650268554688e-07, -7.636845111846924e-08, 6.817281246185303e-07, 1.4398247003555298e-06, 2.1979212760925293e-06, 2.956017851829529e-06, 3.7141144275665283e-06, 4.472211003303528e-06, 5.230307579040527e-06, 5.988404154777527e-06, 6.746500730514526e-06, 7.504597306251526e-06, 8.262693881988525e-06, 9.020790457725525e-06, 9.778887033462524e-06, 1.0536983609199524e-05, 1.1295080184936523e-05, 1.2053176760673523e-05, 1.2811273336410522e-05, 1.3569369912147522e-05, 1.4327466487884521e-05, 1.5085563063621521e-05, 1.584365963935852e-05, 1.660175621509552e-05, 1.735985279083252e-05, 1.811794936656952e-05, 1.887604594230652e-05, 1.9634142518043518e-05, 2.0392239093780518e-05, 2.1150335669517517e-05, 2.1908432245254517e-05, 2.2666528820991516e-05, 2.3424625396728516e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 14.0, 11.0, 16.0, 30.0, 28.0, 38.0, 74.0, 94.0, 164.0, 296.0, 707.0, 1842.0, 6249.0, 30722.0, 225918.0, 705903.0, 60811.0, 10816.0, 2825.0, 981.0, 433.0, 224.0, 126.0, 72.0, 46.0, 23.0, 24.0, 18.0, 8.0, 7.0, 6.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.194580078125, -0.18813514709472656, -0.18169021606445312, -0.1752452850341797, -0.16880035400390625, -0.1623554229736328, -0.15591049194335938, -0.14946556091308594, -0.1430206298828125, -0.13657569885253906, -0.13013076782226562, -0.12368583679199219, -0.11724090576171875, -0.11079597473144531, -0.10435104370117188, -0.09790611267089844, -0.091461181640625, -0.08501625061035156, -0.07857131958007812, -0.07212638854980469, -0.06568145751953125, -0.05923652648925781, -0.052791595458984375, -0.04634666442871094, -0.0399017333984375, -0.03345680236816406, -0.027011871337890625, -0.020566940307617188, -0.01412200927734375, -0.0076770782470703125, -0.001232147216796875, 0.0052127838134765625, 0.01165771484375, 0.018102645874023438, 0.024547576904296875, 0.030992507934570312, 0.03743743896484375, 0.04388236999511719, 0.050327301025390625, 0.05677223205566406, 0.0632171630859375, 0.06966209411621094, 0.07610702514648438, 0.08255195617675781, 0.08899688720703125, 0.09544181823730469, 0.10188674926757812, 0.10833168029785156, 0.114776611328125, 0.12122154235839844, 0.12766647338867188, 0.1341114044189453, 0.14055633544921875, 0.1470012664794922, 0.15344619750976562, 0.15989112854003906, 0.1663360595703125, 0.17278099060058594, 0.17922592163085938, 0.1856708526611328, 0.19211578369140625, 0.1985607147216797, 0.20500564575195312, 0.21145057678222656, 0.2178955078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 5.0, 7.0, 15.0, 14.0, 25.0, 24.0, 41.0, 71.0, 103.0, 196.0, 217.0, 85.0, 69.0, 43.0, 21.0, 18.0, 13.0, 7.0, 9.0, 6.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11785888671875, -0.11483573913574219, -0.11181259155273438, -0.10878944396972656, -0.10576629638671875, -0.10274314880371094, -0.09972000122070312, -0.09669685363769531, -0.0936737060546875, -0.09065055847167969, -0.08762741088867188, -0.08460426330566406, -0.08158111572265625, -0.07855796813964844, -0.07553482055664062, -0.07251167297363281, -0.069488525390625, -0.06646537780761719, -0.06344223022460938, -0.06041908264160156, -0.05739593505859375, -0.05437278747558594, -0.051349639892578125, -0.04832649230957031, -0.0453033447265625, -0.04228019714355469, -0.039257049560546875, -0.03623390197753906, -0.03321075439453125, -0.030187606811523438, -0.027164459228515625, -0.024141311645507812, -0.0211181640625, -0.018095016479492188, -0.015071868896484375, -0.012048721313476562, -0.00902557373046875, -0.0060024261474609375, -0.002979278564453125, 4.38690185546875e-05, 0.0030670166015625, 0.0060901641845703125, 0.009113311767578125, 0.012136459350585938, 0.01515960693359375, 0.018182754516601562, 0.021205902099609375, 0.024229049682617188, 0.027252197265625, 0.030275344848632812, 0.033298492431640625, 0.03632164001464844, 0.03934478759765625, 0.04236793518066406, 0.045391082763671875, 0.04841423034667969, 0.0514373779296875, 0.05446052551269531, 0.057483673095703125, 0.06050682067871094, 0.06352996826171875, 0.06655311584472656, 0.06957626342773438, 0.07259941101074219, 0.07562255859375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 13.0, 31.0, 111.0, 337.0, 348.0, 115.0, 30.0, 15.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1550973653793335, -0.9914608597755432, -0.8278243541717529, -0.6641878485679626, -0.5005513429641724, -0.3369148373603821, -0.1732783317565918, -0.009641766548156738, 0.15399467945098877, 0.31763118505477905, 0.48126769065856934, 0.6449041962623596, 0.8085407018661499, 0.9721772074699402, 1.1358137130737305, 1.2994502782821655, 1.463086724281311, 1.626723289489746, 1.7903597354888916, 1.953996181488037, 2.1176328659057617, 2.2812693119049072, 2.4449057579040527, 2.6085424423217773, 2.7721786499023438, 2.9358150959014893, 3.0994515419006348, 3.2630882263183594, 3.426724672317505, 3.5903611183166504, 3.753997802734375, 3.9176342487335205, 4.081271171569824, 4.244907855987549, 4.408544063568115, 4.57218074798584, 4.735816955566406, 4.899453639984131, 5.0630903244018555, 5.226726531982422, 5.3903632164001465, 5.553999900817871, 5.7176361083984375, 5.881272792816162, 6.044909477233887, 6.208545684814453, 6.372182369232178, 6.535819053649902, 6.699455261230469, 6.863091945648193, 7.02672815322876, 7.190364837646484, 7.354001045227051, 7.517637729644775, 7.6812744140625, 7.844910621643066, 8.008546829223633, 8.1721830368042, 8.335820198059082, 8.499456405639648, 8.663092613220215, 8.826729774475098, 8.990365982055664, 9.15400218963623, 9.317639350891113]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 9.0, 5.0, 8.0, 3.0, 8.0, 8.0, 13.0, 10.0, 18.0, 18.0, 19.0, 14.0, 26.0, 16.0, 17.0, 36.0, 31.0, 38.0, 35.0, 25.0, 38.0, 48.0, 29.0, 42.0, 44.0, 34.0, 37.0, 44.0, 30.0, 34.0, 23.0, 35.0, 17.0, 21.0, 27.0, 24.0, 19.0, 15.0, 9.0, 11.0, 16.0, 12.0, 3.0, 4.0, 6.0, 4.0, 6.0, 1.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.2128617763519287, -1.1747461557388306, -1.1366304159164429, -1.0985147953033447, -1.0603991746902466, -1.0222835540771484, -0.9841678142547607, -0.9460521936416626, -0.9079365134239197, -0.8698208332061768, -0.8317052125930786, -0.7935895323753357, -0.7554738521575928, -0.7173582315444946, -0.6792425513267517, -0.6411268711090088, -0.6030112504959106, -0.5648955702781677, -0.5267799496650696, -0.48866426944732666, -0.45054861903190613, -0.4124329686164856, -0.3743172883987427, -0.33620163798332214, -0.2980859875679016, -0.2599703371524811, -0.22185467183589935, -0.18373900651931763, -0.1456233561038971, -0.10750770568847656, -0.06939204037189484, -0.03127637505531311, 0.006839156150817871, 0.044954814016819, 0.08307047188282013, 0.12118612974882126, 0.1593017876148224, 0.19741743803024292, 0.23553310334682465, 0.27364876866340637, 0.3117644190788269, 0.34988006949424744, 0.38799571990966797, 0.4261114001274109, 0.4642270505428314, 0.502342700958252, 0.5404583811759949, 0.5785740613937378, 0.6166896820068359, 0.6548053622245789, 0.692920982837677, 0.7310366630554199, 0.7691522836685181, 0.807267963886261, 0.8453836441040039, 0.883499264717102, 0.921614944934845, 0.9597306251525879, 0.997846245765686, 1.0359618663787842, 1.0740776062011719, 1.11219322681427, 1.1503088474273682, 1.1884245872497559, 1.226540207862854]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 7.0, 6.0, 12.0, 13.0, 6.0, 9.0, 18.0, 15.0, 13.0, 26.0, 23.0, 41.0, 46.0, 70.0, 130.0, 224.0, 448.0, 1246.0, 3732.0, 16269.0, 143703.0, 3602007.0, 390988.0, 26474.0, 5503.0, 1718.0, 672.0, 338.0, 154.0, 83.0, 57.0, 49.0, 26.0, 26.0, 9.0, 16.0, 17.0, 15.0, 12.0, 11.0, 10.0, 9.0, 9.0, 3.0, 7.0, 4.0, 1.0, 3.0, 0.0, 3.0], "bins": [-1.408203125, -1.3686981201171875, -1.329193115234375, -1.2896881103515625, -1.25018310546875, -1.2106781005859375, -1.171173095703125, -1.1316680908203125, -1.0921630859375, -1.0526580810546875, -1.013153076171875, -0.9736480712890625, -0.93414306640625, -0.8946380615234375, -0.855133056640625, -0.8156280517578125, -0.776123046875, -0.7366180419921875, -0.697113037109375, -0.6576080322265625, -0.61810302734375, -0.5785980224609375, -0.539093017578125, -0.4995880126953125, -0.4600830078125, -0.4205780029296875, -0.381072998046875, -0.3415679931640625, -0.30206298828125, -0.2625579833984375, -0.223052978515625, -0.1835479736328125, -0.14404296875, -0.1045379638671875, -0.065032958984375, -0.0255279541015625, 0.01397705078125, 0.0534820556640625, 0.092987060546875, 0.1324920654296875, 0.1719970703125, 0.2115020751953125, 0.251007080078125, 0.2905120849609375, 0.33001708984375, 0.3695220947265625, 0.409027099609375, 0.4485321044921875, 0.488037109375, 0.5275421142578125, 0.567047119140625, 0.6065521240234375, 0.64605712890625, 0.6855621337890625, 0.725067138671875, 0.7645721435546875, 0.8040771484375, 0.8435821533203125, 0.883087158203125, 0.9225921630859375, 0.96209716796875, 1.0016021728515625, 1.041107177734375, 1.0806121826171875, 1.1201171875]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 5.0, 9.0, 9.0, 13.0, 24.0, 24.0, 31.0, 39.0, 52.0, 61.0, 67.0, 70.0, 62.0, 53.0, 72.0, 60.0, 54.0, 60.0, 52.0, 39.0, 26.0, 19.0, 22.0, 10.0, 19.0, 10.0, 7.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62060546875, -0.6036186218261719, -0.5866317749023438, -0.5696449279785156, -0.5526580810546875, -0.5356712341308594, -0.5186843872070312, -0.5016975402832031, -0.484710693359375, -0.4677238464355469, -0.45073699951171875, -0.4337501525878906, -0.4167633056640625, -0.3997764587402344, -0.38278961181640625, -0.3658027648925781, -0.34881591796875, -0.3318290710449219, -0.31484222412109375, -0.2978553771972656, -0.2808685302734375, -0.2638816833496094, -0.24689483642578125, -0.22990798950195312, -0.212921142578125, -0.19593429565429688, -0.17894744873046875, -0.16196060180664062, -0.1449737548828125, -0.12798690795898438, -0.11100006103515625, -0.09401321411132812, -0.0770263671875, -0.060039520263671875, -0.04305267333984375, -0.026065826416015625, -0.0090789794921875, 0.007907867431640625, 0.02489471435546875, 0.041881561279296875, 0.058868408203125, 0.07585525512695312, 0.09284210205078125, 0.10982894897460938, 0.1268157958984375, 0.14380264282226562, 0.16078948974609375, 0.17777633666992188, 0.19476318359375, 0.21175003051757812, 0.22873687744140625, 0.24572372436523438, 0.2627105712890625, 0.2796974182128906, 0.29668426513671875, 0.3136711120605469, 0.330657958984375, 0.3476448059082031, 0.36463165283203125, 0.3816184997558594, 0.3986053466796875, 0.4155921936035156, 0.43257904052734375, 0.4495658874511719, 0.466552734375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 13.0, 20.0, 27.0, 43.0, 77.0, 173.0, 306.0, 534.0, 1341.0, 3784.0, 14377.0, 82398.0, 1725898.0, 2247263.0, 95217.0, 16025.0, 4105.0, 1414.0, 571.0, 277.0, 160.0, 81.0, 52.0, 40.0, 26.0, 12.0, 8.0, 9.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0205078125, -0.9886474609375, -0.956787109375, -0.9249267578125, -0.89306640625, -0.8612060546875, -0.829345703125, -0.7974853515625, -0.765625, -0.7337646484375, -0.701904296875, -0.6700439453125, -0.63818359375, -0.6063232421875, -0.574462890625, -0.5426025390625, -0.5107421875, -0.4788818359375, -0.447021484375, -0.4151611328125, -0.38330078125, -0.3514404296875, -0.319580078125, -0.2877197265625, -0.255859375, -0.2239990234375, -0.192138671875, -0.1602783203125, -0.12841796875, -0.0965576171875, -0.064697265625, -0.0328369140625, -0.0009765625, 0.0308837890625, 0.062744140625, 0.0946044921875, 0.12646484375, 0.1583251953125, 0.190185546875, 0.2220458984375, 0.25390625, 0.2857666015625, 0.317626953125, 0.3494873046875, 0.38134765625, 0.4132080078125, 0.445068359375, 0.4769287109375, 0.5087890625, 0.5406494140625, 0.572509765625, 0.6043701171875, 0.63623046875, 0.6680908203125, 0.699951171875, 0.7318115234375, 0.763671875, 0.7955322265625, 0.827392578125, 0.8592529296875, 0.89111328125, 0.9229736328125, 0.954833984375, 0.9866943359375, 1.0185546875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 5.0, 7.0, 16.0, 22.0, 20.0, 28.0, 25.0, 50.0, 53.0, 81.0, 81.0, 139.0, 203.0, 306.0, 465.0, 594.0, 582.0, 424.0, 271.0, 181.0, 132.0, 89.0, 69.0, 43.0, 45.0, 30.0, 14.0, 20.0, 13.0, 16.0, 10.0, 10.0, 5.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.1868762969970703, -0.18063735961914062, -0.17439842224121094, -0.16815948486328125, -0.16192054748535156, -0.15568161010742188, -0.1494426727294922, -0.1432037353515625, -0.1369647979736328, -0.13072586059570312, -0.12448692321777344, -0.11824798583984375, -0.11200904846191406, -0.10577011108398438, -0.09953117370605469, -0.093292236328125, -0.08705329895019531, -0.08081436157226562, -0.07457542419433594, -0.06833648681640625, -0.06209754943847656, -0.055858612060546875, -0.04961967468261719, -0.0433807373046875, -0.03714179992675781, -0.030902862548828125, -0.024663925170898438, -0.01842498779296875, -0.012186050415039062, -0.005947113037109375, 0.0002918243408203125, 0.00653076171875, 0.012769699096679688, 0.019008636474609375, 0.025247573852539062, 0.03148651123046875, 0.03772544860839844, 0.043964385986328125, 0.05020332336425781, 0.0564422607421875, 0.06268119812011719, 0.06892013549804688, 0.07515907287597656, 0.08139801025390625, 0.08763694763183594, 0.09387588500976562, 0.10011482238769531, 0.106353759765625, 0.11259269714355469, 0.11883163452148438, 0.12507057189941406, 0.13130950927734375, 0.13754844665527344, 0.14378738403320312, 0.1500263214111328, 0.1562652587890625, 0.1625041961669922, 0.16874313354492188, 0.17498207092285156, 0.18122100830078125, 0.18745994567871094, 0.19369888305664062, 0.1999378204345703, 0.2061767578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 6.0, 6.0, 13.0, 15.0, 32.0, 39.0, 75.0, 99.0, 112.0, 145.0, 116.0, 101.0, 85.0, 74.0, 47.0, 17.0, 11.0, 6.0, 0.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.925675630569458, -0.881473958492279, -0.8372722268104553, -0.7930705547332764, -0.7488688826560974, -0.7046672105789185, -0.6604654788970947, -0.6162638068199158, -0.5720621347427368, -0.5278604626655579, -0.4836587607860565, -0.4394570589065552, -0.3952553868293762, -0.3510536849498749, -0.30685198307037354, -0.2626503109931946, -0.21844857931137085, -0.1742468923330307, -0.13004520535469055, -0.08584350347518921, -0.04164181649684906, 0.002559870481491089, 0.04676157236099243, 0.09096324443817139, 0.13516494631767273, 0.17936663329601288, 0.22356832027435303, 0.26777002215385437, 0.3119717240333557, 0.35617339611053467, 0.400375097990036, 0.44457677006721497, 0.4887784719467163, 0.5329801440238953, 0.577181875705719, 0.621383547782898, 0.6655852198600769, 0.7097868919372559, 0.7539886236190796, 0.7981902956962585, 0.8423919677734375, 0.8865936398506165, 0.9307953715324402, 0.9749970436096191, 1.0191987752914429, 1.063400387763977, 1.1076021194458008, 1.151803731918335, 1.1960055828094482, 1.240207314491272, 1.2844089269638062, 1.3286106586456299, 1.3728123903274536, 1.4170140027999878, 1.4612157344818115, 1.5054173469543457, 1.5496190786361694, 1.5938208103179932, 1.6380224227905273, 1.682224154472351, 1.7264258861541748, 1.770627498626709, 1.8148292303085327, 1.8590309619903564, 1.9032325744628906]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 10.0, 2.0, 4.0, 4.0, 3.0, 14.0, 10.0, 24.0, 14.0, 20.0, 21.0, 28.0, 33.0, 39.0, 32.0, 41.0, 58.0, 57.0, 43.0, 54.0, 39.0, 58.0, 51.0, 42.0, 38.0, 38.0, 38.0, 29.0, 36.0, 21.0, 26.0, 7.0, 16.0, 11.0, 8.0, 12.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6371350288391113, -0.6192802786827087, -0.6014255881309509, -0.5835708379745483, -0.5657160878181458, -0.5478613972663879, -0.5300066471099854, -0.5121518969535828, -0.49429720640182495, -0.47644248604774475, -0.45858773589134216, -0.44073301553726196, -0.42287829518318176, -0.40502357482910156, -0.387168824672699, -0.3693141043186188, -0.3514593541622162, -0.333604633808136, -0.3157498836517334, -0.2978951632976532, -0.280040442943573, -0.2621856927871704, -0.2443309724330902, -0.22647625207901, -0.20862151682376862, -0.19076678156852722, -0.17291206121444702, -0.15505732595920563, -0.13720259070396423, -0.11934787034988403, -0.10149313509464264, -0.08363840728998184, -0.06578367948532104, -0.04792895168066025, -0.030074220150709152, -0.012219488620758057, 0.0056352391839027405, 0.023489966988563538, 0.04134470224380493, 0.05919943004846573, 0.07705415785312653, 0.09490888565778732, 0.11276361346244812, 0.13061834871768951, 0.1484730839729309, 0.1663278043270111, 0.1841825395822525, 0.2020372748374939, 0.2198919951915741, 0.2377467304468155, 0.2556014657020569, 0.2734561860561371, 0.2913109064102173, 0.3091656565666199, 0.3270203769207001, 0.3448750972747803, 0.36272984743118286, 0.38058456778526306, 0.39843931794166565, 0.41629403829574585, 0.43414875864982605, 0.45200347900390625, 0.46985822916030884, 0.48771294951438904, 0.5055676698684692]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 9.0, 14.0, 30.0, 66.0, 133.0, 321.0, 764.0, 2054.0, 6598.0, 37469.0, 880919.0, 105601.0, 9941.0, 2937.0, 994.0, 383.0, 164.0, 82.0, 33.0, 21.0, 10.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3759765625, -0.35938262939453125, -0.3427886962890625, -0.32619476318359375, -0.309600830078125, -0.29300689697265625, -0.2764129638671875, -0.25981903076171875, -0.24322509765625, -0.22663116455078125, -0.2100372314453125, -0.19344329833984375, -0.176849365234375, -0.16025543212890625, -0.1436614990234375, -0.12706756591796875, -0.1104736328125, -0.09387969970703125, -0.0772857666015625, -0.06069183349609375, -0.044097900390625, -0.02750396728515625, -0.0109100341796875, 0.00568389892578125, 0.02227783203125, 0.03887176513671875, 0.0554656982421875, 0.07205963134765625, 0.088653564453125, 0.10524749755859375, 0.1218414306640625, 0.13843536376953125, 0.155029296875, 0.17162322998046875, 0.1882171630859375, 0.20481109619140625, 0.221405029296875, 0.23799896240234375, 0.2545928955078125, 0.27118682861328125, 0.28778076171875, 0.30437469482421875, 0.3209686279296875, 0.33756256103515625, 0.354156494140625, 0.37075042724609375, 0.3873443603515625, 0.40393829345703125, 0.4205322265625, 0.43712615966796875, 0.4537200927734375, 0.47031402587890625, 0.486907958984375, 0.5035018920898438, 0.5200958251953125, 0.5366897583007812, 0.55328369140625, 0.5698776245117188, 0.5864715576171875, 0.6030654907226562, 0.619659423828125, 0.6362533569335938, 0.6528472900390625, 0.6694412231445312, 0.68603515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 14.0, 19.0, 32.0, 39.0, 67.0, 102.0, 123.0, 142.0, 127.0, 116.0, 89.0, 54.0, 33.0, 24.0, 12.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5002288818359375, -0.466278076171875, -0.4323272705078125, -0.39837646484375, -0.3644256591796875, -0.330474853515625, -0.2965240478515625, -0.2625732421875, -0.2286224365234375, -0.194671630859375, -0.1607208251953125, -0.12677001953125, -0.0928192138671875, -0.058868408203125, -0.0249176025390625, 0.009033203125, 0.0429840087890625, 0.076934814453125, 0.1108856201171875, 0.14483642578125, 0.1787872314453125, 0.212738037109375, 0.2466888427734375, 0.2806396484375, 0.3145904541015625, 0.348541259765625, 0.3824920654296875, 0.41644287109375, 0.4503936767578125, 0.484344482421875, 0.5182952880859375, 0.55224609375, 0.5861968994140625, 0.620147705078125, 0.6540985107421875, 0.68804931640625, 0.7220001220703125, 0.755950927734375, 0.7899017333984375, 0.8238525390625, 0.8578033447265625, 0.891754150390625, 0.9257049560546875, 0.95965576171875, 0.9936065673828125, 1.027557373046875, 1.0615081787109375, 1.095458984375, 1.1294097900390625, 1.163360595703125, 1.1973114013671875, 1.23126220703125, 1.2652130126953125, 1.299163818359375, 1.3331146240234375, 1.3670654296875, 1.4010162353515625, 1.434967041015625, 1.4689178466796875, 1.50286865234375, 1.5368194580078125, 1.570770263671875, 1.6047210693359375, 1.638671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 12.0, 16.0, 15.0, 21.0, 47.0, 54.0, 100.0, 188.0, 381.0, 791.0, 1832.0, 5280.0, 22936.0, 524981.0, 462536.0, 21046.0, 4920.0, 1811.0, 742.0, 354.0, 191.0, 105.0, 57.0, 28.0, 24.0, 26.0, 14.0, 10.0, 6.0, 3.0, 6.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.400634765625, -0.39035797119140625, -0.3800811767578125, -0.36980438232421875, -0.359527587890625, -0.34925079345703125, -0.3389739990234375, -0.32869720458984375, -0.31842041015625, -0.30814361572265625, -0.2978668212890625, -0.28759002685546875, -0.277313232421875, -0.26703643798828125, -0.2567596435546875, -0.24648284912109375, -0.2362060546875, -0.22592926025390625, -0.2156524658203125, -0.20537567138671875, -0.195098876953125, -0.18482208251953125, -0.1745452880859375, -0.16426849365234375, -0.15399169921875, -0.14371490478515625, -0.1334381103515625, -0.12316131591796875, -0.112884521484375, -0.10260772705078125, -0.0923309326171875, -0.08205413818359375, -0.07177734375, -0.06150054931640625, -0.0512237548828125, -0.04094696044921875, -0.030670166015625, -0.02039337158203125, -0.0101165771484375, 0.00016021728515625, 0.01043701171875, 0.02071380615234375, 0.0309906005859375, 0.04126739501953125, 0.051544189453125, 0.06182098388671875, 0.0720977783203125, 0.08237457275390625, 0.0926513671875, 0.10292816162109375, 0.1132049560546875, 0.12348175048828125, 0.133758544921875, 0.14403533935546875, 0.1543121337890625, 0.16458892822265625, 0.17486572265625, 0.18514251708984375, 0.1954193115234375, 0.20569610595703125, 0.215972900390625, 0.22624969482421875, 0.2365264892578125, 0.24680328369140625, 0.257080078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 7.0, 0.0, 1.0, 5.0, 7.0, 3.0, 2.0, 13.0, 22.0, 16.0, 16.0, 21.0, 15.0, 28.0, 31.0, 33.0, 26.0, 25.0, 37.0, 43.0, 52.0, 43.0, 39.0, 47.0, 63.0, 42.0, 44.0, 50.0, 38.0, 34.0, 34.0, 26.0, 18.0, 28.0, 14.0, 18.0, 13.0, 11.0, 9.0, 12.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89404296875, -0.8666839599609375, -0.839324951171875, -0.8119659423828125, -0.78460693359375, -0.7572479248046875, -0.729888916015625, -0.7025299072265625, -0.6751708984375, -0.6478118896484375, -0.620452880859375, -0.5930938720703125, -0.56573486328125, -0.5383758544921875, -0.511016845703125, -0.4836578369140625, -0.456298828125, -0.4289398193359375, -0.401580810546875, -0.3742218017578125, -0.34686279296875, -0.3195037841796875, -0.292144775390625, -0.2647857666015625, -0.2374267578125, -0.2100677490234375, -0.182708740234375, -0.1553497314453125, -0.12799072265625, -0.1006317138671875, -0.073272705078125, -0.0459136962890625, -0.0185546875, 0.0088043212890625, 0.036163330078125, 0.0635223388671875, 0.09088134765625, 0.1182403564453125, 0.145599365234375, 0.1729583740234375, 0.2003173828125, 0.2276763916015625, 0.255035400390625, 0.2823944091796875, 0.30975341796875, 0.3371124267578125, 0.364471435546875, 0.3918304443359375, 0.419189453125, 0.4465484619140625, 0.473907470703125, 0.5012664794921875, 0.52862548828125, 0.5559844970703125, 0.583343505859375, 0.6107025146484375, 0.6380615234375, 0.6654205322265625, 0.692779541015625, 0.7201385498046875, 0.74749755859375, 0.7748565673828125, 0.802215576171875, 0.8295745849609375, 0.85693359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 3.0, 4.0, 4.0, 0.0, 4.0, 4.0, 13.0, 25.0, 30.0, 38.0, 67.0, 108.0, 215.0, 381.0, 744.0, 1476.0, 3665.0, 9897.0, 67635.0, 863865.0, 81990.0, 11128.0, 3705.0, 1742.0, 832.0, 393.0, 201.0, 143.0, 91.0, 43.0, 35.0, 30.0, 12.0, 5.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12152099609375, -0.11740589141845703, -0.11329078674316406, -0.1091756820678711, -0.10506057739257812, -0.10094547271728516, -0.09683036804199219, -0.09271526336669922, -0.08860015869140625, -0.08448505401611328, -0.08036994934082031, -0.07625484466552734, -0.07213973999023438, -0.0680246353149414, -0.06390953063964844, -0.05979442596435547, -0.0556793212890625, -0.05156421661376953, -0.04744911193847656, -0.043334007263183594, -0.039218902587890625, -0.035103797912597656, -0.030988693237304688, -0.02687358856201172, -0.02275848388671875, -0.01864337921142578, -0.014528274536132812, -0.010413169860839844, -0.006298065185546875, -0.0021829605102539062, 0.0019321441650390625, 0.006047248840332031, 0.010162353515625, 0.014277458190917969, 0.018392562866210938, 0.022507667541503906, 0.026622772216796875, 0.030737876892089844, 0.03485298156738281, 0.03896808624267578, 0.04308319091796875, 0.04719829559326172, 0.05131340026855469, 0.055428504943847656, 0.059543609619140625, 0.0636587142944336, 0.06777381896972656, 0.07188892364501953, 0.0760040283203125, 0.08011913299560547, 0.08423423767089844, 0.0883493423461914, 0.09246444702148438, 0.09657955169677734, 0.10069465637207031, 0.10480976104736328, 0.10892486572265625, 0.11303997039794922, 0.11715507507324219, 0.12127017974853516, 0.12538528442382812, 0.1295003890991211, 0.13361549377441406, 0.13773059844970703, 0.141845703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 26.0, 24.0, 41.0, 100.0, 191.0, 253.0, 164.0, 86.0, 45.0, 20.0, 10.0, 9.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.887580871582031e-05, -4.658754914999008e-05, -4.429928958415985e-05, -4.201103001832962e-05, -3.972277045249939e-05, -3.743451088666916e-05, -3.514625132083893e-05, -3.28579917550087e-05, -3.056973218917847e-05, -2.8281472623348236e-05, -2.5993213057518005e-05, -2.3704953491687775e-05, -2.1416693925857544e-05, -1.9128434360027313e-05, -1.6840174794197083e-05, -1.4551915228366852e-05, -1.2263655662536621e-05, -9.97539609670639e-06, -7.68713653087616e-06, -5.398876965045929e-06, -3.1106173992156982e-06, -8.223578333854675e-07, 1.4659017324447632e-06, 3.754161298274994e-06, 6.042420864105225e-06, 8.330680429935455e-06, 1.0618939995765686e-05, 1.2907199561595917e-05, 1.5195459127426147e-05, 1.7483718693256378e-05, 1.977197825908661e-05, 2.206023782491684e-05, 2.434849739074707e-05, 2.66367569565773e-05, 2.8925016522407532e-05, 3.121327608823776e-05, 3.350153565406799e-05, 3.5789795219898224e-05, 3.8078054785728455e-05, 4.0366314351558685e-05, 4.2654573917388916e-05, 4.494283348321915e-05, 4.723109304904938e-05, 4.951935261487961e-05, 5.180761218070984e-05, 5.409587174654007e-05, 5.63841313123703e-05, 5.867239087820053e-05, 6.096065044403076e-05, 6.324891000986099e-05, 6.553716957569122e-05, 6.782542914152145e-05, 7.011368870735168e-05, 7.240194827318192e-05, 7.469020783901215e-05, 7.697846740484238e-05, 7.926672697067261e-05, 8.155498653650284e-05, 8.384324610233307e-05, 8.61315056681633e-05, 8.841976523399353e-05, 9.070802479982376e-05, 9.299628436565399e-05, 9.528454393148422e-05, 9.757280349731445e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 5.0, 6.0, 6.0, 8.0, 12.0, 9.0, 18.0, 30.0, 52.0, 72.0, 123.0, 202.0, 382.0, 689.0, 1332.0, 2518.0, 5365.0, 14632.0, 114166.0, 807851.0, 78848.0, 12341.0, 4882.0, 2341.0, 1203.0, 630.0, 338.0, 178.0, 111.0, 68.0, 42.0, 25.0, 14.0, 16.0, 11.0, 4.0, 5.0, 3.0, 3.0, 0.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12005615234375, -0.11567974090576172, -0.11130332946777344, -0.10692691802978516, -0.10255050659179688, -0.0981740951538086, -0.09379768371582031, -0.08942127227783203, -0.08504486083984375, -0.08066844940185547, -0.07629203796386719, -0.0719156265258789, -0.06753921508789062, -0.06316280364990234, -0.05878639221191406, -0.05440998077392578, -0.0500335693359375, -0.04565715789794922, -0.04128074645996094, -0.036904335021972656, -0.032527923583984375, -0.028151512145996094, -0.023775100708007812, -0.01939868927001953, -0.01502227783203125, -0.010645866394042969, -0.0062694549560546875, -0.0018930435180664062, 0.002483367919921875, 0.006859779357910156, 0.011236190795898438, 0.015612602233886719, 0.019989013671875, 0.02436542510986328, 0.028741836547851562, 0.033118247985839844, 0.037494659423828125, 0.041871070861816406, 0.04624748229980469, 0.05062389373779297, 0.05500030517578125, 0.05937671661376953, 0.06375312805175781, 0.0681295394897461, 0.07250595092773438, 0.07688236236572266, 0.08125877380371094, 0.08563518524169922, 0.0900115966796875, 0.09438800811767578, 0.09876441955566406, 0.10314083099365234, 0.10751724243164062, 0.1118936538696289, 0.11627006530761719, 0.12064647674560547, 0.12502288818359375, 0.12939929962158203, 0.1337757110595703, 0.1381521224975586, 0.14252853393554688, 0.14690494537353516, 0.15128135681152344, 0.15565776824951172, 0.1600341796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 7.0, 9.0, 9.0, 29.0, 54.0, 92.0, 163.0, 243.0, 142.0, 99.0, 54.0, 32.0, 21.0, 11.0, 11.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0478515625, -0.04649972915649414, -0.04514789581298828, -0.04379606246948242, -0.04244422912597656, -0.0410923957824707, -0.039740562438964844, -0.038388729095458984, -0.037036895751953125, -0.035685062408447266, -0.034333229064941406, -0.03298139572143555, -0.03162956237792969, -0.030277729034423828, -0.02892589569091797, -0.02757406234741211, -0.02622222900390625, -0.02487039566040039, -0.02351856231689453, -0.022166728973388672, -0.020814895629882812, -0.019463062286376953, -0.018111228942871094, -0.016759395599365234, -0.015407562255859375, -0.014055728912353516, -0.012703895568847656, -0.011352062225341797, -0.010000228881835938, -0.008648395538330078, -0.007296562194824219, -0.005944728851318359, -0.0045928955078125, -0.0032410621643066406, -0.0018892288208007812, -0.0005373954772949219, 0.0008144378662109375, 0.002166271209716797, 0.0035181045532226562, 0.004869937896728516, 0.006221771240234375, 0.007573604583740234, 0.008925437927246094, 0.010277271270751953, 0.011629104614257812, 0.012980937957763672, 0.014332771301269531, 0.01568460464477539, 0.01703643798828125, 0.01838827133178711, 0.01974010467529297, 0.021091938018798828, 0.022443771362304688, 0.023795604705810547, 0.025147438049316406, 0.026499271392822266, 0.027851104736328125, 0.029202938079833984, 0.030554771423339844, 0.0319066047668457, 0.03325843811035156, 0.03461027145385742, 0.03596210479736328, 0.03731393814086914, 0.038665771484375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 14.0, 17.0, 60.0, 98.0, 174.0, 208.0, 162.0, 141.0, 81.0, 24.0, 21.0, 6.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2092769145965576, -2.1588737964630127, -2.1084706783294678, -2.058067798614502, -2.007664680480957, -1.957261562347412, -1.9068584442138672, -1.8564553260803223, -1.8060522079467773, -1.7556490898132324, -1.705246090888977, -1.6548429727554321, -1.6044398546218872, -1.5540368556976318, -1.503633737564087, -1.453230619430542, -1.4028276205062866, -1.3524245023727417, -1.3020215034484863, -1.2516183853149414, -1.2012152671813965, -1.1508121490478516, -1.1004091501235962, -1.0500060319900513, -0.9996029734611511, -0.949199914932251, -0.898796796798706, -0.8483937382698059, -0.7979906797409058, -0.7475875616073608, -0.6971845030784607, -0.6467814445495605, -0.5963782072067261, -0.5459751486778259, -0.495572030544281, -0.44516897201538086, -0.3947658836841583, -0.3443627953529358, -0.29395973682403564, -0.2435566484928131, -0.19315356016159058, -0.14275047183036804, -0.0923473984003067, -0.04194432497024536, 0.008458763360977173, 0.05886185169219971, 0.10926491022109985, 0.1596679985523224, 0.21007108688354492, 0.26047417521476746, 0.31087726354599, 0.36128032207489014, 0.41168341040611267, 0.4620864987373352, 0.5124895572662354, 0.5628926753997803, 0.6132957339286804, 0.6636987924575806, 0.7141019105911255, 0.7645049691200256, 0.8149080276489258, 0.8653111457824707, 0.9157142043113708, 0.966117262840271, 1.016520380973816]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 18.0, 10.0, 23.0, 31.0, 59.0, 67.0, 92.0, 122.0, 111.0, 106.0, 108.0, 81.0, 72.0, 32.0, 27.0, 21.0, 10.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42409247159957886, -0.39540407061576843, -0.3667156994342804, -0.33802729845046997, -0.30933892726898193, -0.2806505262851715, -0.2519621253013611, -0.22327373921871185, -0.19458535313606262, -0.1658969670534134, -0.13720858097076416, -0.10852017998695374, -0.0798317939043045, -0.05114340782165527, -0.02245500683784485, 0.006233379244804382, 0.03492176532745361, 0.06361015141010284, 0.09229854494333267, 0.1209869384765625, 0.14967532455921173, 0.17836371064186096, 0.2070521116256714, 0.23574049770832062, 0.26442888379096985, 0.2931172847747803, 0.3218056559562683, 0.35049405694007874, 0.37918245792388916, 0.4078708291053772, 0.4365592300891876, 0.46524763107299805, 0.49393606185913086, 0.5226244330406189, 0.5513128638267517, 0.5800012350082397, 0.6086896061897278, 0.6373779773712158, 0.6660664081573486, 0.6947547793388367, 0.7234431505203247, 0.7521315217018127, 0.7808199524879456, 0.8095083236694336, 0.8381966948509216, 0.8668850660324097, 0.8955734968185425, 0.9242618680000305, 0.9529502987861633, 0.9816386699676514, 1.0103271007537842, 1.039015531539917, 1.0677038431167603, 1.096392273902893, 1.1250805854797363, 1.1537690162658691, 1.182457447052002, 1.2111458778381348, 1.239834189414978, 1.2685226202011108, 1.2972110509872437, 1.325899362564087, 1.3545877933502197, 1.3832762241363525, 1.4119645357131958]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 16.0, 21.0, 37.0, 52.0, 100.0, 188.0, 386.0, 778.0, 1720.0, 4500.0, 12560.0, 45914.0, 230143.0, 587627.0, 122908.0, 27576.0, 8344.0, 3213.0, 1232.0, 565.0, 290.0, 169.0, 81.0, 53.0, 18.0, 19.0, 8.0, 6.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.415283203125, -0.3974723815917969, -0.37966156005859375, -0.3618507385253906, -0.3440399169921875, -0.3262290954589844, -0.30841827392578125, -0.2906074523925781, -0.272796630859375, -0.2549858093261719, -0.23717498779296875, -0.21936416625976562, -0.2015533447265625, -0.18374252319335938, -0.16593170166015625, -0.14812088012695312, -0.13031005859375, -0.11249923706054688, -0.09468841552734375, -0.07687759399414062, -0.0590667724609375, -0.041255950927734375, -0.02344512939453125, -0.005634307861328125, 0.012176513671875, 0.029987335205078125, 0.04779815673828125, 0.06560897827148438, 0.0834197998046875, 0.10123062133789062, 0.11904144287109375, 0.13685226440429688, 0.1546630859375, 0.17247390747070312, 0.19028472900390625, 0.20809555053710938, 0.2259063720703125, 0.24371719360351562, 0.26152801513671875, 0.2793388366699219, 0.297149658203125, 0.3149604797363281, 0.33277130126953125, 0.3505821228027344, 0.3683929443359375, 0.3862037658691406, 0.40401458740234375, 0.4218254089355469, 0.43963623046875, 0.4574470520019531, 0.47525787353515625, 0.4930686950683594, 0.5108795166015625, 0.5286903381347656, 0.5465011596679688, 0.5643119812011719, 0.582122802734375, 0.5999336242675781, 0.6177444458007812, 0.6355552673339844, 0.6533660888671875, 0.6711769104003906, 0.6889877319335938, 0.7067985534667969, 0.724609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 7.0, 14.0, 21.0, 19.0, 35.0, 37.0, 65.0, 94.0, 85.0, 94.0, 100.0, 95.0, 91.0, 66.0, 55.0, 36.0, 32.0, 18.0, 11.0, 7.0, 6.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.923828125, -0.87823486328125, -0.8326416015625, -0.78704833984375, -0.741455078125, -0.69586181640625, -0.6502685546875, -0.60467529296875, -0.55908203125, -0.51348876953125, -0.4678955078125, -0.42230224609375, -0.376708984375, -0.33111572265625, -0.2855224609375, -0.23992919921875, -0.1943359375, -0.14874267578125, -0.1031494140625, -0.05755615234375, -0.011962890625, 0.03363037109375, 0.0792236328125, 0.12481689453125, 0.17041015625, 0.21600341796875, 0.2615966796875, 0.30718994140625, 0.352783203125, 0.39837646484375, 0.4439697265625, 0.48956298828125, 0.53515625, 0.58074951171875, 0.6263427734375, 0.67193603515625, 0.717529296875, 0.76312255859375, 0.8087158203125, 0.85430908203125, 0.89990234375, 0.94549560546875, 0.9910888671875, 1.03668212890625, 1.082275390625, 1.12786865234375, 1.1734619140625, 1.21905517578125, 1.2646484375, 1.31024169921875, 1.3558349609375, 1.40142822265625, 1.447021484375, 1.49261474609375, 1.5382080078125, 1.58380126953125, 1.62939453125, 1.67498779296875, 1.7205810546875, 1.76617431640625, 1.811767578125, 1.85736083984375, 1.9029541015625, 1.94854736328125, 1.994140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 9.0, 6.0, 3.0, 7.0, 10.0, 9.0, 16.0, 22.0, 33.0, 61.0, 99.0, 161.0, 362.0, 1586.0, 44203.0, 979108.0, 20997.0, 1175.0, 313.0, 128.0, 73.0, 44.0, 48.0, 25.0, 16.0, 9.0, 13.0, 5.0, 6.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9072265625, -1.846527099609375, -1.78582763671875, -1.725128173828125, -1.6644287109375, -1.603729248046875, -1.54302978515625, -1.482330322265625, -1.421630859375, -1.360931396484375, -1.30023193359375, -1.239532470703125, -1.1788330078125, -1.118133544921875, -1.05743408203125, -0.996734619140625, -0.93603515625, -0.875335693359375, -0.81463623046875, -0.753936767578125, -0.6932373046875, -0.632537841796875, -0.57183837890625, -0.511138916015625, -0.450439453125, -0.389739990234375, -0.32904052734375, -0.268341064453125, -0.2076416015625, -0.146942138671875, -0.08624267578125, -0.025543212890625, 0.03515625, 0.095855712890625, 0.15655517578125, 0.217254638671875, 0.2779541015625, 0.338653564453125, 0.39935302734375, 0.460052490234375, 0.520751953125, 0.581451416015625, 0.64215087890625, 0.702850341796875, 0.7635498046875, 0.824249267578125, 0.88494873046875, 0.945648193359375, 1.00634765625, 1.067047119140625, 1.12774658203125, 1.188446044921875, 1.2491455078125, 1.309844970703125, 1.37054443359375, 1.431243896484375, 1.491943359375, 1.552642822265625, 1.61334228515625, 1.674041748046875, 1.7347412109375, 1.795440673828125, 1.85614013671875, 1.916839599609375, 1.9775390625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 5.0, 4.0, 5.0, 7.0, 13.0, 12.0, 11.0, 19.0, 16.0, 29.0, 31.0, 36.0, 36.0, 39.0, 64.0, 50.0, 63.0, 56.0, 57.0, 56.0, 45.0, 55.0, 42.0, 40.0, 35.0, 39.0, 26.0, 24.0, 16.0, 21.0, 15.0, 8.0, 7.0, 4.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1162109375, -1.081268310546875, -1.04632568359375, -1.011383056640625, -0.9764404296875, -0.941497802734375, -0.90655517578125, -0.871612548828125, -0.836669921875, -0.801727294921875, -0.76678466796875, -0.731842041015625, -0.6968994140625, -0.661956787109375, -0.62701416015625, -0.592071533203125, -0.55712890625, -0.522186279296875, -0.48724365234375, -0.452301025390625, -0.4173583984375, -0.382415771484375, -0.34747314453125, -0.312530517578125, -0.277587890625, -0.242645263671875, -0.20770263671875, -0.172760009765625, -0.1378173828125, -0.102874755859375, -0.06793212890625, -0.032989501953125, 0.001953125, 0.036895751953125, 0.07183837890625, 0.106781005859375, 0.1417236328125, 0.176666259765625, 0.21160888671875, 0.246551513671875, 0.281494140625, 0.316436767578125, 0.35137939453125, 0.386322021484375, 0.4212646484375, 0.456207275390625, 0.49114990234375, 0.526092529296875, 0.56103515625, 0.595977783203125, 0.63092041015625, 0.665863037109375, 0.7008056640625, 0.735748291015625, 0.77069091796875, 0.805633544921875, 0.840576171875, 0.875518798828125, 0.91046142578125, 0.945404052734375, 0.9803466796875, 1.015289306640625, 1.05023193359375, 1.085174560546875, 1.1201171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 8.0, 9.0, 9.0, 16.0, 37.0, 44.0, 76.0, 133.0, 245.0, 646.0, 2053.0, 10013.0, 125731.0, 826065.0, 73626.0, 7112.0, 1639.0, 528.0, 236.0, 130.0, 71.0, 35.0, 28.0, 13.0, 10.0, 11.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.35546875, -0.3448295593261719, -0.33419036865234375, -0.3235511779785156, -0.3129119873046875, -0.3022727966308594, -0.29163360595703125, -0.2809944152832031, -0.270355224609375, -0.2597160339355469, -0.24907684326171875, -0.23843765258789062, -0.2277984619140625, -0.21715927124023438, -0.20652008056640625, -0.19588088989257812, -0.18524169921875, -0.17460250854492188, -0.16396331787109375, -0.15332412719726562, -0.1426849365234375, -0.13204574584960938, -0.12140655517578125, -0.11076736450195312, -0.100128173828125, -0.08948898315429688, -0.07884979248046875, -0.06821060180664062, -0.0575714111328125, -0.046932220458984375, -0.03629302978515625, -0.025653839111328125, -0.0150146484375, -0.004375457763671875, 0.00626373291015625, 0.016902923583984375, 0.0275421142578125, 0.038181304931640625, 0.04882049560546875, 0.059459686279296875, 0.070098876953125, 0.08073806762695312, 0.09137725830078125, 0.10201644897460938, 0.1126556396484375, 0.12329483032226562, 0.13393402099609375, 0.14457321166992188, 0.15521240234375, 0.16585159301757812, 0.17649078369140625, 0.18712997436523438, 0.1977691650390625, 0.20840835571289062, 0.21904754638671875, 0.22968673706054688, 0.240325927734375, 0.2509651184082031, 0.26160430908203125, 0.2722434997558594, 0.2828826904296875, 0.2935218811035156, 0.30416107177734375, 0.3148002624511719, 0.325439453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 7.0, 11.0, 7.0, 8.0, 15.0, 22.0, 19.0, 36.0, 47.0, 62.0, 91.0, 122.0, 127.0, 83.0, 87.0, 61.0, 51.0, 30.0, 28.0, 20.0, 17.0, 7.0, 4.0, 1.0, 3.0, 5.0, 4.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.260374069213867e-05, -3.155320882797241e-05, -3.0502676963806152e-05, -2.9452145099639893e-05, -2.8401613235473633e-05, -2.7351081371307373e-05, -2.6300549507141113e-05, -2.5250017642974854e-05, -2.4199485778808594e-05, -2.3148953914642334e-05, -2.2098422050476074e-05, -2.1047890186309814e-05, -1.9997358322143555e-05, -1.8946826457977295e-05, -1.7896294593811035e-05, -1.6845762729644775e-05, -1.5795230865478516e-05, -1.4744699001312256e-05, -1.3694167137145996e-05, -1.2643635272979736e-05, -1.1593103408813477e-05, -1.0542571544647217e-05, -9.492039680480957e-06, -8.441507816314697e-06, -7.3909759521484375e-06, -6.340444087982178e-06, -5.289912223815918e-06, -4.239380359649658e-06, -3.1888484954833984e-06, -2.1383166313171387e-06, -1.087784767150879e-06, -3.725290298461914e-08, 1.0132789611816406e-06, 2.0638108253479004e-06, 3.11434268951416e-06, 4.16487455368042e-06, 5.21540641784668e-06, 6.2659382820129395e-06, 7.316470146179199e-06, 8.367002010345459e-06, 9.417533874511719e-06, 1.0468065738677979e-05, 1.1518597602844238e-05, 1.2569129467010498e-05, 1.3619661331176758e-05, 1.4670193195343018e-05, 1.5720725059509277e-05, 1.6771256923675537e-05, 1.7821788787841797e-05, 1.8872320652008057e-05, 1.9922852516174316e-05, 2.0973384380340576e-05, 2.2023916244506836e-05, 2.3074448108673096e-05, 2.4124979972839355e-05, 2.5175511837005615e-05, 2.6226043701171875e-05, 2.7276575565338135e-05, 2.8327107429504395e-05, 2.9377639293670654e-05, 3.0428171157836914e-05, 3.1478703022003174e-05, 3.2529234886169434e-05, 3.357976675033569e-05, 3.463029861450195e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 7.0, 6.0, 13.0, 17.0, 25.0, 41.0, 88.0, 130.0, 217.0, 521.0, 1144.0, 3457.0, 12115.0, 62521.0, 411702.0, 470655.0, 67121.0, 12986.0, 3453.0, 1192.0, 535.0, 238.0, 149.0, 79.0, 44.0, 24.0, 19.0, 22.0, 9.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.21044921875, -0.20387649536132812, -0.19730377197265625, -0.19073104858398438, -0.1841583251953125, -0.17758560180664062, -0.17101287841796875, -0.16444015502929688, -0.157867431640625, -0.15129470825195312, -0.14472198486328125, -0.13814926147460938, -0.1315765380859375, -0.12500381469726562, -0.11843109130859375, -0.11185836791992188, -0.10528564453125, -0.09871292114257812, -0.09214019775390625, -0.08556747436523438, -0.0789947509765625, -0.07242202758789062, -0.06584930419921875, -0.059276580810546875, -0.052703857421875, -0.046131134033203125, -0.03955841064453125, -0.032985687255859375, -0.0264129638671875, -0.019840240478515625, -0.01326751708984375, -0.006694793701171875, -0.0001220703125, 0.006450653076171875, 0.01302337646484375, 0.019596099853515625, 0.0261688232421875, 0.032741546630859375, 0.03931427001953125, 0.045886993408203125, 0.052459716796875, 0.059032440185546875, 0.06560516357421875, 0.07217788696289062, 0.0787506103515625, 0.08532333374023438, 0.09189605712890625, 0.09846878051757812, 0.10504150390625, 0.11161422729492188, 0.11818695068359375, 0.12475967407226562, 0.1313323974609375, 0.13790512084960938, 0.14447784423828125, 0.15105056762695312, 0.157623291015625, 0.16419601440429688, 0.17076873779296875, 0.17734146118164062, 0.1839141845703125, 0.19048690795898438, 0.19705963134765625, 0.20363235473632812, 0.210205078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 4.0, 11.0, 11.0, 15.0, 26.0, 28.0, 31.0, 37.0, 52.0, 78.0, 78.0, 133.0, 79.0, 65.0, 71.0, 57.0, 55.0, 40.0, 28.0, 23.0, 19.0, 11.0, 10.0, 9.0, 1.0, 7.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0767822265625, -0.07380962371826172, -0.07083702087402344, -0.06786441802978516, -0.06489181518554688, -0.061919212341308594, -0.05894660949707031, -0.05597400665283203, -0.05300140380859375, -0.05002880096435547, -0.04705619812011719, -0.044083595275878906, -0.041110992431640625, -0.038138389587402344, -0.03516578674316406, -0.03219318389892578, -0.0292205810546875, -0.02624797821044922, -0.023275375366210938, -0.020302772521972656, -0.017330169677734375, -0.014357566833496094, -0.011384963989257812, -0.008412361145019531, -0.00543975830078125, -0.0024671554565429688, 0.0005054473876953125, 0.0034780502319335938, 0.006450653076171875, 0.009423255920410156, 0.012395858764648438, 0.015368461608886719, 0.018341064453125, 0.02131366729736328, 0.024286270141601562, 0.027258872985839844, 0.030231475830078125, 0.033204078674316406, 0.03617668151855469, 0.03914928436279297, 0.04212188720703125, 0.04509449005126953, 0.04806709289550781, 0.051039695739746094, 0.054012298583984375, 0.056984901428222656, 0.05995750427246094, 0.06293010711669922, 0.0659027099609375, 0.06887531280517578, 0.07184791564941406, 0.07482051849365234, 0.07779312133789062, 0.0807657241821289, 0.08373832702636719, 0.08671092987060547, 0.08968353271484375, 0.09265613555908203, 0.09562873840332031, 0.0986013412475586, 0.10157394409179688, 0.10454654693603516, 0.10751914978027344, 0.11049175262451172, 0.11346435546875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 14.0, 11.0, 18.0, 22.0, 35.0, 47.0, 61.0, 72.0, 101.0, 98.0, 83.0, 76.0, 81.0, 67.0, 49.0, 39.0, 31.0, 31.0, 21.0, 13.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6261335611343384, -1.5826365947723389, -1.5391396284103394, -1.4956426620483398, -1.4521456956863403, -1.4086487293243408, -1.3651516437530518, -1.3216547966003418, -1.2781577110290527, -1.2346607446670532, -1.1911637783050537, -1.1476668119430542, -1.1041698455810547, -1.0606728792190552, -1.0171759128570557, -0.9736788868904114, -0.9301819801330566, -0.8866850137710571, -0.8431880474090576, -0.7996910810470581, -0.7561941146850586, -0.7126971483230591, -0.6692001223564148, -0.6257031559944153, -0.5822061896324158, -0.5387092232704163, -0.49521225690841675, -0.45171526074409485, -0.40821829438209534, -0.3647213280200958, -0.3212243318557739, -0.2777273654937744, -0.23423027992248535, -0.19073331356048584, -0.14723633229732513, -0.10373935103416443, -0.06024238467216492, -0.016745418310165405, 0.026751577854156494, 0.070248544216156, 0.11374551057815552, 0.15724247694015503, 0.20073945820331573, 0.24423643946647644, 0.28773340582847595, 0.33123037219047546, 0.37472736835479736, 0.4182243347167969, 0.4617213010787964, 0.5052182674407959, 0.5487152338027954, 0.5922122001647949, 0.6357091665267944, 0.679206132888794, 0.7227031588554382, 0.7662001252174377, 0.8096970915794373, 0.8531940579414368, 0.8966910243034363, 0.9401880502700806, 0.9836850166320801, 1.0271819829940796, 1.070678949356079, 1.1141759157180786, 1.1576728820800781]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 11.0, 15.0, 4.0, 14.0, 12.0, 18.0, 19.0, 30.0, 30.0, 34.0, 41.0, 47.0, 35.0, 47.0, 49.0, 52.0, 48.0, 40.0, 61.0, 43.0, 30.0, 39.0, 35.0, 39.0, 25.0, 35.0, 27.0, 27.0, 14.0, 18.0, 10.0, 3.0, 6.0, 8.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.236802101135254, -1.1844162940979004, -1.1320303678512573, -1.0796445608139038, -1.0272586345672607, -0.9748728275299072, -0.9224869012832642, -0.8701010942459106, -0.8177151679992676, -0.7653293013572693, -0.712943434715271, -0.6605575680732727, -0.6081717014312744, -0.5557858943939209, -0.5033999681472778, -0.45101413130760193, -0.398628294467926, -0.34624242782592773, -0.29385656118392944, -0.24147070944309235, -0.18908484280109406, -0.13669899106025696, -0.08431312441825867, -0.031927257776260376, 0.020458608865737915, 0.0728444755077362, 0.1252303421497345, 0.1776161938905716, 0.23000206053256989, 0.282387912273407, 0.3347737789154053, 0.38715964555740356, 0.43954551219940186, 0.49193137884140015, 0.5443172454833984, 0.5967031121253967, 0.649088978767395, 0.7014747858047485, 0.7538607120513916, 0.8062465190887451, 0.8586324453353882, 0.9110183119773865, 0.9634041786193848, 1.0157899856567383, 1.0681759119033813, 1.1205617189407349, 1.172947645187378, 1.2253334522247314, 1.277719259262085, 1.3301050662994385, 1.3824909925460815, 1.434876799583435, 1.4872627258300781, 1.5396485328674316, 1.5920344591140747, 1.6444202661514282, 1.6968061923980713, 1.7491919994354248, 1.8015779256820679, 1.8539637327194214, 1.9063496589660645, 1.958735466003418, 2.0111212730407715, 2.063507318496704, 2.1158931255340576]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 3.0, 13.0, 16.0, 11.0, 25.0, 30.0, 35.0, 56.0, 66.0, 98.0, 117.0, 199.0, 342.0, 698.0, 1539.0, 4646.0, 17665.0, 113218.0, 2505373.0, 1457511.0, 73060.0, 12934.0, 3693.0, 1353.0, 585.0, 312.0, 198.0, 113.0, 102.0, 66.0, 43.0, 34.0, 28.0, 26.0, 19.0, 16.0, 13.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98779296875, -0.9558334350585938, -0.9238739013671875, -0.8919143676757812, -0.859954833984375, -0.8279953002929688, -0.7960357666015625, -0.7640762329101562, -0.73211669921875, -0.7001571655273438, -0.6681976318359375, -0.6362380981445312, -0.604278564453125, -0.5723190307617188, -0.5403594970703125, -0.5083999633789062, -0.4764404296875, -0.44448089599609375, -0.4125213623046875, -0.38056182861328125, -0.348602294921875, -0.31664276123046875, -0.2846832275390625, -0.25272369384765625, -0.22076416015625, -0.18880462646484375, -0.1568450927734375, -0.12488555908203125, -0.092926025390625, -0.06096649169921875, -0.0290069580078125, 0.00295257568359375, 0.034912109375, 0.06687164306640625, 0.0988311767578125, 0.13079071044921875, 0.162750244140625, 0.19470977783203125, 0.2266693115234375, 0.25862884521484375, 0.29058837890625, 0.32254791259765625, 0.3545074462890625, 0.38646697998046875, 0.418426513671875, 0.45038604736328125, 0.4823455810546875, 0.5143051147460938, 0.5462646484375, 0.5782241821289062, 0.6101837158203125, 0.6421432495117188, 0.674102783203125, 0.7060623168945312, 0.7380218505859375, 0.7699813842773438, 0.80194091796875, 0.8339004516601562, 0.8658599853515625, 0.8978195190429688, 0.929779052734375, 0.9617385864257812, 0.9936981201171875, 1.0256576538085938, 1.0576171875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 6.0, 7.0, 9.0, 10.0, 10.0, 18.0, 14.0, 20.0, 32.0, 31.0, 29.0, 50.0, 60.0, 46.0, 81.0, 65.0, 53.0, 55.0, 56.0, 50.0, 55.0, 46.0, 34.0, 35.0, 26.0, 31.0, 17.0, 12.0, 5.0, 6.0, 6.0, 6.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43798828125, -0.42252349853515625, -0.4070587158203125, -0.39159393310546875, -0.376129150390625, -0.36066436767578125, -0.3451995849609375, -0.32973480224609375, -0.31427001953125, -0.29880523681640625, -0.2833404541015625, -0.26787567138671875, -0.252410888671875, -0.23694610595703125, -0.2214813232421875, -0.20601654052734375, -0.1905517578125, -0.17508697509765625, -0.1596221923828125, -0.14415740966796875, -0.128692626953125, -0.11322784423828125, -0.0977630615234375, -0.08229827880859375, -0.06683349609375, -0.05136871337890625, -0.0359039306640625, -0.02043914794921875, -0.004974365234375, 0.01049041748046875, 0.0259552001953125, 0.04141998291015625, 0.056884765625, 0.07234954833984375, 0.0878143310546875, 0.10327911376953125, 0.118743896484375, 0.13420867919921875, 0.1496734619140625, 0.16513824462890625, 0.18060302734375, 0.19606781005859375, 0.2115325927734375, 0.22699737548828125, 0.242462158203125, 0.25792694091796875, 0.2733917236328125, 0.28885650634765625, 0.3043212890625, 0.31978607177734375, 0.3352508544921875, 0.35071563720703125, 0.366180419921875, 0.38164520263671875, 0.3971099853515625, 0.41257476806640625, 0.42803955078125, 0.44350433349609375, 0.4589691162109375, 0.47443389892578125, 0.489898681640625, 0.5053634643554688, 0.5208282470703125, 0.5362930297851562, 0.5517578125]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 8.0, 5.0, 14.0, 7.0, 17.0, 32.0, 49.0, 87.0, 173.0, 449.0, 1476.0, 8548.0, 104644.0, 3656269.0, 398910.0, 19617.0, 2756.0, 690.0, 255.0, 124.0, 55.0, 28.0, 13.0, 15.0, 12.0, 11.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.529296875, -1.479461669921875, -1.42962646484375, -1.379791259765625, -1.3299560546875, -1.280120849609375, -1.23028564453125, -1.180450439453125, -1.130615234375, -1.080780029296875, -1.03094482421875, -0.981109619140625, -0.9312744140625, -0.881439208984375, -0.83160400390625, -0.781768798828125, -0.73193359375, -0.682098388671875, -0.63226318359375, -0.582427978515625, -0.5325927734375, -0.482757568359375, -0.43292236328125, -0.383087158203125, -0.333251953125, -0.283416748046875, -0.23358154296875, -0.183746337890625, -0.1339111328125, -0.084075927734375, -0.03424072265625, 0.015594482421875, 0.0654296875, 0.115264892578125, 0.16510009765625, 0.214935302734375, 0.2647705078125, 0.314605712890625, 0.36444091796875, 0.414276123046875, 0.464111328125, 0.513946533203125, 0.56378173828125, 0.613616943359375, 0.6634521484375, 0.713287353515625, 0.76312255859375, 0.812957763671875, 0.86279296875, 0.912628173828125, 0.96246337890625, 1.012298583984375, 1.0621337890625, 1.111968994140625, 1.16180419921875, 1.211639404296875, 1.261474609375, 1.311309814453125, 1.36114501953125, 1.410980224609375, 1.4608154296875, 1.510650634765625, 1.56048583984375, 1.610321044921875, 1.66015625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 4.0, 13.0, 10.0, 13.0, 22.0, 32.0, 39.0, 47.0, 63.0, 108.0, 141.0, 190.0, 336.0, 434.0, 614.0, 577.0, 417.0, 309.0, 204.0, 143.0, 89.0, 63.0, 48.0, 37.0, 31.0, 17.0, 15.0, 14.0, 16.0, 6.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.293212890625, -0.28569793701171875, -0.2781829833984375, -0.27066802978515625, -0.263153076171875, -0.25563812255859375, -0.2481231689453125, -0.24060821533203125, -0.23309326171875, -0.22557830810546875, -0.2180633544921875, -0.21054840087890625, -0.203033447265625, -0.19551849365234375, -0.1880035400390625, -0.18048858642578125, -0.1729736328125, -0.16545867919921875, -0.1579437255859375, -0.15042877197265625, -0.142913818359375, -0.13539886474609375, -0.1278839111328125, -0.12036895751953125, -0.11285400390625, -0.10533905029296875, -0.0978240966796875, -0.09030914306640625, -0.082794189453125, -0.07527923583984375, -0.0677642822265625, -0.06024932861328125, -0.052734375, -0.04521942138671875, -0.0377044677734375, -0.03018951416015625, -0.022674560546875, -0.01515960693359375, -0.0076446533203125, -0.00012969970703125, 0.00738525390625, 0.01490020751953125, 0.0224151611328125, 0.02993011474609375, 0.037445068359375, 0.04496002197265625, 0.0524749755859375, 0.05998992919921875, 0.0675048828125, 0.07501983642578125, 0.0825347900390625, 0.09004974365234375, 0.097564697265625, 0.10507965087890625, 0.1125946044921875, 0.12010955810546875, 0.12762451171875, 0.13513946533203125, 0.1426544189453125, 0.15016937255859375, 0.157684326171875, 0.16519927978515625, 0.1727142333984375, 0.18022918701171875, 0.187744140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 11.0, 14.0, 17.0, 15.0, 28.0, 45.0, 61.0, 70.0, 83.0, 79.0, 88.0, 74.0, 73.0, 92.0, 40.0, 50.0, 31.0, 25.0, 33.0, 24.0, 16.0, 5.0, 7.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5145568251609802, -0.4861331582069397, -0.45770949125289917, -0.42928585410118103, -0.4008621871471405, -0.3724385201931, -0.34401488304138184, -0.3155912160873413, -0.2871675491333008, -0.25874388217926025, -0.23032023012638092, -0.2018965780735016, -0.17347291111946106, -0.14504924416542053, -0.1166255921125412, -0.08820194005966187, -0.05977827310562134, -0.03135461360216141, -0.002930954098701477, 0.025492705404758453, 0.053916364908218384, 0.08234003186225891, 0.11076368391513824, 0.13918733596801758, 0.1676110029220581, 0.19603466987609863, 0.22445832192897797, 0.2528819739818573, 0.2813056409358978, 0.30972930788993835, 0.3381529450416565, 0.366576611995697, 0.3950002193450928, 0.4234238862991333, 0.45184755325317383, 0.48027119040489197, 0.5086948871612549, 0.5371185541152954, 0.5655421614646912, 0.5939658284187317, 0.6223894953727722, 0.6508131623268127, 0.6792368292808533, 0.7076604962348938, 0.7360841035842896, 0.7645077705383301, 0.7929314374923706, 0.8213551044464111, 0.8497787714004517, 0.8782024383544922, 0.9066261053085327, 0.9350497722625732, 0.9634734392166138, 0.9918971061706543, 1.0203207731246948, 1.0487444400787354, 1.0771679878234863, 1.1055916547775269, 1.1340153217315674, 1.162438988685608, 1.1908626556396484, 1.219286322593689, 1.2477099895477295, 1.2761335372924805, 1.3045573234558105]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 3.0, 4.0, 4.0, 9.0, 4.0, 7.0, 13.0, 11.0, 19.0, 16.0, 20.0, 24.0, 37.0, 28.0, 36.0, 46.0, 33.0, 45.0, 44.0, 39.0, 40.0, 45.0, 46.0, 41.0, 45.0, 43.0, 37.0, 33.0, 28.0, 38.0, 17.0, 24.0, 22.0, 14.0, 18.0, 15.0, 6.0, 11.0, 5.0, 10.0, 4.0, 8.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.46474847197532654, -0.4487897753715515, -0.4328310787677765, -0.41687238216400146, -0.40091365575790405, -0.38495495915412903, -0.368996262550354, -0.353037565946579, -0.33707886934280396, -0.32112017273902893, -0.3051614761352539, -0.2892027497291565, -0.27324405312538147, -0.25728535652160645, -0.24132665991783142, -0.2253679633140564, -0.20940923690795898, -0.19345054030418396, -0.17749182879924774, -0.16153313219547272, -0.1455744206905365, -0.12961572408676147, -0.11365702748298645, -0.09769832342863083, -0.08173961937427521, -0.06578091531991959, -0.04982221499085426, -0.03386351466178894, -0.01790481060743332, -0.0019461065530776978, 0.014012590050697327, 0.029971294105052948, 0.04592996835708618, 0.0618886724114418, 0.07784737646579742, 0.09380607306957245, 0.10976477712392807, 0.1257234811782837, 0.14168217778205872, 0.15764087438583374, 0.17359958589076996, 0.18955828249454498, 0.2055169939994812, 0.22147569060325623, 0.23743438720703125, 0.25339311361312866, 0.2693517804145813, 0.2853105068206787, 0.30126920342445374, 0.31722790002822876, 0.3331865966320038, 0.3491452932357788, 0.3651040196418762, 0.38106271624565125, 0.39702141284942627, 0.4129801094532013, 0.4289388060569763, 0.44489750266075134, 0.46085619926452637, 0.4768149256706238, 0.4927736222743988, 0.5087323188781738, 0.5246909856796265, 0.5406497120857239, 0.5566084384918213]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 14.0, 17.0, 16.0, 33.0, 59.0, 89.0, 133.0, 232.0, 410.0, 664.0, 1203.0, 2247.0, 4685.0, 10811.0, 27175.0, 86192.0, 313595.0, 408836.0, 127897.0, 38025.0, 13972.0, 6018.0, 2808.0, 1444.0, 812.0, 438.0, 262.0, 174.0, 113.0, 64.0, 46.0, 17.0, 19.0, 5.0, 6.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.116455078125, -0.11163330078125, -0.1068115234375, -0.10198974609375, -0.09716796875, -0.09234619140625, -0.0875244140625, -0.08270263671875, -0.077880859375, -0.07305908203125, -0.0682373046875, -0.06341552734375, -0.05859375, -0.05377197265625, -0.0489501953125, -0.04412841796875, -0.039306640625, -0.03448486328125, -0.0296630859375, -0.02484130859375, -0.02001953125, -0.01519775390625, -0.0103759765625, -0.00555419921875, -0.000732421875, 0.00408935546875, 0.0089111328125, 0.01373291015625, 0.0185546875, 0.02337646484375, 0.0281982421875, 0.03302001953125, 0.037841796875, 0.04266357421875, 0.0474853515625, 0.05230712890625, 0.05712890625, 0.06195068359375, 0.0667724609375, 0.07159423828125, 0.076416015625, 0.08123779296875, 0.0860595703125, 0.09088134765625, 0.095703125, 0.10052490234375, 0.1053466796875, 0.11016845703125, 0.114990234375, 0.11981201171875, 0.1246337890625, 0.12945556640625, 0.13427734375, 0.13909912109375, 0.1439208984375, 0.14874267578125, 0.153564453125, 0.15838623046875, 0.1632080078125, 0.16802978515625, 0.1728515625, 0.17767333984375, 0.1824951171875, 0.18731689453125, 0.192138671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 3.0, 10.0, 7.0, 6.0, 15.0, 25.0, 20.0, 31.0, 34.0, 48.0, 56.0, 62.0, 63.0, 61.0, 74.0, 55.0, 72.0, 63.0, 63.0, 43.0, 41.0, 31.0, 25.0, 22.0, 21.0, 15.0, 11.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34228515625, -0.32724761962890625, -0.3122100830078125, -0.29717254638671875, -0.282135009765625, -0.26709747314453125, -0.2520599365234375, -0.23702239990234375, -0.22198486328125, -0.20694732666015625, -0.1919097900390625, -0.17687225341796875, -0.161834716796875, -0.14679718017578125, -0.1317596435546875, -0.11672210693359375, -0.1016845703125, -0.08664703369140625, -0.0716094970703125, -0.05657196044921875, -0.041534423828125, -0.02649688720703125, -0.0114593505859375, 0.00357818603515625, 0.01861572265625, 0.03365325927734375, 0.0486907958984375, 0.06372833251953125, 0.078765869140625, 0.09380340576171875, 0.1088409423828125, 0.12387847900390625, 0.138916015625, 0.15395355224609375, 0.1689910888671875, 0.18402862548828125, 0.199066162109375, 0.21410369873046875, 0.2291412353515625, 0.24417877197265625, 0.25921630859375, 0.27425384521484375, 0.2892913818359375, 0.30432891845703125, 0.319366455078125, 0.33440399169921875, 0.3494415283203125, 0.36447906494140625, 0.3795166015625, 0.39455413818359375, 0.4095916748046875, 0.42462921142578125, 0.439666748046875, 0.45470428466796875, 0.4697418212890625, 0.48477935791015625, 0.49981689453125, 0.5148544311523438, 0.5298919677734375, 0.5449295043945312, 0.559967041015625, 0.5750045776367188, 0.5900421142578125, 0.6050796508789062, 0.6201171875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 6.0, 11.0, 13.0, 8.0, 17.0, 15.0, 25.0, 31.0, 53.0, 86.0, 91.0, 185.0, 232.0, 388.0, 617.0, 1148.0, 2421.0, 5891.0, 18109.0, 76270.0, 402564.0, 425984.0, 83198.0, 19290.0, 6270.0, 2527.0, 1252.0, 692.0, 367.0, 248.0, 143.0, 92.0, 90.0, 56.0, 47.0, 28.0, 18.0, 17.0, 13.0, 10.0, 11.0, 7.0, 0.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.147216796875, -0.14262008666992188, -0.13802337646484375, -0.13342666625976562, -0.1288299560546875, -0.12423324584960938, -0.11963653564453125, -0.11503982543945312, -0.110443115234375, -0.10584640502929688, -0.10124969482421875, -0.09665298461914062, -0.0920562744140625, -0.08745956420898438, -0.08286285400390625, -0.07826614379882812, -0.07366943359375, -0.06907272338867188, -0.06447601318359375, -0.059879302978515625, -0.0552825927734375, -0.050685882568359375, -0.04608917236328125, -0.041492462158203125, -0.036895751953125, -0.032299041748046875, -0.02770233154296875, -0.023105621337890625, -0.0185089111328125, -0.013912200927734375, -0.00931549072265625, -0.004718780517578125, -0.0001220703125, 0.004474639892578125, 0.00907135009765625, 0.013668060302734375, 0.0182647705078125, 0.022861480712890625, 0.02745819091796875, 0.032054901123046875, 0.036651611328125, 0.041248321533203125, 0.04584503173828125, 0.050441741943359375, 0.0550384521484375, 0.059635162353515625, 0.06423187255859375, 0.06882858276367188, 0.07342529296875, 0.07802200317382812, 0.08261871337890625, 0.08721542358398438, 0.0918121337890625, 0.09640884399414062, 0.10100555419921875, 0.10560226440429688, 0.110198974609375, 0.11479568481445312, 0.11939239501953125, 0.12398910522460938, 0.1285858154296875, 0.13318252563476562, 0.13777923583984375, 0.14237594604492188, 0.14697265625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 2.0, 5.0, 5.0, 9.0, 11.0, 20.0, 17.0, 17.0, 24.0, 45.0, 33.0, 31.0, 45.0, 35.0, 43.0, 50.0, 68.0, 63.0, 57.0, 55.0, 48.0, 54.0, 37.0, 33.0, 32.0, 31.0, 26.0, 24.0, 16.0, 16.0, 10.0, 14.0, 5.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73681640625, -0.7108917236328125, -0.684967041015625, -0.6590423583984375, -0.63311767578125, -0.6071929931640625, -0.581268310546875, -0.5553436279296875, -0.5294189453125, -0.5034942626953125, -0.477569580078125, -0.4516448974609375, -0.42572021484375, -0.3997955322265625, -0.373870849609375, -0.3479461669921875, -0.322021484375, -0.2960968017578125, -0.270172119140625, -0.2442474365234375, -0.21832275390625, -0.1923980712890625, -0.166473388671875, -0.1405487060546875, -0.1146240234375, -0.0886993408203125, -0.062774658203125, -0.0368499755859375, -0.01092529296875, 0.0149993896484375, 0.040924072265625, 0.0668487548828125, 0.0927734375, 0.1186981201171875, 0.144622802734375, 0.1705474853515625, 0.19647216796875, 0.2223968505859375, 0.248321533203125, 0.2742462158203125, 0.3001708984375, 0.3260955810546875, 0.352020263671875, 0.3779449462890625, 0.40386962890625, 0.4297943115234375, 0.455718994140625, 0.4816436767578125, 0.507568359375, 0.5334930419921875, 0.559417724609375, 0.5853424072265625, 0.61126708984375, 0.6371917724609375, 0.663116455078125, 0.6890411376953125, 0.7149658203125, 0.7408905029296875, 0.766815185546875, 0.7927398681640625, 0.81866455078125, 0.8445892333984375, 0.870513916015625, 0.8964385986328125, 0.92236328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 5.0, 10.0, 7.0, 12.0, 19.0, 28.0, 49.0, 58.0, 105.0, 144.0, 249.0, 438.0, 861.0, 1774.0, 4251.0, 13322.0, 55797.0, 409438.0, 475852.0, 62867.0, 14542.0, 4768.0, 1903.0, 882.0, 453.0, 254.0, 142.0, 116.0, 51.0, 44.0, 31.0, 19.0, 20.0, 13.0, 6.0, 8.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10382080078125, -0.10058021545410156, -0.09733963012695312, -0.09409904479980469, -0.09085845947265625, -0.08761787414550781, -0.08437728881835938, -0.08113670349121094, -0.0778961181640625, -0.07465553283691406, -0.07141494750976562, -0.06817436218261719, -0.06493377685546875, -0.06169319152832031, -0.058452606201171875, -0.05521202087402344, -0.051971435546875, -0.04873085021972656, -0.045490264892578125, -0.04224967956542969, -0.03900909423828125, -0.03576850891113281, -0.032527923583984375, -0.029287338256835938, -0.0260467529296875, -0.022806167602539062, -0.019565582275390625, -0.016324996948242188, -0.01308441162109375, -0.009843826293945312, -0.006603240966796875, -0.0033626556396484375, -0.0001220703125, 0.0031185150146484375, 0.006359100341796875, 0.009599685668945312, 0.01284027099609375, 0.016080856323242188, 0.019321441650390625, 0.022562026977539062, 0.0258026123046875, 0.029043197631835938, 0.032283782958984375, 0.03552436828613281, 0.03876495361328125, 0.04200553894042969, 0.045246124267578125, 0.04848670959472656, 0.051727294921875, 0.05496788024902344, 0.058208465576171875, 0.06144905090332031, 0.06468963623046875, 0.06793022155761719, 0.07117080688476562, 0.07441139221191406, 0.0776519775390625, 0.08089256286621094, 0.08413314819335938, 0.08737373352050781, 0.09061431884765625, 0.09385490417480469, 0.09709548950195312, 0.10033607482910156, 0.10357666015625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 4.0, 16.0, 15.0, 21.0, 42.0, 57.0, 89.0, 127.0, 171.0, 157.0, 111.0, 61.0, 37.0, 24.0, 22.0, 15.0, 10.0, 7.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76837158203125e-05, -4.558544605970383e-05, -4.3487176299095154e-05, -4.138890653848648e-05, -3.929063677787781e-05, -3.7192367017269135e-05, -3.509409725666046e-05, -3.299582749605179e-05, -3.0897557735443115e-05, -2.8799287974834442e-05, -2.670101821422577e-05, -2.4602748453617096e-05, -2.2504478693008423e-05, -2.040620893239975e-05, -1.8307939171791077e-05, -1.6209669411182404e-05, -1.411139965057373e-05, -1.2013129889965057e-05, -9.914860129356384e-06, -7.816590368747711e-06, -5.718320608139038e-06, -3.620050847530365e-06, -1.521781086921692e-06, 5.764886736869812e-07, 2.6747584342956543e-06, 4.773028194904327e-06, 6.8712979555130005e-06, 8.969567716121674e-06, 1.1067837476730347e-05, 1.316610723733902e-05, 1.5264376997947693e-05, 1.7362646758556366e-05, 1.946091651916504e-05, 2.1559186279773712e-05, 2.3657456040382385e-05, 2.575572580099106e-05, 2.785399556159973e-05, 2.9952265322208405e-05, 3.205053508281708e-05, 3.414880484342575e-05, 3.6247074604034424e-05, 3.83453443646431e-05, 4.044361412525177e-05, 4.254188388586044e-05, 4.4640153646469116e-05, 4.673842340707779e-05, 4.883669316768646e-05, 5.0934962928295135e-05, 5.303323268890381e-05, 5.513150244951248e-05, 5.7229772210121155e-05, 5.932804197072983e-05, 6.14263117313385e-05, 6.352458149194717e-05, 6.562285125255585e-05, 6.772112101316452e-05, 6.98193907737732e-05, 7.191766053438187e-05, 7.401593029499054e-05, 7.611420005559921e-05, 7.821246981620789e-05, 8.031073957681656e-05, 8.240900933742523e-05, 8.45072790980339e-05, 8.660554885864258e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 13.0, 9.0, 16.0, 26.0, 50.0, 63.0, 132.0, 226.0, 502.0, 1189.0, 2791.0, 7354.0, 20679.0, 68821.0, 290992.0, 480255.0, 123510.0, 33372.0, 11206.0, 4161.0, 1685.0, 742.0, 339.0, 162.0, 69.0, 54.0, 31.0, 26.0, 17.0, 10.0, 10.0, 5.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1046142578125, -0.10146427154541016, -0.09831428527832031, -0.09516429901123047, -0.09201431274414062, -0.08886432647705078, -0.08571434020996094, -0.0825643539428711, -0.07941436767578125, -0.0762643814086914, -0.07311439514160156, -0.06996440887451172, -0.06681442260742188, -0.06366443634033203, -0.06051445007324219, -0.057364463806152344, -0.0542144775390625, -0.051064491271972656, -0.04791450500488281, -0.04476451873779297, -0.041614532470703125, -0.03846454620361328, -0.03531455993652344, -0.032164573669433594, -0.02901458740234375, -0.025864601135253906, -0.022714614868164062, -0.01956462860107422, -0.016414642333984375, -0.013264656066894531, -0.010114669799804688, -0.006964683532714844, -0.003814697265625, -0.0006647109985351562, 0.0024852752685546875, 0.005635261535644531, 0.008785247802734375, 0.011935234069824219, 0.015085220336914062, 0.018235206604003906, 0.02138519287109375, 0.024535179138183594, 0.027685165405273438, 0.03083515167236328, 0.033985137939453125, 0.03713512420654297, 0.04028511047363281, 0.043435096740722656, 0.0465850830078125, 0.049735069274902344, 0.05288505554199219, 0.05603504180908203, 0.059185028076171875, 0.06233501434326172, 0.06548500061035156, 0.0686349868774414, 0.07178497314453125, 0.0749349594116211, 0.07808494567871094, 0.08123493194580078, 0.08438491821289062, 0.08753490447998047, 0.09068489074707031, 0.09383487701416016, 0.09698486328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 1.0, 5.0, 4.0, 5.0, 5.0, 5.0, 6.0, 21.0, 29.0, 28.0, 45.0, 49.0, 67.0, 87.0, 111.0, 110.0, 95.0, 64.0, 66.0, 38.0, 29.0, 30.0, 24.0, 15.0, 13.0, 8.0, 7.0, 7.0, 8.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.019622802734375, -0.01884603500366211, -0.01806926727294922, -0.017292499542236328, -0.016515731811523438, -0.015738964080810547, -0.014962196350097656, -0.014185428619384766, -0.013408660888671875, -0.012631893157958984, -0.011855125427246094, -0.011078357696533203, -0.010301589965820312, -0.009524822235107422, -0.008748054504394531, -0.00797128677368164, -0.00719451904296875, -0.006417751312255859, -0.005640983581542969, -0.004864215850830078, -0.0040874481201171875, -0.003310680389404297, -0.0025339126586914062, -0.0017571449279785156, -0.000980377197265625, -0.00020360946655273438, 0.0005731582641601562, 0.0013499259948730469, 0.0021266937255859375, 0.002903461456298828, 0.0036802291870117188, 0.004456996917724609, 0.0052337646484375, 0.006010532379150391, 0.006787300109863281, 0.007564067840576172, 0.008340835571289062, 0.009117603302001953, 0.009894371032714844, 0.010671138763427734, 0.011447906494140625, 0.012224674224853516, 0.013001441955566406, 0.013778209686279297, 0.014554977416992188, 0.015331745147705078, 0.01610851287841797, 0.01688528060913086, 0.01766204833984375, 0.01843881607055664, 0.01921558380126953, 0.019992351531982422, 0.020769119262695312, 0.021545886993408203, 0.022322654724121094, 0.023099422454833984, 0.023876190185546875, 0.024652957916259766, 0.025429725646972656, 0.026206493377685547, 0.026983261108398438, 0.027760028839111328, 0.02853679656982422, 0.02931356430053711, 0.03009033203125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 10.0, 14.0, 23.0, 30.0, 34.0, 63.0, 87.0, 99.0, 114.0, 107.0, 100.0, 81.0, 70.0, 46.0, 35.0, 38.0, 17.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6156778335571289, -0.5939664840698242, -0.5722551345825195, -0.5505437850952148, -0.5288324356079102, -0.5071210861206055, -0.48540976643562317, -0.4636984169483185, -0.4419870674610138, -0.4202757179737091, -0.3985643684864044, -0.3768530488014221, -0.35514169931411743, -0.33343034982681274, -0.31171900033950806, -0.29000765085220337, -0.2682963013648987, -0.246584951877594, -0.2248736023902893, -0.2031622678041458, -0.18145091831684113, -0.15973956882953644, -0.13802823424339294, -0.11631688475608826, -0.09460553526878357, -0.07289418578147888, -0.05118284374475479, -0.0294715017080307, -0.007760152220726013, 0.013951197266578674, 0.03566253185272217, 0.057373881340026855, 0.07908517122268677, 0.10079652070999146, 0.12250786274671555, 0.14421920478343964, 0.16593055427074432, 0.187641903758049, 0.2093532383441925, 0.2310645878314972, 0.2527759373188019, 0.27448728680610657, 0.29619863629341125, 0.31790995597839355, 0.33962130546569824, 0.36133265495300293, 0.3830440044403076, 0.4047553539276123, 0.426466703414917, 0.4481780529022217, 0.46988940238952637, 0.49160075187683105, 0.5133121013641357, 0.5350234508514404, 0.5567348003387451, 0.5784461498260498, 0.6001574993133545, 0.6218688488006592, 0.6435801982879639, 0.6652915477752686, 0.6870028972625732, 0.7087142467498779, 0.7304255962371826, 0.7521369457244873, 0.7738482356071472]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 4.0, 2.0, 3.0, 4.0, 8.0, 10.0, 7.0, 20.0, 15.0, 20.0, 19.0, 33.0, 34.0, 46.0, 43.0, 54.0, 51.0, 55.0, 48.0, 62.0, 44.0, 61.0, 47.0, 54.0, 41.0, 39.0, 28.0, 26.0, 24.0, 24.0, 16.0, 16.0, 14.0, 9.0, 8.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3125542998313904, -0.3008567690849304, -0.28915923833847046, -0.2774617373943329, -0.2657642066478729, -0.25406667590141296, -0.242369145154953, -0.23067162930965424, -0.21897411346435547, -0.2072765827178955, -0.19557906687259674, -0.18388153612613678, -0.172184020280838, -0.16048648953437805, -0.1487889587879181, -0.13709144294261932, -0.12539391219615936, -0.11369638890028, -0.10199886560440063, -0.09030133485794067, -0.0786038190126419, -0.06690628826618195, -0.05520876497030258, -0.04351124167442322, -0.031813718378543854, -0.02011619508266449, -0.008418669924139977, 0.0032788552343845367, 0.0149763785302639, 0.026673901826143265, 0.03837142884731293, 0.05006895214319229, 0.061766475439071655, 0.07346399873495102, 0.08516152203083038, 0.09685905277729034, 0.10855656862258911, 0.12025409936904907, 0.13195163011550903, 0.1436491459608078, 0.15534666180610657, 0.16704419255256653, 0.1787417083978653, 0.19043923914432526, 0.20213675498962402, 0.21383428573608398, 0.22553181648254395, 0.2372293323278427, 0.24892686307430267, 0.26062437891960144, 0.2723219096660614, 0.28401944041252136, 0.2957169711589813, 0.3074144721031189, 0.31911200284957886, 0.3308095335960388, 0.3425070643424988, 0.35420459508895874, 0.3659021258354187, 0.3775996267795563, 0.38929715752601624, 0.4009946882724762, 0.41269221901893616, 0.42438971996307373, 0.4360872507095337]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 10.0, 13.0, 23.0, 23.0, 39.0, 83.0, 133.0, 228.0, 378.0, 667.0, 1180.0, 2114.0, 4287.0, 9056.0, 21976.0, 63044.0, 253878.0, 485564.0, 137464.0, 39572.0, 15020.0, 6635.0, 3292.0, 1670.0, 879.0, 541.0, 295.0, 191.0, 118.0, 66.0, 35.0, 26.0, 18.0, 15.0, 2.0, 4.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52001953125, -0.5034027099609375, -0.486785888671875, -0.4701690673828125, -0.45355224609375, -0.4369354248046875, -0.420318603515625, -0.4037017822265625, -0.3870849609375, -0.3704681396484375, -0.353851318359375, -0.3372344970703125, -0.32061767578125, -0.3040008544921875, -0.287384033203125, -0.2707672119140625, -0.254150390625, -0.2375335693359375, -0.220916748046875, -0.2042999267578125, -0.18768310546875, -0.1710662841796875, -0.154449462890625, -0.1378326416015625, -0.1212158203125, -0.1045989990234375, -0.087982177734375, -0.0713653564453125, -0.05474853515625, -0.0381317138671875, -0.021514892578125, -0.0048980712890625, 0.01171875, 0.0283355712890625, 0.044952392578125, 0.0615692138671875, 0.07818603515625, 0.0948028564453125, 0.111419677734375, 0.1280364990234375, 0.1446533203125, 0.1612701416015625, 0.177886962890625, 0.1945037841796875, 0.21112060546875, 0.2277374267578125, 0.244354248046875, 0.2609710693359375, 0.277587890625, 0.2942047119140625, 0.310821533203125, 0.3274383544921875, 0.34405517578125, 0.3606719970703125, 0.377288818359375, 0.3939056396484375, 0.4105224609375, 0.4271392822265625, 0.443756103515625, 0.4603729248046875, 0.47698974609375, 0.4936065673828125, 0.510223388671875, 0.5268402099609375, 0.54345703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 4.0, 6.0, 8.0, 6.0, 14.0, 16.0, 31.0, 23.0, 37.0, 40.0, 34.0, 36.0, 58.0, 58.0, 54.0, 59.0, 63.0, 48.0, 56.0, 51.0, 43.0, 48.0, 39.0, 29.0, 36.0, 21.0, 23.0, 11.0, 20.0, 4.0, 7.0, 4.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.77001953125, -0.7428359985351562, -0.7156524658203125, -0.6884689331054688, -0.661285400390625, -0.6341018676757812, -0.6069183349609375, -0.5797348022460938, -0.55255126953125, -0.5253677368164062, -0.4981842041015625, -0.47100067138671875, -0.443817138671875, -0.41663360595703125, -0.3894500732421875, -0.36226654052734375, -0.3350830078125, -0.30789947509765625, -0.2807159423828125, -0.25353240966796875, -0.226348876953125, -0.19916534423828125, -0.1719818115234375, -0.14479827880859375, -0.11761474609375, -0.09043121337890625, -0.0632476806640625, -0.03606414794921875, -0.008880615234375, 0.01830291748046875, 0.0454864501953125, 0.07266998291015625, 0.099853515625, 0.12703704833984375, 0.1542205810546875, 0.18140411376953125, 0.208587646484375, 0.23577117919921875, 0.2629547119140625, 0.29013824462890625, 0.31732177734375, 0.34450531005859375, 0.3716888427734375, 0.39887237548828125, 0.426055908203125, 0.45323944091796875, 0.4804229736328125, 0.5076065063476562, 0.5347900390625, 0.5619735717773438, 0.5891571044921875, 0.6163406372070312, 0.643524169921875, 0.6707077026367188, 0.6978912353515625, 0.7250747680664062, 0.75225830078125, 0.7794418334960938, 0.8066253662109375, 0.8338088989257812, 0.860992431640625, 0.8881759643554688, 0.9153594970703125, 0.9425430297851562, 0.9697265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 10.0, 9.0, 16.0, 21.0, 30.0, 46.0, 72.0, 154.0, 345.0, 1082.0, 4142.0, 22262.0, 271042.0, 693632.0, 45898.0, 7217.0, 1594.0, 500.0, 230.0, 92.0, 56.0, 38.0, 16.0, 19.0, 4.0, 8.0, 3.0, 5.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.376953125, -1.3418045043945312, -1.3066558837890625, -1.2715072631835938, -1.236358642578125, -1.2012100219726562, -1.1660614013671875, -1.1309127807617188, -1.09576416015625, -1.0606155395507812, -1.0254669189453125, -0.9903182983398438, -0.955169677734375, -0.9200210571289062, -0.8848724365234375, -0.8497238159179688, -0.8145751953125, -0.7794265747070312, -0.7442779541015625, -0.7091293334960938, -0.673980712890625, -0.6388320922851562, -0.6036834716796875, -0.5685348510742188, -0.53338623046875, -0.49823760986328125, -0.4630889892578125, -0.42794036865234375, -0.392791748046875, -0.35764312744140625, -0.3224945068359375, -0.28734588623046875, -0.252197265625, -0.21704864501953125, -0.1819000244140625, -0.14675140380859375, -0.111602783203125, -0.07645416259765625, -0.0413055419921875, -0.00615692138671875, 0.02899169921875, 0.06414031982421875, 0.0992889404296875, 0.13443756103515625, 0.169586181640625, 0.20473480224609375, 0.2398834228515625, 0.27503204345703125, 0.3101806640625, 0.34532928466796875, 0.3804779052734375, 0.41562652587890625, 0.450775146484375, 0.48592376708984375, 0.5210723876953125, 0.5562210083007812, 0.59136962890625, 0.6265182495117188, 0.6616668701171875, 0.6968154907226562, 0.731964111328125, 0.7671127319335938, 0.8022613525390625, 0.8374099731445312, 0.87255859375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 7.0, 11.0, 8.0, 14.0, 10.0, 19.0, 21.0, 23.0, 30.0, 35.0, 36.0, 47.0, 45.0, 49.0, 43.0, 43.0, 55.0, 46.0, 48.0, 57.0, 45.0, 37.0, 44.0, 32.0, 39.0, 27.0, 13.0, 29.0, 17.0, 13.0, 11.0, 8.0, 7.0, 5.0, 5.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79052734375, -0.7609329223632812, -0.7313385009765625, -0.7017440795898438, -0.672149658203125, -0.6425552368164062, -0.6129608154296875, -0.5833663940429688, -0.55377197265625, -0.5241775512695312, -0.4945831298828125, -0.46498870849609375, -0.435394287109375, -0.40579986572265625, -0.3762054443359375, -0.34661102294921875, -0.3170166015625, -0.28742218017578125, -0.2578277587890625, -0.22823333740234375, -0.198638916015625, -0.16904449462890625, -0.1394500732421875, -0.10985565185546875, -0.08026123046875, -0.05066680908203125, -0.0210723876953125, 0.00852203369140625, 0.038116455078125, 0.06771087646484375, 0.0973052978515625, 0.12689971923828125, 0.156494140625, 0.18608856201171875, 0.2156829833984375, 0.24527740478515625, 0.274871826171875, 0.30446624755859375, 0.3340606689453125, 0.36365509033203125, 0.39324951171875, 0.42284393310546875, 0.4524383544921875, 0.48203277587890625, 0.511627197265625, 0.5412216186523438, 0.5708160400390625, 0.6004104614257812, 0.6300048828125, 0.6595993041992188, 0.6891937255859375, 0.7187881469726562, 0.748382568359375, 0.7779769897460938, 0.8075714111328125, 0.8371658325195312, 0.86676025390625, 0.8963546752929688, 0.9259490966796875, 0.9555435180664062, 0.985137939453125, 1.0147323608398438, 1.0443267822265625, 1.0739212036132812, 1.103515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 8.0, 4.0, 5.0, 14.0, 13.0, 45.0, 88.0, 306.0, 993.0, 4959.0, 56288.0, 798555.0, 174698.0, 10296.0, 1616.0, 427.0, 138.0, 46.0, 25.0, 14.0, 8.0, 7.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3193359375, -0.3082008361816406, -0.29706573486328125, -0.2859306335449219, -0.2747955322265625, -0.2636604309082031, -0.25252532958984375, -0.24139022827148438, -0.230255126953125, -0.21912002563476562, -0.20798492431640625, -0.19684982299804688, -0.1857147216796875, -0.17457962036132812, -0.16344451904296875, -0.15230941772460938, -0.14117431640625, -0.13003921508789062, -0.11890411376953125, -0.10776901245117188, -0.0966339111328125, -0.08549880981445312, -0.07436370849609375, -0.06322860717773438, -0.052093505859375, -0.040958404541015625, -0.02982330322265625, -0.018688201904296875, -0.0075531005859375, 0.003582000732421875, 0.01471710205078125, 0.025852203369140625, 0.0369873046875, 0.048122406005859375, 0.05925750732421875, 0.07039260864257812, 0.0815277099609375, 0.09266281127929688, 0.10379791259765625, 0.11493301391601562, 0.126068115234375, 0.13720321655273438, 0.14833831787109375, 0.15947341918945312, 0.1706085205078125, 0.18174362182617188, 0.19287872314453125, 0.20401382446289062, 0.21514892578125, 0.22628402709960938, 0.23741912841796875, 0.24855422973632812, 0.2596893310546875, 0.2708244323730469, 0.28195953369140625, 0.2930946350097656, 0.304229736328125, 0.3153648376464844, 0.32649993896484375, 0.3376350402832031, 0.3487701416015625, 0.3599052429199219, 0.37104034423828125, 0.3821754455566406, 0.393310546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 7.0, 5.0, 8.0, 14.0, 22.0, 28.0, 40.0, 42.0, 65.0, 110.0, 119.0, 134.0, 109.0, 83.0, 61.0, 39.0, 30.0, 20.0, 11.0, 11.0, 14.0, 7.0, 6.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.236532211303711e-05, -3.1218864023685455e-05, -3.00724059343338e-05, -2.8925947844982147e-05, -2.7779489755630493e-05, -2.663303166627884e-05, -2.5486573576927185e-05, -2.434011548757553e-05, -2.3193657398223877e-05, -2.2047199308872223e-05, -2.090074121952057e-05, -1.9754283130168915e-05, -1.860782504081726e-05, -1.7461366951465607e-05, -1.6314908862113953e-05, -1.5168450772762299e-05, -1.4021992683410645e-05, -1.287553459405899e-05, -1.1729076504707336e-05, -1.0582618415355682e-05, -9.436160326004028e-06, -8.289702236652374e-06, -7.14324414730072e-06, -5.996786057949066e-06, -4.850327968597412e-06, -3.703869879245758e-06, -2.557411789894104e-06, -1.41095370054245e-06, -2.644956111907959e-07, 8.819624781608582e-07, 2.028420567512512e-06, 3.1748786568641663e-06, 4.32133674621582e-06, 5.467794835567474e-06, 6.614252924919128e-06, 7.760711014270782e-06, 8.907169103622437e-06, 1.005362719297409e-05, 1.1200085282325745e-05, 1.2346543371677399e-05, 1.3493001461029053e-05, 1.4639459550380707e-05, 1.578591763973236e-05, 1.6932375729084015e-05, 1.807883381843567e-05, 1.9225291907787323e-05, 2.0371749997138977e-05, 2.151820808649063e-05, 2.2664666175842285e-05, 2.381112426519394e-05, 2.4957582354545593e-05, 2.6104040443897247e-05, 2.72504985332489e-05, 2.8396956622600555e-05, 2.954341471195221e-05, 3.0689872801303864e-05, 3.183633089065552e-05, 3.298278898000717e-05, 3.4129247069358826e-05, 3.527570515871048e-05, 3.6422163248062134e-05, 3.756862133741379e-05, 3.871507942676544e-05, 3.9861537516117096e-05, 4.100799560546875e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 16.0, 21.0, 41.0, 70.0, 266.0, 910.0, 4382.0, 31234.0, 432845.0, 532906.0, 39361.0, 4997.0, 1034.0, 274.0, 90.0, 41.0, 20.0, 11.0, 5.0, 8.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3154296875, -0.304931640625, -0.29443359375, -0.283935546875, -0.2734375, -0.262939453125, -0.25244140625, -0.241943359375, -0.2314453125, -0.220947265625, -0.21044921875, -0.199951171875, -0.189453125, -0.178955078125, -0.16845703125, -0.157958984375, -0.1474609375, -0.136962890625, -0.12646484375, -0.115966796875, -0.10546875, -0.094970703125, -0.08447265625, -0.073974609375, -0.0634765625, -0.052978515625, -0.04248046875, -0.031982421875, -0.021484375, -0.010986328125, -0.00048828125, 0.010009765625, 0.0205078125, 0.031005859375, 0.04150390625, 0.052001953125, 0.0625, 0.072998046875, 0.08349609375, 0.093994140625, 0.1044921875, 0.114990234375, 0.12548828125, 0.135986328125, 0.146484375, 0.156982421875, 0.16748046875, 0.177978515625, 0.1884765625, 0.198974609375, 0.20947265625, 0.219970703125, 0.23046875, 0.240966796875, 0.25146484375, 0.261962890625, 0.2724609375, 0.282958984375, 0.29345703125, 0.303955078125, 0.314453125, 0.324951171875, 0.33544921875, 0.345947265625, 0.3564453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 8.0, 7.0, 10.0, 14.0, 14.0, 19.0, 27.0, 38.0, 43.0, 65.0, 64.0, 62.0, 82.0, 94.0, 95.0, 88.0, 50.0, 45.0, 29.0, 35.0, 25.0, 19.0, 11.0, 14.0, 13.0, 6.0, 8.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09710693359375, -0.09417915344238281, -0.09125137329101562, -0.08832359313964844, -0.08539581298828125, -0.08246803283691406, -0.07954025268554688, -0.07661247253417969, -0.0736846923828125, -0.07075691223144531, -0.06782913208007812, -0.06490135192871094, -0.06197357177734375, -0.05904579162597656, -0.056118011474609375, -0.05319023132324219, -0.050262451171875, -0.04733467102050781, -0.044406890869140625, -0.04147911071777344, -0.03855133056640625, -0.03562355041503906, -0.032695770263671875, -0.029767990112304688, -0.0268402099609375, -0.023912429809570312, -0.020984649658203125, -0.018056869506835938, -0.01512908935546875, -0.012201309204101562, -0.009273529052734375, -0.0063457489013671875, -0.00341796875, -0.0004901885986328125, 0.002437591552734375, 0.0053653717041015625, 0.00829315185546875, 0.011220932006835938, 0.014148712158203125, 0.017076492309570312, 0.0200042724609375, 0.022932052612304688, 0.025859832763671875, 0.028787612915039062, 0.03171539306640625, 0.03464317321777344, 0.037570953369140625, 0.04049873352050781, 0.043426513671875, 0.04635429382324219, 0.049282073974609375, 0.05220985412597656, 0.05513763427734375, 0.05806541442871094, 0.060993194580078125, 0.06392097473144531, 0.0668487548828125, 0.06977653503417969, 0.07270431518554688, 0.07563209533691406, 0.07855987548828125, 0.08148765563964844, 0.08441543579101562, 0.08734321594238281, 0.09027099609375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 26.0, 32.0, 59.0, 72.0, 112.0, 128.0, 130.0, 141.0, 97.0, 72.0, 52.0, 35.0, 22.0, 7.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5244736671447754, -1.464622139930725, -1.4047704935073853, -1.344918966293335, -1.2850673198699951, -1.2252157926559448, -1.1653642654418945, -1.1055126190185547, -1.0456610918045044, -0.9858095049858093, -0.9259579181671143, -0.866106390953064, -0.8062548041343689, -0.7464032173156738, -0.6865516901016235, -0.6267001032829285, -0.5668485164642334, -0.5069969296455383, -0.44714537262916565, -0.38729381561279297, -0.3274422287940979, -0.26759064197540283, -0.20773908495903015, -0.14788752794265747, -0.0880359411239624, -0.028184369206428528, 0.03166720271110535, 0.09151877462863922, 0.1513703465461731, 0.21122193336486816, 0.27107349038124084, 0.3309250473976135, 0.3907766342163086, 0.45062822103500366, 0.5104798078536987, 0.570331335067749, 0.6301829218864441, 0.6900345087051392, 0.7498860359191895, 0.8097376227378845, 0.8695892095565796, 0.9294407963752747, 0.9892923831939697, 1.04914391040802, 1.1089954376220703, 1.1688470840454102, 1.2286986112594604, 1.2885501384735107, 1.3484017848968506, 1.4082533121109009, 1.4681049585342407, 1.527956485748291, 1.5878081321716309, 1.6476596593856812, 1.7075111865997314, 1.7673628330230713, 1.8272143602371216, 1.8870658874511719, 1.9469175338745117, 2.0067691802978516, 2.0666205883026123, 2.126472234725952, 2.186323881149292, 2.2461752891540527, 2.3060269355773926]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 4.0, 5.0, 5.0, 6.0, 9.0, 3.0, 8.0, 10.0, 13.0, 20.0, 11.0, 20.0, 25.0, 23.0, 28.0, 21.0, 37.0, 27.0, 40.0, 34.0, 48.0, 41.0, 38.0, 51.0, 33.0, 45.0, 48.0, 42.0, 47.0, 37.0, 30.0, 35.0, 27.0, 22.0, 24.0, 18.0, 10.0, 8.0, 14.0, 3.0, 7.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.3675720691680908, -1.324709177017212, -1.2818461656570435, -1.2389832735061646, -1.196120262145996, -1.1532573699951172, -1.1103943586349487, -1.0675314664840698, -1.0246684551239014, -0.9818055033683777, -0.938942551612854, -0.8960795998573303, -0.8532166481018066, -0.810353696346283, -0.7674907445907593, -0.7246278524398804, -0.6817649006843567, -0.638901948928833, -0.5960389971733093, -0.5531760454177856, -0.510313093662262, -0.4674501419067383, -0.424587219953537, -0.3817242681980133, -0.3388613164424896, -0.29599836468696594, -0.25313541293144226, -0.21027247607707977, -0.1674095243215561, -0.12454657256603241, -0.08168363571166992, -0.03882068395614624, 0.004042267799377441, 0.046905215829610825, 0.08976816385984421, 0.1326311081647873, 0.17549405992031097, 0.21835701167583466, 0.26121994853019714, 0.3040829002857208, 0.3469458520412445, 0.3898088037967682, 0.43267175555229187, 0.47553467750549316, 0.5183976292610168, 0.5612605810165405, 0.6041235327720642, 0.6469864845275879, 0.6898494362831116, 0.7327123880386353, 0.7755753397941589, 0.8184382915496826, 0.8613012433052063, 0.90416419506073, 0.9470270872116089, 0.9898900985717773, 1.0327529907226562, 1.0756158828735352, 1.1184788942337036, 1.1613417863845825, 1.204204797744751, 1.2470676898956299, 1.2899307012557983, 1.3327935934066772, 1.3756566047668457]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 14.0, 5.0, 6.0, 13.0, 12.0, 14.0, 25.0, 21.0, 27.0, 54.0, 68.0, 142.0, 377.0, 1226.0, 5274.0, 31269.0, 430505.0, 3485439.0, 213803.0, 20354.0, 3831.0, 979.0, 360.0, 154.0, 94.0, 51.0, 38.0, 33.0, 19.0, 18.0, 9.0, 10.0, 14.0, 12.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2001953125, -1.1619720458984375, -1.123748779296875, -1.0855255126953125, -1.04730224609375, -1.0090789794921875, -0.970855712890625, -0.9326324462890625, -0.8944091796875, -0.8561859130859375, -0.817962646484375, -0.7797393798828125, -0.74151611328125, -0.7032928466796875, -0.665069580078125, -0.6268463134765625, -0.588623046875, -0.5503997802734375, -0.512176513671875, -0.4739532470703125, -0.43572998046875, -0.3975067138671875, -0.359283447265625, -0.3210601806640625, -0.2828369140625, -0.2446136474609375, -0.206390380859375, -0.1681671142578125, -0.12994384765625, -0.0917205810546875, -0.053497314453125, -0.0152740478515625, 0.02294921875, 0.0611724853515625, 0.099395751953125, 0.1376190185546875, 0.17584228515625, 0.2140655517578125, 0.252288818359375, 0.2905120849609375, 0.3287353515625, 0.3669586181640625, 0.405181884765625, 0.4434051513671875, 0.48162841796875, 0.5198516845703125, 0.558074951171875, 0.5962982177734375, 0.634521484375, 0.6727447509765625, 0.710968017578125, 0.7491912841796875, 0.78741455078125, 0.8256378173828125, 0.863861083984375, 0.9020843505859375, 0.9403076171875, 0.9785308837890625, 1.016754150390625, 1.0549774169921875, 1.09320068359375, 1.1314239501953125, 1.169647216796875, 1.2078704833984375, 1.24609375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 12.0, 14.0, 16.0, 16.0, 25.0, 25.0, 38.0, 51.0, 46.0, 45.0, 58.0, 64.0, 63.0, 52.0, 56.0, 58.0, 53.0, 55.0, 36.0, 29.0, 33.0, 23.0, 22.0, 22.0, 16.0, 13.0, 4.0, 10.0, 8.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3525390625, -0.34053802490234375, -0.3285369873046875, -0.31653594970703125, -0.304534912109375, -0.29253387451171875, -0.2805328369140625, -0.26853179931640625, -0.25653076171875, -0.24452972412109375, -0.2325286865234375, -0.22052764892578125, -0.208526611328125, -0.19652557373046875, -0.1845245361328125, -0.17252349853515625, -0.1605224609375, -0.14852142333984375, -0.1365203857421875, -0.12451934814453125, -0.112518310546875, -0.10051727294921875, -0.0885162353515625, -0.07651519775390625, -0.06451416015625, -0.05251312255859375, -0.0405120849609375, -0.02851104736328125, -0.016510009765625, -0.00450897216796875, 0.0074920654296875, 0.01949310302734375, 0.031494140625, 0.04349517822265625, 0.0554962158203125, 0.06749725341796875, 0.079498291015625, 0.09149932861328125, 0.1035003662109375, 0.11550140380859375, 0.12750244140625, 0.13950347900390625, 0.1515045166015625, 0.16350555419921875, 0.175506591796875, 0.18750762939453125, 0.1995086669921875, 0.21150970458984375, 0.2235107421875, 0.23551177978515625, 0.2475128173828125, 0.25951385498046875, 0.271514892578125, 0.28351593017578125, 0.2955169677734375, 0.30751800537109375, 0.31951904296875, 0.33152008056640625, 0.3435211181640625, 0.35552215576171875, 0.367523193359375, 0.37952423095703125, 0.3915252685546875, 0.40352630615234375, 0.41552734375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 13.0, 20.0, 37.0, 29.0, 58.0, 97.0, 166.0, 302.0, 782.0, 3459.0, 26774.0, 467340.0, 3493406.0, 184145.0, 14262.0, 2209.0, 576.0, 242.0, 121.0, 67.0, 56.0, 42.0, 21.0, 14.0, 13.0, 7.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -0.9980926513671875, -0.957122802734375, -0.9161529541015625, -0.87518310546875, -0.8342132568359375, -0.793243408203125, -0.7522735595703125, -0.7113037109375, -0.6703338623046875, -0.629364013671875, -0.5883941650390625, -0.54742431640625, -0.5064544677734375, -0.465484619140625, -0.4245147705078125, -0.383544921875, -0.3425750732421875, -0.301605224609375, -0.2606353759765625, -0.21966552734375, -0.1786956787109375, -0.137725830078125, -0.0967559814453125, -0.0557861328125, -0.0148162841796875, 0.026153564453125, 0.0671234130859375, 0.10809326171875, 0.1490631103515625, 0.190032958984375, 0.2310028076171875, 0.27197265625, 0.3129425048828125, 0.353912353515625, 0.3948822021484375, 0.43585205078125, 0.4768218994140625, 0.517791748046875, 0.5587615966796875, 0.5997314453125, 0.6407012939453125, 0.681671142578125, 0.7226409912109375, 0.76361083984375, 0.8045806884765625, 0.845550537109375, 0.8865203857421875, 0.927490234375, 0.9684600830078125, 1.009429931640625, 1.0503997802734375, 1.09136962890625, 1.1323394775390625, 1.173309326171875, 1.2142791748046875, 1.2552490234375, 1.2962188720703125, 1.337188720703125, 1.3781585693359375, 1.41912841796875, 1.4600982666015625, 1.501068115234375, 1.5420379638671875, 1.5830078125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 3.0, 4.0, 13.0, 11.0, 21.0, 31.0, 23.0, 25.0, 62.0, 58.0, 100.0, 127.0, 173.0, 238.0, 329.0, 418.0, 478.0, 499.0, 372.0, 278.0, 211.0, 161.0, 100.0, 94.0, 65.0, 54.0, 33.0, 19.0, 17.0, 17.0, 12.0, 12.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21923828125, -0.21209716796875, -0.2049560546875, -0.19781494140625, -0.190673828125, -0.18353271484375, -0.1763916015625, -0.16925048828125, -0.162109375, -0.15496826171875, -0.1478271484375, -0.14068603515625, -0.133544921875, -0.12640380859375, -0.1192626953125, -0.11212158203125, -0.10498046875, -0.09783935546875, -0.0906982421875, -0.08355712890625, -0.076416015625, -0.06927490234375, -0.0621337890625, -0.05499267578125, -0.0478515625, -0.04071044921875, -0.0335693359375, -0.02642822265625, -0.019287109375, -0.01214599609375, -0.0050048828125, 0.00213623046875, 0.00927734375, 0.01641845703125, 0.0235595703125, 0.03070068359375, 0.037841796875, 0.04498291015625, 0.0521240234375, 0.05926513671875, 0.06640625, 0.07354736328125, 0.0806884765625, 0.08782958984375, 0.094970703125, 0.10211181640625, 0.1092529296875, 0.11639404296875, 0.12353515625, 0.13067626953125, 0.1378173828125, 0.14495849609375, 0.152099609375, 0.15924072265625, 0.1663818359375, 0.17352294921875, 0.1806640625, 0.18780517578125, 0.1949462890625, 0.20208740234375, 0.209228515625, 0.21636962890625, 0.2235107421875, 0.23065185546875, 0.23779296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 11.0, 6.0, 10.0, 9.0, 8.0, 14.0, 16.0, 21.0, 22.0, 23.0, 39.0, 29.0, 32.0, 41.0, 37.0, 45.0, 46.0, 50.0, 58.0, 45.0, 45.0, 41.0, 37.0, 34.0, 36.0, 35.0, 36.0, 22.0, 29.0, 13.0, 20.0, 16.0, 12.0, 10.0, 13.0, 3.0, 6.0, 6.0, 3.0, 0.0, 5.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0], "bins": [-0.5422593951225281, -0.5267993807792664, -0.5113394260406494, -0.4958794414997101, -0.48041945695877075, -0.46495944261550903, -0.4494994580745697, -0.43403947353363037, -0.41857948899269104, -0.4031195044517517, -0.3876595199108124, -0.37219953536987305, -0.35673952102661133, -0.3412795662879944, -0.32581955194473267, -0.31035956740379333, -0.294899582862854, -0.2794395983219147, -0.26397961378097534, -0.24851961433887482, -0.23305962979793549, -0.21759964525699615, -0.20213964581489563, -0.1866796612739563, -0.17121967673301697, -0.15575969219207764, -0.1402997076511383, -0.12483970820903778, -0.10937972366809845, -0.09391973912715912, -0.07845974713563919, -0.06299975514411926, -0.047539740800857544, -0.032079752534627914, -0.016619764268398285, -0.0011597760021686554, 0.014300212264060974, 0.029760196805000305, 0.04522018879652023, 0.06068018078804016, 0.07614016532897949, 0.09160014986991882, 0.10706014186143875, 0.12252013385295868, 0.137980118393898, 0.15344010293483734, 0.16890010237693787, 0.1843600869178772, 0.19982007145881653, 0.21528005599975586, 0.2307400405406952, 0.24620003998279572, 0.26166003942489624, 0.2771199941635132, 0.2925800085067749, 0.30803999304771423, 0.32349997758865356, 0.3389599621295929, 0.3544199466705322, 0.36987993121147156, 0.3853399157524109, 0.4007999300956726, 0.41625991463661194, 0.43171989917755127, 0.4471798837184906]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 4.0, 13.0, 8.0, 10.0, 10.0, 12.0, 18.0, 13.0, 20.0, 20.0, 25.0, 31.0, 20.0, 41.0, 30.0, 28.0, 32.0, 35.0, 37.0, 46.0, 39.0, 32.0, 44.0, 43.0, 37.0, 36.0, 21.0, 27.0, 29.0, 31.0, 25.0, 19.0, 23.0, 25.0, 18.0, 15.0, 12.0, 11.0, 14.0, 8.0, 7.0, 6.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.4581279456615448, -0.4442524313926697, -0.43037694692611694, -0.4165014326572418, -0.4026259183883667, -0.3887504041194916, -0.37487488985061646, -0.3609994053840637, -0.3471238911151886, -0.3332483768463135, -0.31937289237976074, -0.3054973781108856, -0.2916218638420105, -0.2777463495731354, -0.26387083530426025, -0.24999535083770752, -0.2361198365688324, -0.22224432229995728, -0.20836882293224335, -0.19449332356452942, -0.1806178092956543, -0.16674229502677917, -0.15286679565906525, -0.13899129629135132, -0.1251157820224762, -0.11124027520418167, -0.09736476838588715, -0.08348926156759262, -0.0696137547492981, -0.05573824793100357, -0.041862741112709045, -0.02798723429441452, -0.014111727476119995, -0.00023622065782546997, 0.013639286160469055, 0.02751479297876358, 0.041390299797058105, 0.05526580661535263, 0.06914131343364716, 0.08301682025194168, 0.0968923270702362, 0.11076783388853073, 0.12464334070682526, 0.13851884007453918, 0.1523943543434143, 0.16626986861228943, 0.18014536798000336, 0.19402086734771729, 0.2078963816165924, 0.22177189588546753, 0.23564739525318146, 0.24952289462089539, 0.2633984088897705, 0.27727392315864563, 0.29114943742752075, 0.3050249218940735, 0.3189004361629486, 0.33277595043182373, 0.34665143489837646, 0.3605269491672516, 0.3744024634361267, 0.38827797770500183, 0.40215349197387695, 0.4160289764404297, 0.4299044907093048]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 5.0, 6.0, 11.0, 16.0, 27.0, 32.0, 69.0, 100.0, 150.0, 220.0, 341.0, 485.0, 909.0, 1546.0, 2734.0, 5095.0, 11813.0, 69829.0, 612524.0, 297262.0, 28198.0, 7888.0, 3926.0, 2145.0, 1301.0, 755.0, 419.0, 275.0, 176.0, 101.0, 70.0, 41.0, 26.0, 19.0, 16.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2027587890625, -0.196380615234375, -0.19000244140625, -0.183624267578125, -0.17724609375, -0.170867919921875, -0.16448974609375, -0.158111572265625, -0.1517333984375, -0.145355224609375, -0.13897705078125, -0.132598876953125, -0.126220703125, -0.119842529296875, -0.11346435546875, -0.107086181640625, -0.1007080078125, -0.094329833984375, -0.08795166015625, -0.081573486328125, -0.0751953125, -0.068817138671875, -0.06243896484375, -0.056060791015625, -0.0496826171875, -0.043304443359375, -0.03692626953125, -0.030548095703125, -0.024169921875, -0.017791748046875, -0.01141357421875, -0.005035400390625, 0.0013427734375, 0.007720947265625, 0.01409912109375, 0.020477294921875, 0.02685546875, 0.033233642578125, 0.03961181640625, 0.045989990234375, 0.0523681640625, 0.058746337890625, 0.06512451171875, 0.071502685546875, 0.077880859375, 0.084259033203125, 0.09063720703125, 0.097015380859375, 0.1033935546875, 0.109771728515625, 0.11614990234375, 0.122528076171875, 0.12890625, 0.135284423828125, 0.14166259765625, 0.148040771484375, 0.1544189453125, 0.160797119140625, 0.16717529296875, 0.173553466796875, 0.179931640625, 0.186309814453125, 0.19268798828125, 0.199066162109375, 0.2054443359375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 3.0, 9.0, 12.0, 9.0, 7.0, 18.0, 20.0, 29.0, 39.0, 43.0, 36.0, 38.0, 48.0, 43.0, 44.0, 55.0, 38.0, 47.0, 54.0, 35.0, 52.0, 54.0, 39.0, 30.0, 31.0, 32.0, 20.0, 25.0, 19.0, 14.0, 12.0, 8.0, 10.0, 6.0, 10.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389892578125, -0.3777313232421875, -0.365570068359375, -0.3534088134765625, -0.34124755859375, -0.3290863037109375, -0.316925048828125, -0.3047637939453125, -0.2926025390625, -0.2804412841796875, -0.268280029296875, -0.2561187744140625, -0.24395751953125, -0.2317962646484375, -0.219635009765625, -0.2074737548828125, -0.1953125, -0.1831512451171875, -0.170989990234375, -0.1588287353515625, -0.14666748046875, -0.1345062255859375, -0.122344970703125, -0.1101837158203125, -0.0980224609375, -0.0858612060546875, -0.073699951171875, -0.0615386962890625, -0.04937744140625, -0.0372161865234375, -0.025054931640625, -0.0128936767578125, -0.000732421875, 0.0114288330078125, 0.023590087890625, 0.0357513427734375, 0.04791259765625, 0.0600738525390625, 0.072235107421875, 0.0843963623046875, 0.0965576171875, 0.1087188720703125, 0.120880126953125, 0.1330413818359375, 0.14520263671875, 0.1573638916015625, 0.169525146484375, 0.1816864013671875, 0.19384765625, 0.2060089111328125, 0.218170166015625, 0.2303314208984375, 0.24249267578125, 0.2546539306640625, 0.266815185546875, 0.2789764404296875, 0.2911376953125, 0.3032989501953125, 0.315460205078125, 0.3276214599609375, 0.33978271484375, 0.3519439697265625, 0.364105224609375, 0.3762664794921875, 0.388427734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 9.0, 4.0, 8.0, 9.0, 13.0, 13.0, 14.0, 28.0, 37.0, 56.0, 110.0, 158.0, 342.0, 691.0, 1532.0, 3666.0, 11347.0, 100536.0, 796559.0, 114676.0, 11972.0, 3692.0, 1559.0, 662.0, 337.0, 194.0, 100.0, 59.0, 50.0, 21.0, 15.0, 8.0, 11.0, 14.0, 6.0, 12.0, 1.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.213134765625, -0.2063732147216797, -0.19961166381835938, -0.19285011291503906, -0.18608856201171875, -0.17932701110839844, -0.17256546020507812, -0.1658039093017578, -0.1590423583984375, -0.1522808074951172, -0.14551925659179688, -0.13875770568847656, -0.13199615478515625, -0.12523460388183594, -0.11847305297851562, -0.11171150207519531, -0.104949951171875, -0.09818840026855469, -0.09142684936523438, -0.08466529846191406, -0.07790374755859375, -0.07114219665527344, -0.06438064575195312, -0.05761909484863281, -0.0508575439453125, -0.04409599304199219, -0.037334442138671875, -0.030572891235351562, -0.02381134033203125, -0.017049789428710938, -0.010288238525390625, -0.0035266876220703125, 0.00323486328125, 0.009996414184570312, 0.016757965087890625, 0.023519515991210938, 0.03028106689453125, 0.03704261779785156, 0.043804168701171875, 0.05056571960449219, 0.0573272705078125, 0.06408882141113281, 0.07085037231445312, 0.07761192321777344, 0.08437347412109375, 0.09113502502441406, 0.09789657592773438, 0.10465812683105469, 0.111419677734375, 0.11818122863769531, 0.12494277954101562, 0.13170433044433594, 0.13846588134765625, 0.14522743225097656, 0.15198898315429688, 0.1587505340576172, 0.1655120849609375, 0.1722736358642578, 0.17903518676757812, 0.18579673767089844, 0.19255828857421875, 0.19931983947753906, 0.20608139038085938, 0.2128429412841797, 0.2196044921875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 13.0, 9.0, 12.0, 6.0, 10.0, 19.0, 23.0, 22.0, 25.0, 25.0, 30.0, 41.0, 39.0, 31.0, 44.0, 36.0, 46.0, 52.0, 52.0, 28.0, 40.0, 37.0, 34.0, 41.0, 25.0, 32.0, 21.0, 21.0, 21.0, 29.0, 17.0, 22.0, 14.0, 16.0, 16.0, 9.0, 18.0, 2.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.7880859375, -0.7633285522460938, -0.7385711669921875, -0.7138137817382812, -0.689056396484375, -0.6642990112304688, -0.6395416259765625, -0.6147842407226562, -0.59002685546875, -0.5652694702148438, -0.5405120849609375, -0.5157546997070312, -0.490997314453125, -0.46623992919921875, -0.4414825439453125, -0.41672515869140625, -0.3919677734375, -0.36721038818359375, -0.3424530029296875, -0.31769561767578125, -0.292938232421875, -0.26818084716796875, -0.2434234619140625, -0.21866607666015625, -0.19390869140625, -0.16915130615234375, -0.1443939208984375, -0.11963653564453125, -0.094879150390625, -0.07012176513671875, -0.0453643798828125, -0.02060699462890625, 0.004150390625, 0.02890777587890625, 0.0536651611328125, 0.07842254638671875, 0.103179931640625, 0.12793731689453125, 0.1526947021484375, 0.17745208740234375, 0.20220947265625, 0.22696685791015625, 0.2517242431640625, 0.27648162841796875, 0.301239013671875, 0.32599639892578125, 0.3507537841796875, 0.37551116943359375, 0.4002685546875, 0.42502593994140625, 0.4497833251953125, 0.47454071044921875, 0.499298095703125, 0.5240554809570312, 0.5488128662109375, 0.5735702514648438, 0.59832763671875, 0.6230850219726562, 0.6478424072265625, 0.6725997924804688, 0.697357177734375, 0.7221145629882812, 0.7468719482421875, 0.7716293334960938, 0.79638671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 8.0, 10.0, 11.0, 23.0, 19.0, 31.0, 61.0, 105.0, 171.0, 385.0, 800.0, 2040.0, 6077.0, 27056.0, 716835.0, 269978.0, 17408.0, 4477.0, 1655.0, 671.0, 313.0, 179.0, 93.0, 55.0, 37.0, 16.0, 11.0, 12.0, 10.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1790771484375, -0.1730823516845703, -0.16708755493164062, -0.16109275817871094, -0.15509796142578125, -0.14910316467285156, -0.14310836791992188, -0.1371135711669922, -0.1311187744140625, -0.1251239776611328, -0.11912918090820312, -0.11313438415527344, -0.10713958740234375, -0.10114479064941406, -0.09514999389648438, -0.08915519714355469, -0.083160400390625, -0.07716560363769531, -0.07117080688476562, -0.06517601013183594, -0.05918121337890625, -0.05318641662597656, -0.047191619873046875, -0.04119682312011719, -0.0352020263671875, -0.029207229614257812, -0.023212432861328125, -0.017217636108398438, -0.01122283935546875, -0.0052280426025390625, 0.000766754150390625, 0.0067615509033203125, 0.01275634765625, 0.018751144409179688, 0.024745941162109375, 0.030740737915039062, 0.03673553466796875, 0.04273033142089844, 0.048725128173828125, 0.05471992492675781, 0.0607147216796875, 0.06670951843261719, 0.07270431518554688, 0.07869911193847656, 0.08469390869140625, 0.09068870544433594, 0.09668350219726562, 0.10267829895019531, 0.108673095703125, 0.11466789245605469, 0.12066268920898438, 0.12665748596191406, 0.13265228271484375, 0.13864707946777344, 0.14464187622070312, 0.1506366729736328, 0.1566314697265625, 0.1626262664794922, 0.16862106323242188, 0.17461585998535156, 0.18061065673828125, 0.18660545349121094, 0.19260025024414062, 0.1985950469970703, 0.20458984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 7.0, 13.0, 10.0, 28.0, 56.0, 135.0, 188.0, 225.0, 143.0, 80.0, 35.0, 28.0, 14.0, 7.0, 9.0, 2.0, 4.0, 0.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.638599395751953e-05, -5.406234413385391e-05, -5.1738694310188293e-05, -4.9415044486522675e-05, -4.7091394662857056e-05, -4.476774483919144e-05, -4.244409501552582e-05, -4.01204451918602e-05, -3.779679536819458e-05, -3.547314554452896e-05, -3.314949572086334e-05, -3.0825845897197723e-05, -2.8502196073532104e-05, -2.6178546249866486e-05, -2.3854896426200867e-05, -2.1531246602535248e-05, -1.920759677886963e-05, -1.688394695520401e-05, -1.4560297131538391e-05, -1.2236647307872772e-05, -9.912997484207153e-06, -7.5893476605415344e-06, -5.2656978368759155e-06, -2.9420480132102966e-06, -6.183981895446777e-07, 1.7052516341209412e-06, 4.02890145778656e-06, 6.352551281452179e-06, 8.676201105117798e-06, 1.0999850928783417e-05, 1.3323500752449036e-05, 1.5647150576114655e-05, 1.7970800399780273e-05, 2.0294450223445892e-05, 2.261810004711151e-05, 2.494174987077713e-05, 2.726539969444275e-05, 2.9589049518108368e-05, 3.191269934177399e-05, 3.4236349165439606e-05, 3.6559998989105225e-05, 3.8883648812770844e-05, 4.120729863643646e-05, 4.353094846010208e-05, 4.58545982837677e-05, 4.817824810743332e-05, 5.050189793109894e-05, 5.282554775476456e-05, 5.5149197578430176e-05, 5.7472847402095795e-05, 5.9796497225761414e-05, 6.212014704942703e-05, 6.444379687309265e-05, 6.676744669675827e-05, 6.909109652042389e-05, 7.141474634408951e-05, 7.373839616775513e-05, 7.606204599142075e-05, 7.838569581508636e-05, 8.070934563875198e-05, 8.30329954624176e-05, 8.535664528608322e-05, 8.768029510974884e-05, 9.000394493341446e-05, 9.232759475708008e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 9.0, 22.0, 32.0, 49.0, 74.0, 136.0, 215.0, 377.0, 693.0, 1212.0, 2283.0, 3822.0, 7250.0, 15742.0, 55032.0, 365516.0, 483495.0, 74971.0, 19554.0, 8285.0, 4336.0, 2400.0, 1306.0, 802.0, 400.0, 221.0, 139.0, 87.0, 42.0, 29.0, 11.0, 5.0, 13.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10693359375, -0.10379695892333984, -0.10066032409667969, -0.09752368927001953, -0.09438705444335938, -0.09125041961669922, -0.08811378479003906, -0.0849771499633789, -0.08184051513671875, -0.0787038803100586, -0.07556724548339844, -0.07243061065673828, -0.06929397583007812, -0.06615734100341797, -0.06302070617675781, -0.059884071350097656, -0.0567474365234375, -0.053610801696777344, -0.05047416687011719, -0.04733753204345703, -0.044200897216796875, -0.04106426239013672, -0.03792762756347656, -0.034790992736816406, -0.03165435791015625, -0.028517723083496094, -0.025381088256835938, -0.02224445343017578, -0.019107818603515625, -0.01597118377685547, -0.012834548950195312, -0.009697914123535156, -0.006561279296875, -0.0034246444702148438, -0.0002880096435546875, 0.0028486251831054688, 0.005985260009765625, 0.009121894836425781, 0.012258529663085938, 0.015395164489746094, 0.01853179931640625, 0.021668434143066406, 0.024805068969726562, 0.02794170379638672, 0.031078338623046875, 0.03421497344970703, 0.03735160827636719, 0.040488243103027344, 0.0436248779296875, 0.046761512756347656, 0.04989814758300781, 0.05303478240966797, 0.056171417236328125, 0.05930805206298828, 0.06244468688964844, 0.0655813217163086, 0.06871795654296875, 0.0718545913696289, 0.07499122619628906, 0.07812786102294922, 0.08126449584960938, 0.08440113067626953, 0.08753776550292969, 0.09067440032958984, 0.09381103515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 1.0, 6.0, 7.0, 5.0, 20.0, 24.0, 82.0, 125.0, 205.0, 231.0, 126.0, 74.0, 29.0, 20.0, 12.0, 10.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04736328125, -0.04578733444213867, -0.044211387634277344, -0.042635440826416016, -0.04105949401855469, -0.03948354721069336, -0.03790760040283203, -0.0363316535949707, -0.034755706787109375, -0.03317975997924805, -0.03160381317138672, -0.03002786636352539, -0.028451919555664062, -0.026875972747802734, -0.025300025939941406, -0.023724079132080078, -0.02214813232421875, -0.020572185516357422, -0.018996238708496094, -0.017420291900634766, -0.015844345092773438, -0.01426839828491211, -0.012692451477050781, -0.011116504669189453, -0.009540557861328125, -0.007964611053466797, -0.006388664245605469, -0.004812717437744141, -0.0032367706298828125, -0.0016608238220214844, -8.487701416015625e-05, 0.0014910697937011719, 0.0030670166015625, 0.004642963409423828, 0.006218910217285156, 0.007794857025146484, 0.009370803833007812, 0.01094675064086914, 0.012522697448730469, 0.014098644256591797, 0.015674591064453125, 0.017250537872314453, 0.01882648468017578, 0.02040243148803711, 0.021978378295898438, 0.023554325103759766, 0.025130271911621094, 0.026706218719482422, 0.02828216552734375, 0.029858112335205078, 0.031434059143066406, 0.033010005950927734, 0.03458595275878906, 0.03616189956665039, 0.03773784637451172, 0.03931379318237305, 0.040889739990234375, 0.0424656867980957, 0.04404163360595703, 0.04561758041381836, 0.04719352722167969, 0.048769474029541016, 0.050345420837402344, 0.05192136764526367, 0.053497314453125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 3.0, 7.0, 8.0, 9.0, 5.0, 11.0, 16.0, 17.0, 22.0, 27.0, 20.0, 40.0, 30.0, 47.0, 46.0, 43.0, 54.0, 56.0, 56.0, 61.0, 60.0, 43.0, 48.0, 39.0, 34.0, 47.0, 22.0, 29.0, 22.0, 23.0, 12.0, 14.0, 9.0, 6.0, 6.0, 4.0, 7.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3248569071292877, -0.3130475878715515, -0.3012382388114929, -0.2894289195537567, -0.2776196002960205, -0.2658102512359619, -0.2540009319782257, -0.2421916127204895, -0.2303822785615921, -0.2185729444026947, -0.2067636251449585, -0.1949542909860611, -0.1831449568271637, -0.1713356375694275, -0.1595263034105301, -0.1477169692516327, -0.13590764999389648, -0.12409832328557968, -0.11228899657726288, -0.10047966241836548, -0.08867033571004868, -0.07686100900173187, -0.06505167484283447, -0.05324234813451767, -0.04143302142620087, -0.029623692855238914, -0.017814364284276962, -0.006005033850669861, 0.005804292857646942, 0.017613619565963745, 0.029422953724861145, 0.04123228043317795, 0.05304163694381714, 0.06485096365213394, 0.07666029036045074, 0.08846962451934814, 0.10027895122766495, 0.11208827793598175, 0.12389761209487915, 0.13570693135261536, 0.14751626551151276, 0.15932559967041016, 0.17113491892814636, 0.18294425308704376, 0.19475358724594116, 0.20656290650367737, 0.21837224066257477, 0.23018157482147217, 0.24199089407920837, 0.2538002133369446, 0.2656095623970032, 0.2774188816547394, 0.2892282009124756, 0.3010375499725342, 0.3128468692302704, 0.3246561884880066, 0.3364655375480652, 0.3482748568058014, 0.36008420586586, 0.3718935251235962, 0.3837028443813324, 0.3955121636390686, 0.4073215126991272, 0.4191308319568634, 0.4309401512145996]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 6.0, 6.0, 11.0, 18.0, 4.0, 18.0, 21.0, 24.0, 22.0, 37.0, 32.0, 34.0, 33.0, 34.0, 38.0, 40.0, 48.0, 41.0, 51.0, 40.0, 39.0, 43.0, 30.0, 49.0, 30.0, 35.0, 27.0, 24.0, 28.0, 27.0, 16.0, 15.0, 13.0, 22.0, 10.0, 6.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3110934793949127, -0.30085837841033936, -0.290623277425766, -0.2803881764411926, -0.27015310525894165, -0.2599180042743683, -0.24968290328979492, -0.23944780230522156, -0.2292127013206482, -0.21897760033607483, -0.20874249935150146, -0.1985074132680893, -0.18827231228351593, -0.17803721129894257, -0.1678021252155304, -0.15756702423095703, -0.14733192324638367, -0.1370968222618103, -0.12686172127723694, -0.11662663519382477, -0.1063915342092514, -0.09615643322467804, -0.08592133969068527, -0.0756862461566925, -0.06545114517211914, -0.055216047912836075, -0.04498095065355301, -0.03474585339426994, -0.024510756134986877, -0.014275658875703812, -0.004040561616420746, 0.0061945319175720215, 0.016429632902145386, 0.02666473016142845, 0.03689982742071152, 0.04713492467999458, 0.05737002193927765, 0.06760512292385101, 0.07784021645784378, 0.08807530999183655, 0.09831041097640991, 0.10854551196098328, 0.11878060549497604, 0.1290156990289688, 0.13925080001354218, 0.14948590099811554, 0.1597209870815277, 0.16995608806610107, 0.18019118905067444, 0.1904262900352478, 0.20066139101982117, 0.21089647710323334, 0.2211315780878067, 0.23136667907238007, 0.24160176515579224, 0.2518368661403656, 0.26207196712493896, 0.27230706810951233, 0.2825421690940857, 0.29277727007865906, 0.3030123710632324, 0.3132474422454834, 0.32348254323005676, 0.3337176442146301, 0.3439527451992035]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 6.0, 5.0, 12.0, 13.0, 22.0, 34.0, 51.0, 62.0, 104.0, 153.0, 233.0, 356.0, 616.0, 1088.0, 1948.0, 3623.0, 7025.0, 14062.0, 28313.0, 60672.0, 144017.0, 325111.0, 261724.0, 106414.0, 47033.0, 22263.0, 11019.0, 5632.0, 2904.0, 1682.0, 907.0, 550.0, 305.0, 197.0, 132.0, 97.0, 50.0, 41.0, 26.0, 13.0, 15.0, 6.0, 4.0, 6.0, 6.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.462646484375, -0.4471397399902344, -0.43163299560546875, -0.4161262512207031, -0.4006195068359375, -0.3851127624511719, -0.36960601806640625, -0.3540992736816406, -0.338592529296875, -0.3230857849121094, -0.30757904052734375, -0.2920722961425781, -0.2765655517578125, -0.2610588073730469, -0.24555206298828125, -0.23004531860351562, -0.21453857421875, -0.19903182983398438, -0.18352508544921875, -0.16801834106445312, -0.1525115966796875, -0.13700485229492188, -0.12149810791015625, -0.10599136352539062, -0.090484619140625, -0.07497787475585938, -0.05947113037109375, -0.043964385986328125, -0.0284576416015625, -0.012950897216796875, 0.00255584716796875, 0.018062591552734375, 0.0335693359375, 0.049076080322265625, 0.06458282470703125, 0.08008956909179688, 0.0955963134765625, 0.11110305786132812, 0.12660980224609375, 0.14211654663085938, 0.157623291015625, 0.17313003540039062, 0.18863677978515625, 0.20414352416992188, 0.2196502685546875, 0.23515701293945312, 0.25066375732421875, 0.2661705017089844, 0.28167724609375, 0.2971839904785156, 0.31269073486328125, 0.3281974792480469, 0.3437042236328125, 0.3592109680175781, 0.37471771240234375, 0.3902244567871094, 0.405731201171875, 0.4212379455566406, 0.43674468994140625, 0.4522514343261719, 0.4677581787109375, 0.4832649230957031, 0.49877166748046875, 0.5142784118652344, 0.52978515625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 7.0, 10.0, 10.0, 8.0, 13.0, 12.0, 18.0, 19.0, 18.0, 28.0, 25.0, 30.0, 23.0, 28.0, 33.0, 42.0, 43.0, 45.0, 49.0, 32.0, 27.0, 34.0, 34.0, 33.0, 35.0, 34.0, 28.0, 31.0, 29.0, 26.0, 27.0, 20.0, 20.0, 25.0, 24.0, 11.0, 19.0, 8.0, 10.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.49560546875, -0.4803123474121094, -0.46501922607421875, -0.4497261047363281, -0.4344329833984375, -0.4191398620605469, -0.40384674072265625, -0.3885536193847656, -0.373260498046875, -0.3579673767089844, -0.34267425537109375, -0.3273811340332031, -0.3120880126953125, -0.2967948913574219, -0.28150177001953125, -0.2662086486816406, -0.25091552734375, -0.23562240600585938, -0.22032928466796875, -0.20503616333007812, -0.1897430419921875, -0.17444992065429688, -0.15915679931640625, -0.14386367797851562, -0.128570556640625, -0.11327743530273438, -0.09798431396484375, -0.08269119262695312, -0.0673980712890625, -0.052104949951171875, -0.03681182861328125, -0.021518707275390625, -0.0062255859375, 0.009067535400390625, 0.02436065673828125, 0.039653778076171875, 0.0549468994140625, 0.07024002075195312, 0.08553314208984375, 0.10082626342773438, 0.116119384765625, 0.13141250610351562, 0.14670562744140625, 0.16199874877929688, 0.1772918701171875, 0.19258499145507812, 0.20787811279296875, 0.22317123413085938, 0.23846435546875, 0.2537574768066406, 0.26905059814453125, 0.2843437194824219, 0.2996368408203125, 0.3149299621582031, 0.33022308349609375, 0.3455162048339844, 0.360809326171875, 0.3761024475097656, 0.39139556884765625, 0.4066886901855469, 0.4219818115234375, 0.4372749328613281, 0.45256805419921875, 0.4678611755371094, 0.483154296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 9.0, 17.0, 17.0, 18.0, 32.0, 39.0, 55.0, 99.0, 167.0, 241.0, 457.0, 863.0, 1556.0, 2981.0, 6130.0, 12308.0, 25681.0, 54885.0, 133071.0, 321867.0, 284134.0, 111797.0, 47610.0, 22431.0, 10787.0, 5326.0, 2727.0, 1398.0, 731.0, 404.0, 258.0, 158.0, 101.0, 68.0, 37.0, 34.0, 13.0, 17.0, 9.0, 7.0, 6.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429443359375, -0.4150848388671875, -0.400726318359375, -0.3863677978515625, -0.37200927734375, -0.3576507568359375, -0.343292236328125, -0.3289337158203125, -0.3145751953125, -0.3002166748046875, -0.285858154296875, -0.2714996337890625, -0.25714111328125, -0.2427825927734375, -0.228424072265625, -0.2140655517578125, -0.19970703125, -0.1853485107421875, -0.170989990234375, -0.1566314697265625, -0.14227294921875, -0.1279144287109375, -0.113555908203125, -0.0991973876953125, -0.0848388671875, -0.0704803466796875, -0.056121826171875, -0.0417633056640625, -0.02740478515625, -0.0130462646484375, 0.001312255859375, 0.0156707763671875, 0.030029296875, 0.0443878173828125, 0.058746337890625, 0.0731048583984375, 0.08746337890625, 0.1018218994140625, 0.116180419921875, 0.1305389404296875, 0.1448974609375, 0.1592559814453125, 0.173614501953125, 0.1879730224609375, 0.20233154296875, 0.2166900634765625, 0.231048583984375, 0.2454071044921875, 0.259765625, 0.2741241455078125, 0.288482666015625, 0.3028411865234375, 0.31719970703125, 0.3315582275390625, 0.345916748046875, 0.3602752685546875, 0.3746337890625, 0.3889923095703125, 0.403350830078125, 0.4177093505859375, 0.43206787109375, 0.4464263916015625, 0.460784912109375, 0.4751434326171875, 0.489501953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 5.0, 14.0, 13.0, 17.0, 13.0, 16.0, 15.0, 19.0, 34.0, 33.0, 40.0, 42.0, 40.0, 40.0, 44.0, 48.0, 49.0, 36.0, 49.0, 40.0, 36.0, 41.0, 40.0, 34.0, 39.0, 27.0, 26.0, 22.0, 14.0, 23.0, 12.0, 15.0, 12.0, 4.0, 9.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.712890625, -0.6923675537109375, -0.671844482421875, -0.6513214111328125, -0.63079833984375, -0.6102752685546875, -0.589752197265625, -0.5692291259765625, -0.5487060546875, -0.5281829833984375, -0.507659912109375, -0.4871368408203125, -0.46661376953125, -0.4460906982421875, -0.425567626953125, -0.4050445556640625, -0.384521484375, -0.3639984130859375, -0.343475341796875, -0.3229522705078125, -0.30242919921875, -0.2819061279296875, -0.261383056640625, -0.2408599853515625, -0.2203369140625, -0.1998138427734375, -0.179290771484375, -0.1587677001953125, -0.13824462890625, -0.1177215576171875, -0.097198486328125, -0.0766754150390625, -0.05615234375, -0.0356292724609375, -0.015106201171875, 0.0054168701171875, 0.02593994140625, 0.0464630126953125, 0.066986083984375, 0.0875091552734375, 0.1080322265625, 0.1285552978515625, 0.149078369140625, 0.1696014404296875, 0.19012451171875, 0.2106475830078125, 0.231170654296875, 0.2516937255859375, 0.272216796875, 0.2927398681640625, 0.313262939453125, 0.3337860107421875, 0.35430908203125, 0.3748321533203125, 0.395355224609375, 0.4158782958984375, 0.4364013671875, 0.4569244384765625, 0.477447509765625, 0.4979705810546875, 0.51849365234375, 0.5390167236328125, 0.559539794921875, 0.5800628662109375, 0.6005859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 8.0, 4.0, 17.0, 19.0, 26.0, 33.0, 48.0, 64.0, 105.0, 133.0, 185.0, 277.0, 380.0, 573.0, 849.0, 1413.0, 2129.0, 3775.0, 7213.0, 14974.0, 34494.0, 83083.0, 196522.0, 351970.0, 198539.0, 84085.0, 34738.0, 15350.0, 7365.0, 3868.0, 2181.0, 1306.0, 882.0, 573.0, 393.0, 261.0, 187.0, 142.0, 103.0, 74.0, 62.0, 33.0, 34.0, 29.0, 20.0, 8.0, 11.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.11285400390625, -0.10915470123291016, -0.10545539855957031, -0.10175609588623047, -0.09805679321289062, -0.09435749053955078, -0.09065818786621094, -0.0869588851928711, -0.08325958251953125, -0.0795602798461914, -0.07586097717285156, -0.07216167449951172, -0.06846237182617188, -0.06476306915283203, -0.06106376647949219, -0.057364463806152344, -0.0536651611328125, -0.049965858459472656, -0.04626655578613281, -0.04256725311279297, -0.038867950439453125, -0.03516864776611328, -0.03146934509277344, -0.027770042419433594, -0.02407073974609375, -0.020371437072753906, -0.016672134399414062, -0.012972831726074219, -0.009273529052734375, -0.005574226379394531, -0.0018749237060546875, 0.0018243789672851562, 0.005523681640625, 0.009222984313964844, 0.012922286987304688, 0.01662158966064453, 0.020320892333984375, 0.02402019500732422, 0.027719497680664062, 0.031418800354003906, 0.03511810302734375, 0.038817405700683594, 0.04251670837402344, 0.04621601104736328, 0.049915313720703125, 0.05361461639404297, 0.05731391906738281, 0.061013221740722656, 0.0647125244140625, 0.06841182708740234, 0.07211112976074219, 0.07581043243408203, 0.07950973510742188, 0.08320903778076172, 0.08690834045410156, 0.0906076431274414, 0.09430694580078125, 0.0980062484741211, 0.10170555114746094, 0.10540485382080078, 0.10910415649414062, 0.11280345916748047, 0.11650276184082031, 0.12020206451416016, 0.1239013671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 6.0, 8.0, 8.0, 15.0, 27.0, 37.0, 47.0, 56.0, 73.0, 92.0, 94.0, 155.0, 89.0, 65.0, 61.0, 47.0, 38.0, 28.0, 16.0, 9.0, 9.0, 8.0, 3.0, 2.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6253204345703125e-05, -4.497729241847992e-05, -4.3701380491256714e-05, -4.242546856403351e-05, -4.11495566368103e-05, -3.98736447095871e-05, -3.859773278236389e-05, -3.7321820855140686e-05, -3.604590892791748e-05, -3.4769997000694275e-05, -3.349408507347107e-05, -3.2218173146247864e-05, -3.094226121902466e-05, -2.9666349291801453e-05, -2.8390437364578247e-05, -2.711452543735504e-05, -2.5838613510131836e-05, -2.456270158290863e-05, -2.3286789655685425e-05, -2.201087772846222e-05, -2.0734965801239014e-05, -1.9459053874015808e-05, -1.8183141946792603e-05, -1.6907230019569397e-05, -1.563131809234619e-05, -1.4355406165122986e-05, -1.307949423789978e-05, -1.1803582310676575e-05, -1.0527670383453369e-05, -9.251758456230164e-06, -7.975846529006958e-06, -6.6999346017837524e-06, -5.424022674560547e-06, -4.148110747337341e-06, -2.8721988201141357e-06, -1.5962868928909302e-06, -3.203749656677246e-07, 9.55536961555481e-07, 2.2314488887786865e-06, 3.507360816001892e-06, 4.783272743225098e-06, 6.059184670448303e-06, 7.335096597671509e-06, 8.611008524894714e-06, 9.88692045211792e-06, 1.1162832379341125e-05, 1.2438744306564331e-05, 1.3714656233787537e-05, 1.4990568161010742e-05, 1.6266480088233948e-05, 1.7542392015457153e-05, 1.881830394268036e-05, 2.0094215869903564e-05, 2.137012779712677e-05, 2.2646039724349976e-05, 2.392195165157318e-05, 2.5197863578796387e-05, 2.6473775506019592e-05, 2.7749687433242798e-05, 2.9025599360466003e-05, 3.030151128768921e-05, 3.1577423214912415e-05, 3.285333514213562e-05, 3.4129247069358826e-05, 3.540515899658203e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 8.0, 14.0, 10.0, 14.0, 18.0, 29.0, 33.0, 53.0, 71.0, 82.0, 103.0, 138.0, 233.0, 324.0, 490.0, 748.0, 1211.0, 2016.0, 3773.0, 7365.0, 16647.0, 43263.0, 125332.0, 373222.0, 304338.0, 103510.0, 36169.0, 14399.0, 6426.0, 3353.0, 1843.0, 1127.0, 655.0, 472.0, 310.0, 218.0, 156.0, 117.0, 61.0, 51.0, 41.0, 24.0, 27.0, 17.0, 11.0, 16.0, 2.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.1539306640625, -0.14878463745117188, -0.14363861083984375, -0.13849258422851562, -0.1333465576171875, -0.12820053100585938, -0.12305450439453125, -0.11790847778320312, -0.112762451171875, -0.10761642456054688, -0.10247039794921875, -0.09732437133789062, -0.0921783447265625, -0.08703231811523438, -0.08188629150390625, -0.07674026489257812, -0.07159423828125, -0.06644821166992188, -0.06130218505859375, -0.056156158447265625, -0.0510101318359375, -0.045864105224609375, -0.04071807861328125, -0.035572052001953125, -0.030426025390625, -0.025279998779296875, -0.02013397216796875, -0.014987945556640625, -0.0098419189453125, -0.004695892333984375, 0.00045013427734375, 0.005596160888671875, 0.0107421875, 0.015888214111328125, 0.02103424072265625, 0.026180267333984375, 0.0313262939453125, 0.036472320556640625, 0.04161834716796875, 0.046764373779296875, 0.051910400390625, 0.057056427001953125, 0.06220245361328125, 0.06734848022460938, 0.0724945068359375, 0.07764053344726562, 0.08278656005859375, 0.08793258666992188, 0.09307861328125, 0.09822463989257812, 0.10337066650390625, 0.10851669311523438, 0.1136627197265625, 0.11880874633789062, 0.12395477294921875, 0.12910079956054688, 0.134246826171875, 0.13939285278320312, 0.14453887939453125, 0.14968490600585938, 0.1548309326171875, 0.15997695922851562, 0.16512298583984375, 0.17026901245117188, 0.1754150390625]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 5.0, 16.0, 20.0, 21.0, 22.0, 30.0, 60.0, 66.0, 100.0, 112.0, 100.0, 94.0, 92.0, 63.0, 53.0, 32.0, 27.0, 24.0, 20.0, 10.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1356201171875, -0.1317605972290039, -0.1279010772705078, -0.12404155731201172, -0.12018203735351562, -0.11632251739501953, -0.11246299743652344, -0.10860347747802734, -0.10474395751953125, -0.10088443756103516, -0.09702491760253906, -0.09316539764404297, -0.08930587768554688, -0.08544635772705078, -0.08158683776855469, -0.0777273178100586, -0.0738677978515625, -0.0700082778930664, -0.06614875793457031, -0.06228923797607422, -0.058429718017578125, -0.05457019805908203, -0.05071067810058594, -0.046851158142089844, -0.04299163818359375, -0.039132118225097656, -0.03527259826660156, -0.03141307830810547, -0.027553558349609375, -0.02369403839111328, -0.019834518432617188, -0.015974998474121094, -0.012115478515625, -0.008255958557128906, -0.0043964385986328125, -0.0005369186401367188, 0.003322601318359375, 0.007182121276855469, 0.011041641235351562, 0.014901161193847656, 0.01876068115234375, 0.022620201110839844, 0.026479721069335938, 0.03033924102783203, 0.034198760986328125, 0.03805828094482422, 0.04191780090332031, 0.045777320861816406, 0.0496368408203125, 0.053496360778808594, 0.05735588073730469, 0.06121540069580078, 0.06507492065429688, 0.06893444061279297, 0.07279396057128906, 0.07665348052978516, 0.08051300048828125, 0.08437252044677734, 0.08823204040527344, 0.09209156036376953, 0.09595108032226562, 0.09981060028076172, 0.10367012023925781, 0.1075296401977539, 0.11138916015625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 9.0, 13.0, 27.0, 75.0, 102.0, 138.0, 163.0, 172.0, 111.0, 98.0, 56.0, 18.0, 9.0, 5.0, 5.0], "bins": [-4.051299095153809, -3.978719711303711, -3.9061403274536133, -3.8335609436035156, -3.760981798171997, -3.6884024143218994, -3.6158230304718018, -3.543243646621704, -3.4706642627716064, -3.398084878921509, -3.325505495071411, -3.2529263496398926, -3.180346965789795, -3.1077675819396973, -3.0351881980895996, -2.962608814239502, -2.8900294303894043, -2.8174500465393066, -2.744870662689209, -2.6722912788391113, -2.5997121334075928, -2.527132749557495, -2.4545533657073975, -2.3819739818573, -2.3093948364257812, -2.2368154525756836, -2.164236068725586, -2.0916566848754883, -2.0190775394439697, -1.946498155593872, -1.8739187717437744, -1.8013393878936768, -1.7287598848342896, -1.656180500984192, -1.5836012363433838, -1.5110218524932861, -1.4384424686431885, -1.3658630847930908, -1.2932838201522827, -1.220704436302185, -1.148125171661377, -1.0755457878112793, -1.0029665231704712, -0.9303871393203735, -0.8578077554702759, -0.785228431224823, -0.7126491069793701, -0.6400697231292725, -0.5674903392791748, -0.49491098523139954, -0.42233163118362427, -0.3497523069381714, -0.2771729528903961, -0.20459359884262085, -0.13201427459716797, -0.05943489074707031, 0.013144433498382568, 0.08572378009557724, 0.1583031266927719, 0.230882465839386, 0.30346181988716125, 0.3760411739349365, 0.4486204981803894, 0.5211998820304871, 0.5937792062759399]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 8.0, 5.0, 4.0, 12.0, 13.0, 13.0, 11.0, 15.0, 15.0, 16.0, 27.0, 29.0, 18.0, 31.0, 31.0, 26.0, 38.0, 24.0, 49.0, 47.0, 36.0, 46.0, 40.0, 34.0, 35.0, 38.0, 30.0, 39.0, 32.0, 23.0, 20.0, 24.0, 24.0, 14.0, 20.0, 21.0, 12.0, 16.0, 8.0, 6.0, 10.0, 9.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9332066178321838, -0.9024879932403564, -0.871769368648529, -0.8410507440567017, -0.810332179069519, -0.7796135544776917, -0.7488949298858643, -0.7181763052940369, -0.6874576807022095, -0.6567390561103821, -0.6260204315185547, -0.5953018665313721, -0.5645832419395447, -0.5338646173477173, -0.5031459927558899, -0.4724273681640625, -0.4417088031768799, -0.4109901785850525, -0.3802715837955475, -0.3495529592037201, -0.3188343644142151, -0.2881157398223877, -0.2573971152305603, -0.2266785055398941, -0.1959598958492279, -0.1652412861585617, -0.1345226764678955, -0.10380405187606812, -0.07308544218540192, -0.04236683249473572, -0.011648207902908325, 0.019070401787757874, 0.04978907108306885, 0.08050768077373505, 0.11122629791498184, 0.14194491505622864, 0.17266352474689484, 0.20338213443756104, 0.23410075902938843, 0.2648193836212158, 0.2955379784107208, 0.3262566030025482, 0.3569751977920532, 0.3876938223838806, 0.418412446975708, 0.449131041765213, 0.4798496663570404, 0.5105682611465454, 0.5412868857383728, 0.5720055103302002, 0.6027241349220276, 0.633442759513855, 0.6641613245010376, 0.694879949092865, 0.7255985736846924, 0.7563171982765198, 0.7870358228683472, 0.8177544474601746, 0.848473072052002, 0.8791916370391846, 0.909910261631012, 0.9406288862228394, 0.9713475108146667, 1.0020661354064941, 1.0327847003936768]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 7.0, 11.0, 20.0, 23.0, 28.0, 49.0, 63.0, 65.0, 102.0, 99.0, 163.0, 208.0, 328.0, 390.0, 505.0, 650.0, 895.0, 1175.0, 1491.0, 1922.0, 2592.0, 1029615.0, 2434.0, 1734.0, 1405.0, 1140.0, 851.0, 660.0, 485.0, 385.0, 289.0, 197.0, 155.0, 109.0, 91.0, 57.0, 46.0, 44.0, 25.0, 32.0, 21.0, 15.0, 4.0, 2.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.151054859161377, -1.1155321598052979, -1.0800094604492188, -1.0444868803024292, -1.00896418094635, -0.973441481590271, -0.9379187822341919, -0.9023960828781128, -0.8668734431266785, -0.8313507437705994, -0.795828104019165, -0.7603054046630859, -0.7247827053070068, -0.6892600655555725, -0.6537373661994934, -0.6182147264480591, -0.58269202709198, -0.5471693277359009, -0.5116466879844666, -0.47612398862838745, -0.44060131907463074, -0.405078649520874, -0.3695559501647949, -0.3340332806110382, -0.2985106110572815, -0.2629879415035248, -0.22746525704860687, -0.19194257259368896, -0.15641990303993225, -0.12089723348617554, -0.08537454903125763, -0.04985186457633972, -0.014329195022583008, 0.021193481981754303, 0.056716158986091614, 0.09223883599042892, 0.12776151299476624, 0.16328418254852295, 0.19880686700344086, 0.23432955145835876, 0.2698522210121155, 0.3053748905658722, 0.3408975601196289, 0.376420259475708, 0.4119429290294647, 0.44746559858322144, 0.48298829793930054, 0.5185109376907349, 0.554033637046814, 0.5895563364028931, 0.6250789761543274, 0.6606016755104065, 0.6961243152618408, 0.7316470146179199, 0.767169713973999, 0.8026924133300781, 0.8382150530815125, 0.8737377524375916, 0.9092603921890259, 0.944783091545105, 0.9803057909011841, 1.0158283710479736, 1.0513510704040527, 1.0868737697601318, 1.122396469116211]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 31.0, 35.0, 78.0, 195.0, 662.0, 2465.0, 8649.0, 50994484.0, 451780.0, 9638.0, 2746.0, 757.0, 240.0, 85.0, 31.0, 21.0, 17.0, 6.0, 1.0, 4.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.04296875, -6.800079345703125, -6.557189464569092, -6.314300060272217, -6.071410655975342, -5.828520774841309, -5.585631370544434, -5.342741966247559, -5.099852085113525, -4.85696268081665, -4.614072799682617, -4.371183395385742, -4.128293991088867, -3.885404109954834, -3.642514705657959, -3.399625062942505, -3.15673565864563, -2.913846015930176, -2.670956611633301, -2.4280669689178467, -2.1851773262023926, -1.942287802696228, -1.6993982791900635, -1.4565086364746094, -1.2136191129684448, -0.9707295298576355, -0.7278399467468262, -0.4849504232406616, -0.2420608401298523, 0.0008287429809570312, 0.24371826648712158, 0.4866079092025757, 0.7294974327087402, 0.9723870158195496, 1.2152765989303589, 1.4581661224365234, 1.7010557651519775, 1.943945288658142, 2.1868348121643066, 2.4297244548797607, 2.672614097595215, 2.915503740310669, 3.158393144607544, 3.401282787322998, 3.644172430038452, 3.8870620727539062, 4.129951477050781, 4.372840881347656, 4.615730285644531, 4.858619689941406, 5.1015095710754395, 5.3443989753723145, 5.5872883796691895, 5.830178260803223, 6.073067665100098, 6.315957069396973, 6.558846950531006, 6.801736354827881, 7.044626235961914, 7.287515640258789, 7.530405044555664, 7.773294925689697, 8.016183853149414, 8.259074211120605, 8.50196361541748]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 9.0, 13.0, 15.0, 25.0, 32.0, 53.0, 93.0, 121.0, 180.0, 308.0, 446.0, 717.0, 1189.0, 1963.0, 3487.0, 6444.0, 12033.0, 23853.0, 50988.0, 114654.0, 268835.0, 622315.0, 3558346.0, 971603.0, 364178.0, 156218.0, 67799.0, 31537.0, 15367.0, 8038.0, 4405.0, 2446.0, 1491.0, 849.0, 474.0, 304.0, 191.0, 141.0, 87.0, 44.0, 47.0, 36.0, 23.0, 16.0, 7.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.56591796875, -0.5485992431640625, -0.531280517578125, -0.5139617919921875, -0.49664306640625, -0.4793243408203125, -0.462005615234375, -0.4446868896484375, -0.4273681640625, -0.4100494384765625, -0.392730712890625, -0.3754119873046875, -0.35809326171875, -0.3407745361328125, -0.323455810546875, -0.3061370849609375, -0.288818359375, -0.2714996337890625, -0.254180908203125, -0.2368621826171875, -0.21954345703125, -0.2022247314453125, -0.184906005859375, -0.1675872802734375, -0.1502685546875, -0.1329498291015625, -0.115631103515625, -0.0983123779296875, -0.08099365234375, -0.0636749267578125, -0.046356201171875, -0.0290374755859375, -0.01171875, 0.0055999755859375, 0.022918701171875, 0.0402374267578125, 0.05755615234375, 0.0748748779296875, 0.092193603515625, 0.1095123291015625, 0.1268310546875, 0.1441497802734375, 0.161468505859375, 0.1787872314453125, 0.19610595703125, 0.2134246826171875, 0.230743408203125, 0.2480621337890625, 0.265380859375, 0.2826995849609375, 0.300018310546875, 0.3173370361328125, 0.33465576171875, 0.3519744873046875, 0.369293212890625, 0.3866119384765625, 0.4039306640625, 0.4212493896484375, 0.438568115234375, 0.4558868408203125, 0.47320556640625, 0.4905242919921875, 0.507843017578125, 0.5251617431640625, 0.54248046875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 4.0, 8.0, 10.0, 11.0, 4.0, 10.0, 13.0, 12.0, 15.0, 21.0, 19.0, 29.0, 15.0, 32.0, 47.0, 48.0, 41.0, 44.0, 38.0, 40.0, 115.0, 688.0, 334.0, 52.0, 41.0, 29.0, 31.0, 34.0, 24.0, 24.0, 24.0, 27.0, 20.0, 20.0, 13.0, 9.0, 16.0, 10.0, 9.0, 6.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0], "bins": [-3.365234375, -3.2559814453125, -3.146728515625, -3.0374755859375, -2.92822265625, -2.8189697265625, -2.709716796875, -2.6004638671875, -2.4912109375, -2.3819580078125, -2.272705078125, -2.1634521484375, -2.05419921875, -1.9449462890625, -1.835693359375, -1.7264404296875, -1.6171875, -1.5079345703125, -1.398681640625, -1.2894287109375, -1.18017578125, -1.0709228515625, -0.961669921875, -0.8524169921875, -0.7431640625, -0.6339111328125, -0.524658203125, -0.4154052734375, -0.30615234375, -0.1968994140625, -0.087646484375, 0.0216064453125, 0.130859375, 0.2401123046875, 0.349365234375, 0.4586181640625, 0.56787109375, 0.6771240234375, 0.786376953125, 0.8956298828125, 1.0048828125, 1.1141357421875, 1.223388671875, 1.3326416015625, 1.44189453125, 1.5511474609375, 1.660400390625, 1.7696533203125, 1.87890625, 1.9881591796875, 2.097412109375, 2.2066650390625, 2.31591796875, 2.4251708984375, 2.534423828125, 2.6436767578125, 2.7529296875, 2.8621826171875, 2.971435546875, 3.0806884765625, 3.18994140625, 3.2991943359375, 3.408447265625, 3.5177001953125, 3.626953125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 5.0, 14.0, 9.0, 34.0, 43.0, 69.0, 105.0, 191.0, 269.0, 444.0, 728.0, 1277.0, 2175.0, 3941.0, 7023.0, 12490.0, 23143.0, 42574.0, 77505.0, 138442.0, 231078.0, 352580.0, 687290.0, 3264290.0, 591421.0, 341385.0, 220591.0, 130501.0, 73416.0, 39938.0, 21599.0, 11735.0, 6491.0, 3567.0, 2074.0, 1199.0, 706.0, 470.0, 246.0, 132.0, 86.0, 54.0, 52.0, 25.0, 10.0, 7.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2678680419921875, -0.259613037109375, -0.2513580322265625, -0.24310302734375, -0.2348480224609375, -0.226593017578125, -0.2183380126953125, -0.2100830078125, -0.2018280029296875, -0.193572998046875, -0.1853179931640625, -0.17706298828125, -0.1688079833984375, -0.160552978515625, -0.1522979736328125, -0.14404296875, -0.1357879638671875, -0.127532958984375, -0.1192779541015625, -0.11102294921875, -0.1027679443359375, -0.094512939453125, -0.0862579345703125, -0.0780029296875, -0.0697479248046875, -0.061492919921875, -0.0532379150390625, -0.04498291015625, -0.0367279052734375, -0.028472900390625, -0.0202178955078125, -0.011962890625, -0.0037078857421875, 0.004547119140625, 0.0128021240234375, 0.02105712890625, 0.0293121337890625, 0.037567138671875, 0.0458221435546875, 0.0540771484375, 0.0623321533203125, 0.070587158203125, 0.0788421630859375, 0.08709716796875, 0.0953521728515625, 0.103607177734375, 0.1118621826171875, 0.1201171875, 0.1283721923828125, 0.136627197265625, 0.1448822021484375, 0.15313720703125, 0.1613922119140625, 0.169647216796875, 0.1779022216796875, 0.1861572265625, 0.1944122314453125, 0.202667236328125, 0.2109222412109375, 0.21917724609375, 0.2274322509765625, 0.235687255859375, 0.2439422607421875, 0.252197265625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 9.0, 7.0, 11.0, 8.0, 10.0, 17.0, 17.0, 19.0, 21.0, 15.0, 25.0, 28.0, 27.0, 37.0, 39.0, 37.0, 34.0, 45.0, 36.0, 117.0, 776.0, 221.0, 38.0, 31.0, 40.0, 36.0, 29.0, 40.0, 38.0, 27.0, 20.0, 22.0, 19.0, 19.0, 17.0, 12.0, 9.0, 16.0, 8.0, 5.0, 4.0, 11.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.517578125, -2.43548583984375, -2.3533935546875, -2.27130126953125, -2.189208984375, -2.10711669921875, -2.0250244140625, -1.94293212890625, -1.86083984375, -1.77874755859375, -1.6966552734375, -1.61456298828125, -1.532470703125, -1.45037841796875, -1.3682861328125, -1.28619384765625, -1.2041015625, -1.12200927734375, -1.0399169921875, -0.95782470703125, -0.875732421875, -0.79364013671875, -0.7115478515625, -0.62945556640625, -0.54736328125, -0.46527099609375, -0.3831787109375, -0.30108642578125, -0.218994140625, -0.13690185546875, -0.0548095703125, 0.02728271484375, 0.109375, 0.19146728515625, 0.2735595703125, 0.35565185546875, 0.437744140625, 0.51983642578125, 0.6019287109375, 0.68402099609375, 0.76611328125, 0.84820556640625, 0.9302978515625, 1.01239013671875, 1.094482421875, 1.17657470703125, 1.2586669921875, 1.34075927734375, 1.4228515625, 1.50494384765625, 1.5870361328125, 1.66912841796875, 1.751220703125, 1.83331298828125, 1.9154052734375, 1.99749755859375, 2.07958984375, 2.16168212890625, 2.2437744140625, 2.32586669921875, 2.407958984375, 2.49005126953125, 2.5721435546875, 2.65423583984375, 2.736328125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 3.0, 9.0, 12.0, 13.0, 28.0, 33.0, 46.0, 67.0, 105.0, 126.0, 189.0, 255.0, 389.0, 545.0, 849.0, 1295.0, 2237.0, 4187.0, 8484.0, 21105.0, 59181.0, 175502.0, 504076.0, 3786887.0, 1158659.0, 369409.0, 123925.0, 42069.0, 16072.0, 7046.0, 3395.0, 1824.0, 1161.0, 701.0, 465.0, 311.0, 230.0, 149.0, 96.0, 71.0, 53.0, 42.0, 37.0, 16.0, 14.0, 17.0, 13.0, 9.0, 9.0, 6.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.489990234375, -0.47460174560546875, -0.4592132568359375, -0.44382476806640625, -0.428436279296875, -0.41304779052734375, -0.3976593017578125, -0.38227081298828125, -0.36688232421875, -0.35149383544921875, -0.3361053466796875, -0.32071685791015625, -0.305328369140625, -0.28993988037109375, -0.2745513916015625, -0.25916290283203125, -0.2437744140625, -0.22838592529296875, -0.2129974365234375, -0.19760894775390625, -0.182220458984375, -0.16683197021484375, -0.1514434814453125, -0.13605499267578125, -0.12066650390625, -0.10527801513671875, -0.0898895263671875, -0.07450103759765625, -0.059112548828125, -0.04372406005859375, -0.0283355712890625, -0.01294708251953125, 0.00244140625, 0.01782989501953125, 0.0332183837890625, 0.04860687255859375, 0.063995361328125, 0.07938385009765625, 0.0947723388671875, 0.11016082763671875, 0.12554931640625, 0.14093780517578125, 0.1563262939453125, 0.17171478271484375, 0.187103271484375, 0.20249176025390625, 0.2178802490234375, 0.23326873779296875, 0.2486572265625, 0.26404571533203125, 0.2794342041015625, 0.29482269287109375, 0.310211181640625, 0.32559967041015625, 0.3409881591796875, 0.35637664794921875, 0.37176513671875, 0.38715362548828125, 0.4025421142578125, 0.41793060302734375, 0.433319091796875, 0.44870758056640625, 0.4640960693359375, 0.47948455810546875, 0.494873046875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 1.0, 3.0, 6.0, 8.0, 10.0, 7.0, 21.0, 10.0, 24.0, 17.0, 28.0, 28.0, 31.0, 30.0, 24.0, 41.0, 44.0, 40.0, 42.0, 48.0, 517.0, 583.0, 46.0, 52.0, 39.0, 36.0, 34.0, 36.0, 28.0, 31.0, 29.0, 20.0, 13.0, 17.0, 13.0, 18.0, 10.0, 5.0, 14.0, 6.0, 7.0, 0.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.412109375, -3.3118896484375, -3.211669921875, -3.1114501953125, -3.01123046875, -2.9110107421875, -2.810791015625, -2.7105712890625, -2.6103515625, -2.5101318359375, -2.409912109375, -2.3096923828125, -2.20947265625, -2.1092529296875, -2.009033203125, -1.9088134765625, -1.80859375, -1.7083740234375, -1.608154296875, -1.5079345703125, -1.40771484375, -1.3074951171875, -1.207275390625, -1.1070556640625, -1.0068359375, -0.9066162109375, -0.806396484375, -0.7061767578125, -0.60595703125, -0.5057373046875, -0.405517578125, -0.3052978515625, -0.205078125, -0.1048583984375, -0.004638671875, 0.0955810546875, 0.19580078125, 0.2960205078125, 0.396240234375, 0.4964599609375, 0.5966796875, 0.6968994140625, 0.797119140625, 0.8973388671875, 0.99755859375, 1.0977783203125, 1.197998046875, 1.2982177734375, 1.3984375, 1.4986572265625, 1.598876953125, 1.6990966796875, 1.79931640625, 1.8995361328125, 1.999755859375, 2.0999755859375, 2.2001953125, 2.3004150390625, 2.400634765625, 2.5008544921875, 2.60107421875, 2.7012939453125, 2.801513671875, 2.9017333984375, 3.001953125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 31.0, 141.0, 522.0, 237.0, 54.0, 13.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.47587966918945, -36.6895751953125, -35.90327072143555, -35.116966247558594, -34.33066177368164, -33.54435729980469, -32.758052825927734, -31.971750259399414, -31.18544578552246, -30.399141311645508, -29.612836837768555, -28.8265323638916, -28.04022979736328, -27.253925323486328, -26.467620849609375, -25.681316375732422, -24.89501190185547, -24.108707427978516, -23.322402954101562, -22.53609848022461, -21.749794006347656, -20.963491439819336, -20.177186965942383, -19.39088249206543, -18.604578018188477, -17.818273544311523, -17.03196907043457, -16.245664596557617, -15.45936107635498, -14.673056602478027, -13.88675308227539, -13.100448608398438, -12.314144134521484, -11.527839660644531, -10.741535186767578, -9.955231666564941, -9.168927192687988, -8.382622718811035, -7.59631872177124, -6.810014724731445, -6.023710250854492, -5.237405776977539, -4.451101779937744, -3.66479754447937, -2.878493309020996, -2.092189073562622, -1.305884838104248, -0.5195808410644531, 0.2667236328125, 1.053027868270874, 1.839332103729248, 2.625636339187622, 3.411940574645996, 4.198245048522949, 4.984549045562744, 5.770853042602539, 6.557157516479492, 7.343461990356445, 8.129766464233398, 8.916069984436035, 9.702374458312988, 10.488678932189941, 11.274982452392578, 12.061286926269531, 12.847591400146484]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 7.0, 4.0, 5.0, 4.0, 11.0, 11.0, 14.0, 9.0, 21.0, 31.0, 31.0, 22.0, 34.0, 30.0, 46.0, 52.0, 43.0, 51.0, 39.0, 54.0, 61.0, 41.0, 49.0, 43.0, 30.0, 41.0, 30.0, 33.0, 34.0, 22.0, 21.0, 20.0, 12.0, 6.0, 12.0, 5.0, 4.0, 8.0, 0.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.056772232055664, -10.739232063293457, -10.42169189453125, -10.104151725769043, -9.786611557006836, -9.469072341918945, -9.151532173156738, -8.833992004394531, -8.516451835632324, -8.198911666870117, -7.88137149810791, -7.563831806182861, -7.246291637420654, -6.928751468658447, -6.611211776733398, -6.293671607971191, -5.976131439208984, -5.658591270446777, -5.34105110168457, -5.0235114097595215, -4.7059712409973145, -4.388431072235107, -4.070891380310059, -3.7533512115478516, -3.4358110427856445, -3.1182708740234375, -2.8007309436798096, -2.4831910133361816, -2.1656508445739746, -1.8481107950210571, -1.5305707454681396, -1.2130308151245117, -0.8954906463623047, -0.5779505968093872, -0.2604105472564697, 0.057129502296447754, 0.37466955184936523, 0.6922096014022827, 1.0097496509552002, 1.3272895812988281, 1.6448297500610352, 1.9623697996139526, 2.27990984916687, 2.597449779510498, 2.914989948272705, 3.232530117034912, 3.55007004737854, 3.867609977722168, 4.185150146484375, 4.502690315246582, 4.820230484008789, 5.137770175933838, 5.455310344696045, 5.772850513458252, 6.090390205383301, 6.407930374145508, 6.725470542907715, 7.043010711669922, 7.360550880432129, 7.678090572357178, 7.995630741119385, 8.313170433044434, 8.63071060180664, 8.948250770568848, 9.265790939331055]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 9.0, 8.0, 13.0, 13.0, 27.0, 28.0, 47.0, 71.0, 69.0, 93.0, 172.0, 254.0, 459.0, 1174.0, 3298.0, 10203.0, 35861.0, 2030461.0, 2060579.0, 37284.0, 9002.0, 2863.0, 1097.0, 450.0, 251.0, 141.0, 111.0, 64.0, 55.0, 29.0, 22.0, 10.0, 17.0, 8.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.1927490234375, -0.1872425079345703, -0.18173599243164062, -0.17622947692871094, -0.17072296142578125, -0.16521644592285156, -0.15970993041992188, -0.1542034149169922, -0.1486968994140625, -0.1431903839111328, -0.13768386840820312, -0.13217735290527344, -0.12667083740234375, -0.12116432189941406, -0.11565780639648438, -0.11015129089355469, -0.104644775390625, -0.09913825988769531, -0.09363174438476562, -0.08812522888183594, -0.08261871337890625, -0.07711219787597656, -0.07160568237304688, -0.06609916687011719, -0.0605926513671875, -0.05508613586425781, -0.049579620361328125, -0.04407310485839844, -0.03856658935546875, -0.03306007385253906, -0.027553558349609375, -0.022047042846679688, -0.01654052734375, -0.011034011840820312, -0.005527496337890625, -2.09808349609375e-05, 0.00548553466796875, 0.010992050170898438, 0.016498565673828125, 0.022005081176757812, 0.0275115966796875, 0.03301811218261719, 0.038524627685546875, 0.04403114318847656, 0.04953765869140625, 0.05504417419433594, 0.060550689697265625, 0.06605720520019531, 0.071563720703125, 0.07707023620605469, 0.08257675170898438, 0.08808326721191406, 0.09358978271484375, 0.09909629821777344, 0.10460281372070312, 0.11010932922363281, 0.1156158447265625, 0.12112236022949219, 0.12662887573242188, 0.13213539123535156, 0.13764190673828125, 0.14314842224121094, 0.14865493774414062, 0.1541614532470703, 0.15966796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 8.0, 5.0, 7.0, 9.0, 20.0, 13.0, 14.0, 19.0, 21.0, 31.0, 42.0, 37.0, 35.0, 29.0, 49.0, 44.0, 38.0, 54.0, 69.0, 62.0, 62.0, 51.0, 43.0, 36.0, 38.0, 23.0, 24.0, 26.0, 19.0, 19.0, 19.0, 7.0, 5.0, 8.0, 1.0, 7.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.038330078125, -0.03719902038574219, -0.036067962646484375, -0.03493690490722656, -0.03380584716796875, -0.03267478942871094, -0.031543731689453125, -0.030412673950195312, -0.0292816162109375, -0.028150558471679688, -0.027019500732421875, -0.025888442993164062, -0.02475738525390625, -0.023626327514648438, -0.022495269775390625, -0.021364212036132812, -0.020233154296875, -0.019102096557617188, -0.017971038818359375, -0.016839981079101562, -0.01570892333984375, -0.014577865600585938, -0.013446807861328125, -0.012315750122070312, -0.0111846923828125, -0.010053634643554688, -0.008922576904296875, -0.0077915191650390625, -0.00666046142578125, -0.0055294036865234375, -0.004398345947265625, -0.0032672882080078125, -0.00213623046875, -0.0010051727294921875, 0.000125885009765625, 0.0012569427490234375, 0.00238800048828125, 0.0035190582275390625, 0.004650115966796875, 0.0057811737060546875, 0.0069122314453125, 0.008043289184570312, 0.009174346923828125, 0.010305404663085938, 0.01143646240234375, 0.012567520141601562, 0.013698577880859375, 0.014829635620117188, 0.015960693359375, 0.017091751098632812, 0.018222808837890625, 0.019353866577148438, 0.02048492431640625, 0.021615982055664062, 0.022747039794921875, 0.023878097534179688, 0.0250091552734375, 0.026140213012695312, 0.027271270751953125, 0.028402328491210938, 0.02953338623046875, 0.030664443969726562, 0.031795501708984375, 0.03292655944824219, 0.0340576171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 3.0, 7.0, 9.0, 7.0, 8.0, 19.0, 13.0, 17.0, 21.0, 22.0, 36.0, 103.0, 229.0, 632.0, 4176.0, 2451107.0, 1733262.0, 3644.0, 568.0, 176.0, 79.0, 36.0, 15.0, 18.0, 12.0, 15.0, 4.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2037353515625, -0.1964550018310547, -0.18917465209960938, -0.18189430236816406, -0.17461395263671875, -0.16733360290527344, -0.16005325317382812, -0.1527729034423828, -0.1454925537109375, -0.1382122039794922, -0.13093185424804688, -0.12365150451660156, -0.11637115478515625, -0.10909080505371094, -0.10181045532226562, -0.09453010559082031, -0.087249755859375, -0.07996940612792969, -0.07268905639648438, -0.06540870666503906, -0.05812835693359375, -0.05084800720214844, -0.043567657470703125, -0.03628730773925781, -0.0290069580078125, -0.021726608276367188, -0.014446258544921875, -0.0071659088134765625, 0.00011444091796875, 0.0073947906494140625, 0.014675140380859375, 0.021955490112304688, 0.02923583984375, 0.03651618957519531, 0.043796539306640625, 0.05107688903808594, 0.05835723876953125, 0.06563758850097656, 0.07291793823242188, 0.08019828796386719, 0.0874786376953125, 0.09475898742675781, 0.10203933715820312, 0.10931968688964844, 0.11660003662109375, 0.12388038635253906, 0.13116073608398438, 0.1384410858154297, 0.145721435546875, 0.1530017852783203, 0.16028213500976562, 0.16756248474121094, 0.17484283447265625, 0.18212318420410156, 0.18940353393554688, 0.1966838836669922, 0.2039642333984375, 0.2112445831298828, 0.21852493286132812, 0.22580528259277344, 0.23308563232421875, 0.24036598205566406, 0.24764633178710938, 0.2549266815185547, 0.26220703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 9.0, 8.0, 10.0, 20.0, 27.0, 51.0, 106.0, 274.0, 625.0, 1222.0, 875.0, 403.0, 189.0, 77.0, 67.0, 18.0, 27.0, 16.0, 10.0, 3.0, 6.0, 8.0, 9.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.07902336120605469, -0.07644271850585938, -0.07386207580566406, -0.07128143310546875, -0.06870079040527344, -0.06612014770507812, -0.06353950500488281, -0.0609588623046875, -0.05837821960449219, -0.055797576904296875, -0.05321693420410156, -0.05063629150390625, -0.04805564880371094, -0.045475006103515625, -0.04289436340332031, -0.040313720703125, -0.03773307800292969, -0.035152435302734375, -0.03257179260253906, -0.02999114990234375, -0.027410507202148438, -0.024829864501953125, -0.022249221801757812, -0.0196685791015625, -0.017087936401367188, -0.014507293701171875, -0.011926651000976562, -0.00934600830078125, -0.0067653656005859375, -0.004184722900390625, -0.0016040802001953125, 0.0009765625, 0.0035572052001953125, 0.006137847900390625, 0.008718490600585938, 0.01129913330078125, 0.013879776000976562, 0.016460418701171875, 0.019041061401367188, 0.0216217041015625, 0.024202346801757812, 0.026782989501953125, 0.029363632202148438, 0.03194427490234375, 0.03452491760253906, 0.037105560302734375, 0.03968620300292969, 0.042266845703125, 0.04484748840332031, 0.047428131103515625, 0.05000877380371094, 0.05258941650390625, 0.05517005920410156, 0.057750701904296875, 0.06033134460449219, 0.0629119873046875, 0.06549263000488281, 0.06807327270507812, 0.07065391540527344, 0.07323455810546875, 0.07581520080566406, 0.07839584350585938, 0.08097648620605469, 0.08355712890625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 5.0, 704.0, 307.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27800488471984863, -0.18231546878814697, -0.08662605285644531, 0.009063363075256348, 0.10475277900695801, 0.20044219493865967, 0.29613161087036133, 0.391821026802063, 0.48751044273376465, 0.5831998586654663, 0.678889274597168, 0.7745786905288696, 0.8702681064605713, 0.965957522392273, 1.0616469383239746, 1.1573363542556763, 1.253025770187378, 1.3487151861190796, 1.4444046020507812, 1.540094017982483, 1.6357834339141846, 1.7314728498458862, 1.827162265777588, 1.9228516817092896, 2.018541097640991, 2.1142306327819824, 2.2099199295043945, 2.3056092262268066, 2.401298761367798, 2.496988296508789, 2.592677593231201, 2.6883668899536133, 2.7840566635131836, 2.8797459602355957, 2.975435495376587, 3.071125030517578, 3.1668143272399902, 3.2625036239624023, 3.3581931591033936, 3.4538826942443848, 3.549571990966797, 3.645261287689209, 3.7409508228302, 3.8366403579711914, 3.9323296546936035, 4.028018951416016, 4.123708724975586, 4.219398021697998, 4.31508731842041, 4.410776615142822, 4.506465911865234, 4.602155685424805, 4.697844982147217, 4.793534278869629, 4.889224052429199, 4.984913349151611, 5.080602645874023, 5.1762919425964355, 5.271981239318848, 5.367671012878418, 5.46336030960083, 5.559049606323242, 5.6547393798828125, 5.750428676605225, 5.846117973327637]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 7.0, 15.0, 11.0, 13.0, 23.0, 26.0, 26.0, 44.0, 45.0, 59.0, 64.0, 57.0, 75.0, 57.0, 66.0, 70.0, 48.0, 50.0, 47.0, 61.0, 42.0, 34.0, 17.0, 13.0, 17.0, 3.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.253251850605011, -0.24421082437038422, -0.23516978323459625, -0.22612875699996948, -0.2170877307653427, -0.20804670453071594, -0.19900566339492798, -0.1899646371603012, -0.18092361092567444, -0.17188258469104767, -0.1628415435552597, -0.15380051732063293, -0.14475949108600616, -0.1357184648513794, -0.12667742371559143, -0.11763639748096466, -0.1085953563451767, -0.09955432265996933, -0.09051329642534256, -0.08147226274013519, -0.07243123650550842, -0.06339020282030106, -0.05434916913509369, -0.04530814290046692, -0.03626710921525955, -0.027226079255342484, -0.018185047432780266, -0.009144015610218048, -0.00010298565030097961, 0.008938044309616089, 0.017979077994823456, 0.027020104229450226, 0.03606113791465759, 0.04510216787457466, 0.05414319783449173, 0.0631842315196991, 0.07222525775432587, 0.08126629143953323, 0.0903073251247406, 0.09934835135936737, 0.10838938504457474, 0.1174304187297821, 0.12647144496440887, 0.13551247119903564, 0.1445535123348236, 0.15359453856945038, 0.16263556480407715, 0.1716766059398651, 0.18071763217449188, 0.18975865840911865, 0.19879969954490662, 0.2078407257795334, 0.21688175201416016, 0.22592279314994812, 0.2349638193845749, 0.24400484561920166, 0.2530458867549896, 0.2620869278907776, 0.27112793922424316, 0.28016898036003113, 0.2892100214958191, 0.29825103282928467, 0.30729207396507263, 0.3163331151008606, 0.32537412643432617]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 3.0, 5.0, 8.0, 8.0, 13.0, 13.0, 24.0, 35.0, 54.0, 77.0, 114.0, 187.0, 308.0, 529.0, 1013.0, 1854.0, 3874.0, 10376.0, 64368.0, 902525.0, 46459.0, 9295.0, 3596.0, 1623.0, 837.0, 513.0, 303.0, 164.0, 133.0, 82.0, 52.0, 40.0, 17.0, 20.0, 8.0, 10.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21923828125, -0.21062088012695312, -0.20200347900390625, -0.19338607788085938, -0.1847686767578125, -0.17615127563476562, -0.16753387451171875, -0.15891647338867188, -0.150299072265625, -0.14168167114257812, -0.13306427001953125, -0.12444686889648438, -0.1158294677734375, -0.10721206665039062, -0.09859466552734375, -0.08997726440429688, -0.08135986328125, -0.07274246215820312, -0.06412506103515625, -0.055507659912109375, -0.0468902587890625, -0.038272857666015625, -0.02965545654296875, -0.021038055419921875, -0.012420654296875, -0.003803253173828125, 0.00481414794921875, 0.013431549072265625, 0.0220489501953125, 0.030666351318359375, 0.03928375244140625, 0.047901153564453125, 0.0565185546875, 0.06513595581054688, 0.07375335693359375, 0.08237075805664062, 0.0909881591796875, 0.09960556030273438, 0.10822296142578125, 0.11684036254882812, 0.125457763671875, 0.13407516479492188, 0.14269256591796875, 0.15130996704101562, 0.1599273681640625, 0.16854476928710938, 0.17716217041015625, 0.18577957153320312, 0.19439697265625, 0.20301437377929688, 0.21163177490234375, 0.22024917602539062, 0.2288665771484375, 0.23748397827148438, 0.24610137939453125, 0.2547187805175781, 0.263336181640625, 0.2719535827636719, 0.28057098388671875, 0.2891883850097656, 0.2978057861328125, 0.3064231872558594, 0.31504058837890625, 0.3236579895019531, 0.332275390625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 12.0, 6.0, 17.0, 12.0, 9.0, 30.0, 26.0, 30.0, 44.0, 32.0, 43.0, 36.0, 48.0, 39.0, 44.0, 72.0, 70.0, 69.0, 62.0, 43.0, 34.0, 36.0, 36.0, 29.0, 21.0, 23.0, 16.0, 13.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04168701171875, -0.040506839752197266, -0.03932666778564453, -0.0381464958190918, -0.03696632385253906, -0.03578615188598633, -0.034605979919433594, -0.03342580795288086, -0.032245635986328125, -0.03106546401977539, -0.029885292053222656, -0.028705120086669922, -0.027524948120117188, -0.026344776153564453, -0.02516460418701172, -0.023984432220458984, -0.02280426025390625, -0.021624088287353516, -0.02044391632080078, -0.019263744354248047, -0.018083572387695312, -0.016903400421142578, -0.015723228454589844, -0.01454305648803711, -0.013362884521484375, -0.01218271255493164, -0.011002540588378906, -0.009822368621826172, -0.008642196655273438, -0.007462024688720703, -0.006281852722167969, -0.005101680755615234, -0.0039215087890625, -0.0027413368225097656, -0.0015611648559570312, -0.0003809928894042969, 0.0007991790771484375, 0.001979351043701172, 0.0031595230102539062, 0.004339694976806641, 0.005519866943359375, 0.006700038909912109, 0.007880210876464844, 0.009060382843017578, 0.010240554809570312, 0.011420726776123047, 0.012600898742675781, 0.013781070709228516, 0.01496124267578125, 0.016141414642333984, 0.01732158660888672, 0.018501758575439453, 0.019681930541992188, 0.020862102508544922, 0.022042274475097656, 0.02322244644165039, 0.024402618408203125, 0.02558279037475586, 0.026762962341308594, 0.027943134307861328, 0.029123306274414062, 0.030303478240966797, 0.03148365020751953, 0.032663822174072266, 0.033843994140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 5.0, 7.0, 6.0, 11.0, 6.0, 15.0, 15.0, 18.0, 19.0, 31.0, 42.0, 45.0, 51.0, 56.0, 89.0, 136.0, 199.0, 360.0, 920.0, 3172.0, 16830.0, 169038.0, 706866.0, 132036.0, 14002.0, 2721.0, 817.0, 334.0, 182.0, 117.0, 98.0, 63.0, 32.0, 35.0, 22.0, 26.0, 23.0, 19.0, 17.0, 10.0, 15.0, 8.0, 10.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0689697265625, -0.06670475006103516, -0.06443977355957031, -0.06217479705810547, -0.059909820556640625, -0.05764484405517578, -0.05537986755371094, -0.053114891052246094, -0.05084991455078125, -0.048584938049316406, -0.04631996154785156, -0.04405498504638672, -0.041790008544921875, -0.03952503204345703, -0.03726005554199219, -0.034995079040527344, -0.0327301025390625, -0.030465126037597656, -0.028200149536132812, -0.02593517303466797, -0.023670196533203125, -0.02140522003173828, -0.019140243530273438, -0.016875267028808594, -0.01461029052734375, -0.012345314025878906, -0.010080337524414062, -0.007815361022949219, -0.005550384521484375, -0.0032854080200195312, -0.0010204315185546875, 0.0012445449829101562, 0.003509521484375, 0.005774497985839844, 0.008039474487304688, 0.010304450988769531, 0.012569427490234375, 0.014834403991699219, 0.017099380493164062, 0.019364356994628906, 0.02162933349609375, 0.023894309997558594, 0.026159286499023438, 0.02842426300048828, 0.030689239501953125, 0.03295421600341797, 0.03521919250488281, 0.037484169006347656, 0.0397491455078125, 0.042014122009277344, 0.04427909851074219, 0.04654407501220703, 0.048809051513671875, 0.05107402801513672, 0.05333900451660156, 0.055603981018066406, 0.05786895751953125, 0.060133934020996094, 0.06239891052246094, 0.06466388702392578, 0.06692886352539062, 0.06919384002685547, 0.07145881652832031, 0.07372379302978516, 0.07598876953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 7.0, 4.0, 5.0, 11.0, 10.0, 10.0, 16.0, 9.0, 15.0, 20.0, 22.0, 30.0, 31.0, 31.0, 29.0, 36.0, 35.0, 35.0, 42.0, 39.0, 43.0, 39.0, 39.0, 50.0, 40.0, 40.0, 38.0, 34.0, 25.0, 28.0, 31.0, 21.0, 18.0, 16.0, 21.0, 17.0, 15.0, 8.0, 5.0, 8.0, 9.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0665283203125, -0.06429004669189453, -0.06205177307128906, -0.059813499450683594, -0.057575225830078125, -0.055336952209472656, -0.05309867858886719, -0.05086040496826172, -0.04862213134765625, -0.04638385772705078, -0.04414558410644531, -0.041907310485839844, -0.039669036865234375, -0.037430763244628906, -0.03519248962402344, -0.03295421600341797, -0.0307159423828125, -0.02847766876220703, -0.026239395141601562, -0.024001121520996094, -0.021762847900390625, -0.019524574279785156, -0.017286300659179688, -0.015048027038574219, -0.01280975341796875, -0.010571479797363281, -0.008333206176757812, -0.006094932556152344, -0.003856658935546875, -0.0016183853149414062, 0.0006198883056640625, 0.0028581619262695312, 0.005096435546875, 0.007334709167480469, 0.009572982788085938, 0.011811256408691406, 0.014049530029296875, 0.016287803649902344, 0.018526077270507812, 0.02076435089111328, 0.02300262451171875, 0.02524089813232422, 0.027479171752929688, 0.029717445373535156, 0.031955718994140625, 0.034193992614746094, 0.03643226623535156, 0.03867053985595703, 0.0409088134765625, 0.04314708709716797, 0.04538536071777344, 0.047623634338378906, 0.049861907958984375, 0.052100181579589844, 0.05433845520019531, 0.05657672882080078, 0.05881500244140625, 0.06105327606201172, 0.06329154968261719, 0.06552982330322266, 0.06776809692382812, 0.0700063705444336, 0.07224464416503906, 0.07448291778564453, 0.07672119140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 5.0, 5.0, 5.0, 3.0, 8.0, 10.0, 22.0, 25.0, 54.0, 78.0, 108.0, 182.0, 298.0, 584.0, 1116.0, 2759.0, 8868.0, 65619.0, 700425.0, 241601.0, 18821.0, 4421.0, 1716.0, 801.0, 411.0, 220.0, 131.0, 88.0, 57.0, 38.0, 27.0, 13.0, 16.0, 9.0, 6.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0174407958984375, -0.016811847686767578, -0.016182899475097656, -0.015553951263427734, -0.014925003051757812, -0.01429605484008789, -0.013667106628417969, -0.013038158416748047, -0.012409210205078125, -0.011780261993408203, -0.011151313781738281, -0.01052236557006836, -0.009893417358398438, -0.009264469146728516, -0.008635520935058594, -0.008006572723388672, -0.00737762451171875, -0.006748676300048828, -0.006119728088378906, -0.005490779876708984, -0.0048618316650390625, -0.004232883453369141, -0.0036039352416992188, -0.002974987030029297, -0.002346038818359375, -0.0017170906066894531, -0.0010881423950195312, -0.0004591941833496094, 0.0001697540283203125, 0.0007987022399902344, 0.0014276504516601562, 0.002056598663330078, 0.002685546875, 0.003314495086669922, 0.003943443298339844, 0.004572391510009766, 0.0052013397216796875, 0.005830287933349609, 0.006459236145019531, 0.007088184356689453, 0.007717132568359375, 0.008346080780029297, 0.008975028991699219, 0.00960397720336914, 0.010232925415039062, 0.010861873626708984, 0.011490821838378906, 0.012119770050048828, 0.01274871826171875, 0.013377666473388672, 0.014006614685058594, 0.014635562896728516, 0.015264511108398438, 0.01589345932006836, 0.01652240753173828, 0.017151355743408203, 0.017780303955078125, 0.018409252166748047, 0.01903820037841797, 0.01966714859008789, 0.020296096801757812, 0.020925045013427734, 0.021553993225097656, 0.022182941436767578, 0.0228118896484375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 6.0, 6.0, 9.0, 8.0, 16.0, 25.0, 37.0, 55.0, 49.0, 61.0, 69.0, 80.0, 100.0, 84.0, 82.0, 69.0, 62.0, 44.0, 24.0, 18.0, 17.0, 14.0, 9.0, 10.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.1563301086425781e-05, -1.1217780411243439e-05, -1.0872259736061096e-05, -1.0526739060878754e-05, -1.0181218385696411e-05, -9.835697710514069e-06, -9.490177035331726e-06, -9.144656360149384e-06, -8.799135684967041e-06, -8.453615009784698e-06, -8.108094334602356e-06, -7.762573659420013e-06, -7.417052984237671e-06, -7.071532309055328e-06, -6.726011633872986e-06, -6.380490958690643e-06, -6.034970283508301e-06, -5.689449608325958e-06, -5.343928933143616e-06, -4.998408257961273e-06, -4.652887582778931e-06, -4.307366907596588e-06, -3.961846232414246e-06, -3.616325557231903e-06, -3.2708048820495605e-06, -2.925284206867218e-06, -2.5797635316848755e-06, -2.234242856502533e-06, -1.8887221813201904e-06, -1.543201506137848e-06, -1.1976808309555054e-06, -8.521601557731628e-07, -5.066394805908203e-07, -1.6111880540847778e-07, 1.8440186977386475e-07, 5.299225449562073e-07, 8.754432201385498e-07, 1.2209638953208923e-06, 1.5664845705032349e-06, 1.9120052456855774e-06, 2.25752592086792e-06, 2.6030465960502625e-06, 2.948567271232605e-06, 3.2940879464149475e-06, 3.63960862159729e-06, 3.9851292967796326e-06, 4.330649971961975e-06, 4.676170647144318e-06, 5.02169132232666e-06, 5.367211997509003e-06, 5.712732672691345e-06, 6.058253347873688e-06, 6.40377402305603e-06, 6.749294698238373e-06, 7.094815373420715e-06, 7.440336048603058e-06, 7.7858567237854e-06, 8.131377398967743e-06, 8.476898074150085e-06, 8.822418749332428e-06, 9.16793942451477e-06, 9.513460099697113e-06, 9.858980774879456e-06, 1.0204501450061798e-05, 1.055002212524414e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 10.0, 19.0, 30.0, 47.0, 62.0, 81.0, 111.0, 160.0, 266.0, 351.0, 496.0, 741.0, 1003.0, 1375.0, 2150.0, 3177.0, 5693.0, 18696.0, 275153.0, 678704.0, 40575.0, 7876.0, 3723.0, 2496.0, 1619.0, 1166.0, 763.0, 593.0, 387.0, 292.0, 218.0, 132.0, 96.0, 88.0, 56.0, 41.0, 27.0, 21.0, 11.0, 14.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0261993408203125, -0.025385379791259766, -0.02457141876220703, -0.023757457733154297, -0.022943496704101562, -0.022129535675048828, -0.021315574645996094, -0.02050161361694336, -0.019687652587890625, -0.01887369155883789, -0.018059730529785156, -0.017245769500732422, -0.016431808471679688, -0.015617847442626953, -0.014803886413574219, -0.013989925384521484, -0.01317596435546875, -0.012362003326416016, -0.011548042297363281, -0.010734081268310547, -0.009920120239257812, -0.009106159210205078, -0.008292198181152344, -0.007478237152099609, -0.006664276123046875, -0.005850315093994141, -0.005036354064941406, -0.004222393035888672, -0.0034084320068359375, -0.002594470977783203, -0.0017805099487304688, -0.0009665489196777344, -0.000152587890625, 0.0006613731384277344, 0.0014753341674804688, 0.002289295196533203, 0.0031032562255859375, 0.003917217254638672, 0.004731178283691406, 0.005545139312744141, 0.006359100341796875, 0.007173061370849609, 0.007987022399902344, 0.008800983428955078, 0.009614944458007812, 0.010428905487060547, 0.011242866516113281, 0.012056827545166016, 0.01287078857421875, 0.013684749603271484, 0.014498710632324219, 0.015312671661376953, 0.016126632690429688, 0.016940593719482422, 0.017754554748535156, 0.01856851577758789, 0.019382476806640625, 0.02019643783569336, 0.021010398864746094, 0.021824359893798828, 0.022638320922851562, 0.023452281951904297, 0.02426624298095703, 0.025080204010009766, 0.0258941650390625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 14.0, 13.0, 15.0, 24.0, 34.0, 25.0, 50.0, 74.0, 94.0, 102.0, 112.0, 100.0, 86.0, 61.0, 38.0, 34.0, 20.0, 14.0, 19.0, 6.0, 6.0, 15.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02215576171875, -0.021525144577026367, -0.020894527435302734, -0.0202639102935791, -0.01963329315185547, -0.019002676010131836, -0.018372058868408203, -0.01774144172668457, -0.017110824584960938, -0.016480207443237305, -0.015849590301513672, -0.015218973159790039, -0.014588356018066406, -0.013957738876342773, -0.01332712173461914, -0.012696504592895508, -0.012065887451171875, -0.011435270309448242, -0.01080465316772461, -0.010174036026000977, -0.009543418884277344, -0.008912801742553711, -0.008282184600830078, -0.007651567459106445, -0.0070209503173828125, -0.00639033317565918, -0.005759716033935547, -0.005129098892211914, -0.004498481750488281, -0.0038678646087646484, -0.0032372474670410156, -0.002606630325317383, -0.00197601318359375, -0.0013453960418701172, -0.0007147789001464844, -8.416175842285156e-05, 0.0005464553833007812, 0.001177072525024414, 0.0018076896667480469, 0.0024383068084716797, 0.0030689239501953125, 0.0036995410919189453, 0.004330158233642578, 0.004960775375366211, 0.005591392517089844, 0.0062220096588134766, 0.006852626800537109, 0.007483243942260742, 0.008113861083984375, 0.008744478225708008, 0.00937509536743164, 0.010005712509155273, 0.010636329650878906, 0.011266946792602539, 0.011897563934326172, 0.012528181076049805, 0.013158798217773438, 0.01378941535949707, 0.014420032501220703, 0.015050649642944336, 0.01568126678466797, 0.0163118839263916, 0.016942501068115234, 0.017573118209838867, 0.0182037353515625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 60.0, 773.0, 177.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.343912363052368, -3.2791998386383057, -3.214487075805664, -3.1497745513916016, -3.085062026977539, -3.0203495025634766, -2.955636978149414, -2.8909242153167725, -2.82621169090271, -2.7614991664886475, -2.696786403656006, -2.6320738792419434, -2.567361354827881, -2.5026488304138184, -2.437936305999756, -2.3732235431671143, -2.3085110187530518, -2.2437984943389893, -2.1790857315063477, -2.114373207092285, -2.0496606826782227, -1.9849481582641602, -1.920235514640808, -1.855522871017456, -1.7908103466033936, -1.726097822189331, -1.661385178565979, -1.596672534942627, -1.5319600105285645, -1.467247486114502, -1.40253484249115, -1.3378221988677979, -1.2731095552444458, -1.2083969116210938, -1.1436843872070312, -1.0789718627929688, -1.0142592191696167, -0.9495466351509094, -0.8848340511322021, -0.8201214671134949, -0.7554088830947876, -0.6906962990760803, -0.625983715057373, -0.5612711310386658, -0.4965585470199585, -0.4318459630012512, -0.36713337898254395, -0.30242079496383667, -0.2377082109451294, -0.17299562692642212, -0.10828304290771484, -0.04357045888900757, 0.021142125129699707, 0.08585470914840698, 0.15056729316711426, 0.21527987718582153, 0.2799924612045288, 0.3447050452232361, 0.40941762924194336, 0.47413021326065063, 0.5388427972793579, 0.6035553812980652, 0.6682679653167725, 0.7329805493354797, 0.797693133354187]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 8.0, 9.0, 7.0, 14.0, 23.0, 21.0, 26.0, 24.0, 37.0, 44.0, 47.0, 51.0, 44.0, 69.0, 49.0, 72.0, 65.0, 57.0, 57.0, 51.0, 36.0, 37.0, 25.0, 22.0, 19.0, 24.0, 16.0, 8.0, 9.0, 7.0, 4.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.6059556007385254, -0.590543270111084, -0.5751309394836426, -0.559718668460846, -0.5443063378334045, -0.5288940072059631, -0.5134816765785217, -0.4980693757534027, -0.4826570451259613, -0.4672447144985199, -0.4518324136734009, -0.4364200830459595, -0.42100778222084045, -0.40559545159339905, -0.39018315076828003, -0.3747708201408386, -0.3593584895133972, -0.3439461588859558, -0.3285338580608368, -0.3131215274333954, -0.29770922660827637, -0.28229689598083496, -0.26688456535339355, -0.25147226452827454, -0.23605996370315552, -0.2206476479768753, -0.2052353322505951, -0.1898230016231537, -0.17441068589687347, -0.15899837017059326, -0.14358605444431305, -0.12817373871803284, -0.11276140809059143, -0.09734909236431122, -0.08193676918745041, -0.0665244534611702, -0.051112134009599686, -0.035699814558029175, -0.020287498831748962, -0.004875175654888153, 0.01053714007139206, 0.02594945952296257, 0.04136177897453308, 0.05677409470081329, 0.0721864104270935, 0.08759873360395432, 0.10301104933023453, 0.11842337250709534, 0.13383568823337555, 0.14924800395965576, 0.16466031968593597, 0.1800726354122162, 0.1954849660396576, 0.2108972817659378, 0.22630959749221802, 0.24172192811965942, 0.25713422894477844, 0.27254655957221985, 0.28795886039733887, 0.3033711910247803, 0.3187834918498993, 0.3341958224773407, 0.3496081233024597, 0.3650204539299011, 0.38043278455734253]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 9.0, 11.0, 3.0, 25.0, 21.0, 20.0, 30.0, 27.0, 34.0, 34.0, 56.0, 106.0, 229.0, 983.0, 5109.0, 3962157.0, 221296.0, 2955.0, 624.0, 201.0, 86.0, 52.0, 36.0, 34.0, 21.0, 27.0, 18.0, 13.0, 12.0, 11.0, 6.0, 8.0, 3.0, 5.0, 4.0, 1.0, 1.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.433837890625, -0.42021942138671875, -0.4066009521484375, -0.39298248291015625, -0.379364013671875, -0.36574554443359375, -0.3521270751953125, -0.33850860595703125, -0.32489013671875, -0.31127166748046875, -0.2976531982421875, -0.28403472900390625, -0.270416259765625, -0.25679779052734375, -0.2431793212890625, -0.22956085205078125, -0.2159423828125, -0.20232391357421875, -0.1887054443359375, -0.17508697509765625, -0.161468505859375, -0.14785003662109375, -0.1342315673828125, -0.12061309814453125, -0.10699462890625, -0.09337615966796875, -0.0797576904296875, -0.06613922119140625, -0.052520751953125, -0.03890228271484375, -0.0252838134765625, -0.01166534423828125, 0.001953125, 0.01557159423828125, 0.0291900634765625, 0.04280853271484375, 0.056427001953125, 0.07004547119140625, 0.0836639404296875, 0.09728240966796875, 0.11090087890625, 0.12451934814453125, 0.1381378173828125, 0.15175628662109375, 0.165374755859375, 0.17899322509765625, 0.1926116943359375, 0.20623016357421875, 0.2198486328125, 0.23346710205078125, 0.2470855712890625, 0.26070404052734375, 0.274322509765625, 0.28794097900390625, 0.3015594482421875, 0.31517791748046875, 0.32879638671875, 0.34241485595703125, 0.3560333251953125, 0.36965179443359375, 0.383270263671875, 0.39688873291015625, 0.4105072021484375, 0.42412567138671875, 0.437744140625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 11.0, 7.0, 9.0, 18.0, 13.0, 16.0, 27.0, 24.0, 29.0, 29.0, 43.0, 35.0, 45.0, 31.0, 45.0, 44.0, 52.0, 68.0, 55.0, 65.0, 43.0, 40.0, 54.0, 36.0, 28.0, 26.0, 21.0, 17.0, 13.0, 8.0, 9.0, 9.0, 9.0, 6.0, 5.0, 1.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.033782958984375, -0.03268623352050781, -0.031589508056640625, -0.030492782592773438, -0.02939605712890625, -0.028299331665039062, -0.027202606201171875, -0.026105880737304688, -0.0250091552734375, -0.023912429809570312, -0.022815704345703125, -0.021718978881835938, -0.02062225341796875, -0.019525527954101562, -0.018428802490234375, -0.017332077026367188, -0.0162353515625, -0.015138626098632812, -0.014041900634765625, -0.012945175170898438, -0.01184844970703125, -0.010751724243164062, -0.009654998779296875, -0.008558273315429688, -0.0074615478515625, -0.0063648223876953125, -0.005268096923828125, -0.0041713714599609375, -0.00307464599609375, -0.0019779205322265625, -0.000881195068359375, 0.0002155303955078125, 0.001312255859375, 0.0024089813232421875, 0.003505706787109375, 0.0046024322509765625, 0.00569915771484375, 0.0067958831787109375, 0.007892608642578125, 0.008989334106445312, 0.0100860595703125, 0.011182785034179688, 0.012279510498046875, 0.013376235961914062, 0.01447296142578125, 0.015569686889648438, 0.016666412353515625, 0.017763137817382812, 0.01885986328125, 0.019956588745117188, 0.021053314208984375, 0.022150039672851562, 0.02324676513671875, 0.024343490600585938, 0.025440216064453125, 0.026536941528320312, 0.0276336669921875, 0.028730392456054688, 0.029827117919921875, 0.030923843383789062, 0.03202056884765625, 0.03311729431152344, 0.034214019775390625, 0.03531074523925781, 0.036407470703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 6.0, 5.0, 13.0, 18.0, 15.0, 19.0, 37.0, 54.0, 101.0, 215.0, 547.0, 1924.0, 9023.0, 66220.0, 944052.0, 2946747.0, 199675.0, 20376.0, 3684.0, 954.0, 306.0, 131.0, 62.0, 36.0, 15.0, 12.0, 5.0, 5.0, 8.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1011962890625, -0.09795570373535156, -0.09471511840820312, -0.09147453308105469, -0.08823394775390625, -0.08499336242675781, -0.08175277709960938, -0.07851219177246094, -0.0752716064453125, -0.07203102111816406, -0.06879043579101562, -0.06554985046386719, -0.06230926513671875, -0.05906867980957031, -0.055828094482421875, -0.05258750915527344, -0.049346923828125, -0.04610633850097656, -0.042865753173828125, -0.03962516784667969, -0.03638458251953125, -0.03314399719238281, -0.029903411865234375, -0.026662826538085938, -0.0234222412109375, -0.020181655883789062, -0.016941070556640625, -0.013700485229492188, -0.01045989990234375, -0.0072193145751953125, -0.003978729248046875, -0.0007381439208984375, 0.00250244140625, 0.0057430267333984375, 0.008983612060546875, 0.012224197387695312, 0.01546478271484375, 0.018705368041992188, 0.021945953369140625, 0.025186538696289062, 0.0284271240234375, 0.03166770935058594, 0.034908294677734375, 0.03814888000488281, 0.04138946533203125, 0.04463005065917969, 0.047870635986328125, 0.05111122131347656, 0.054351806640625, 0.05759239196777344, 0.060832977294921875, 0.06407356262207031, 0.06731414794921875, 0.07055473327636719, 0.07379531860351562, 0.07703590393066406, 0.0802764892578125, 0.08351707458496094, 0.08675765991210938, 0.08999824523925781, 0.09323883056640625, 0.09647941589355469, 0.09972000122070312, 0.10296058654785156, 0.106201171875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 7.0, 3.0, 5.0, 17.0, 19.0, 23.0, 30.0, 34.0, 49.0, 71.0, 113.0, 130.0, 175.0, 242.0, 357.0, 554.0, 595.0, 426.0, 342.0, 216.0, 166.0, 133.0, 84.0, 70.0, 55.0, 27.0, 22.0, 22.0, 26.0, 12.0, 8.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0291900634765625, -0.0281527042388916, -0.027115345001220703, -0.026077985763549805, -0.025040626525878906, -0.024003267288208008, -0.02296590805053711, -0.02192854881286621, -0.020891189575195312, -0.019853830337524414, -0.018816471099853516, -0.017779111862182617, -0.01674175262451172, -0.01570439338684082, -0.014667034149169922, -0.013629674911499023, -0.012592315673828125, -0.011554956436157227, -0.010517597198486328, -0.00948023796081543, -0.008442878723144531, -0.007405519485473633, -0.006368160247802734, -0.005330801010131836, -0.0042934417724609375, -0.003256082534790039, -0.0022187232971191406, -0.0011813640594482422, -0.00014400482177734375, 0.0008933544158935547, 0.0019307136535644531, 0.0029680728912353516, 0.00400543212890625, 0.0050427913665771484, 0.006080150604248047, 0.007117509841918945, 0.008154869079589844, 0.009192228317260742, 0.01022958755493164, 0.011266946792602539, 0.012304306030273438, 0.013341665267944336, 0.014379024505615234, 0.015416383743286133, 0.01645374298095703, 0.01749110221862793, 0.018528461456298828, 0.019565820693969727, 0.020603179931640625, 0.021640539169311523, 0.022677898406982422, 0.02371525764465332, 0.02475261688232422, 0.025789976119995117, 0.026827335357666016, 0.027864694595336914, 0.028902053833007812, 0.02993941307067871, 0.03097677230834961, 0.03201413154602051, 0.033051490783691406, 0.034088850021362305, 0.0351262092590332, 0.0361635684967041, 0.037200927734375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 8.0, 24.0, 223.0, 659.0, 90.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36220836639404297, -0.32708966732025146, -0.29197096824645996, -0.25685226917266846, -0.22173357009887695, -0.18661487102508545, -0.15149617195129395, -0.11637747287750244, -0.08125877380371094, -0.046140074729919434, -0.01102137565612793, 0.024097323417663574, 0.05921602249145508, 0.09433472156524658, 0.12945342063903809, 0.1645721197128296, 0.1996908187866211, 0.2348095178604126, 0.2699282169342041, 0.3050469160079956, 0.3401656150817871, 0.3752843141555786, 0.4104030132293701, 0.4455217123031616, 0.4806404113769531, 0.5157591104507446, 0.5508778095245361, 0.5859965085983276, 0.6211152076721191, 0.6562339067459106, 0.6913526058197021, 0.7264713048934937, 0.7615901231765747, 0.7967088222503662, 0.8318275213241577, 0.8669462203979492, 0.9020649194717407, 0.9371836185455322, 0.9723023176193237, 1.0074210166931152, 1.0425397157669067, 1.0776584148406982, 1.1127771139144897, 1.1478958129882812, 1.1830145120620728, 1.2181332111358643, 1.2532519102096558, 1.2883706092834473, 1.3234893083572388, 1.3586080074310303, 1.3937267065048218, 1.4288454055786133, 1.4639641046524048, 1.4990828037261963, 1.5342015027999878, 1.5693202018737793, 1.6044389009475708, 1.6395576000213623, 1.6746762990951538, 1.7097949981689453, 1.7449136972427368, 1.7800323963165283, 1.8151510953903198, 1.8502697944641113, 1.8853884935379028]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 3.0, 13.0, 16.0, 15.0, 12.0, 23.0, 24.0, 29.0, 31.0, 43.0, 48.0, 52.0, 56.0, 60.0, 76.0, 50.0, 63.0, 61.0, 50.0, 46.0, 44.0, 42.0, 30.0, 17.0, 24.0, 11.0, 10.0, 13.0, 12.0, 5.0, 8.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1685832142829895, -0.16302813589572906, -0.15747304260730743, -0.151917964220047, -0.14636287093162537, -0.14080779254436493, -0.1352527141571045, -0.12969762086868286, -0.12414254248142242, -0.11858745664358139, -0.11303237080574036, -0.10747729241847992, -0.10192220658063889, -0.09636712074279785, -0.09081204235553741, -0.08525695651769638, -0.07970187067985535, -0.07414678484201431, -0.06859169900417328, -0.06303662061691284, -0.05748153477907181, -0.051926448941230774, -0.04637136682868004, -0.0408162847161293, -0.03526119887828827, -0.029706114903092384, -0.0241510309278965, -0.018595946952700615, -0.01304086297750473, -0.0074857790023088455, -0.0019306950271129608, 0.0036243870854377747, 0.009179472923278809, 0.014734556898474693, 0.020289640873670578, 0.025844724848866463, 0.03139980882406235, 0.03695489466190338, 0.04250997677445412, 0.04806505888700485, 0.053620144724845886, 0.05917523056268692, 0.06473031640052795, 0.07028539478778839, 0.07584048062562943, 0.08139556646347046, 0.0869506448507309, 0.09250573068857193, 0.09806081652641296, 0.103615902364254, 0.10917098820209503, 0.11472606658935547, 0.1202811524271965, 0.12583623826503754, 0.13139131665229797, 0.1369464099407196, 0.14250148832798004, 0.14805656671524048, 0.1536116600036621, 0.15916673839092255, 0.16472181677818298, 0.17027691006660461, 0.17583198845386505, 0.1813870668411255, 0.18694216012954712]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 7.0, 16.0, 20.0, 22.0, 26.0, 39.0, 53.0, 85.0, 131.0, 172.0, 273.0, 411.0, 625.0, 1033.0, 1917.0, 3794.0, 8628.0, 24613.0, 97622.0, 472903.0, 337157.0, 65945.0, 18829.0, 6940.0, 3038.0, 1614.0, 940.0, 548.0, 375.0, 232.0, 137.0, 116.0, 80.0, 60.0, 45.0, 16.0, 21.0, 16.0, 7.0, 10.0, 7.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.1148681640625, -0.11147689819335938, -0.10808563232421875, -0.10469436645507812, -0.1013031005859375, -0.09791183471679688, -0.09452056884765625, -0.09112930297851562, -0.087738037109375, -0.08434677124023438, -0.08095550537109375, -0.07756423950195312, -0.0741729736328125, -0.07078170776367188, -0.06739044189453125, -0.06399917602539062, -0.06060791015625, -0.057216644287109375, -0.05382537841796875, -0.050434112548828125, -0.0470428466796875, -0.043651580810546875, -0.04026031494140625, -0.036869049072265625, -0.033477783203125, -0.030086517333984375, -0.02669525146484375, -0.023303985595703125, -0.0199127197265625, -0.016521453857421875, -0.01313018798828125, -0.009738922119140625, -0.00634765625, -0.002956390380859375, 0.00043487548828125, 0.003826141357421875, 0.0072174072265625, 0.010608673095703125, 0.01399993896484375, 0.017391204833984375, 0.020782470703125, 0.024173736572265625, 0.02756500244140625, 0.030956268310546875, 0.0343475341796875, 0.037738800048828125, 0.04113006591796875, 0.044521331787109375, 0.04791259765625, 0.051303863525390625, 0.05469512939453125, 0.058086395263671875, 0.0614776611328125, 0.06486892700195312, 0.06826019287109375, 0.07165145874023438, 0.075042724609375, 0.07843399047851562, 0.08182525634765625, 0.08521652221679688, 0.0886077880859375, 0.09199905395507812, 0.09539031982421875, 0.09878158569335938, 0.1021728515625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 3.0, 8.0, 5.0, 15.0, 17.0, 19.0, 12.0, 24.0, 28.0, 30.0, 39.0, 38.0, 32.0, 38.0, 36.0, 39.0, 44.0, 56.0, 48.0, 57.0, 54.0, 60.0, 45.0, 40.0, 29.0, 32.0, 26.0, 28.0, 16.0, 15.0, 15.0, 7.0, 11.0, 7.0, 6.0, 3.0, 5.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.034881591796875, -0.03385043144226074, -0.032819271087646484, -0.03178811073303223, -0.03075695037841797, -0.02972579002380371, -0.028694629669189453, -0.027663469314575195, -0.026632308959960938, -0.02560114860534668, -0.024569988250732422, -0.023538827896118164, -0.022507667541503906, -0.02147650718688965, -0.02044534683227539, -0.019414186477661133, -0.018383026123046875, -0.017351865768432617, -0.01632070541381836, -0.015289545059204102, -0.014258384704589844, -0.013227224349975586, -0.012196063995361328, -0.01116490364074707, -0.010133743286132812, -0.009102582931518555, -0.008071422576904297, -0.007040262222290039, -0.006009101867675781, -0.0049779415130615234, -0.003946781158447266, -0.002915620803833008, -0.00188446044921875, -0.0008533000946044922, 0.00017786026000976562, 0.0012090206146240234, 0.0022401809692382812, 0.003271341323852539, 0.004302501678466797, 0.005333662033081055, 0.0063648223876953125, 0.00739598274230957, 0.008427143096923828, 0.009458303451538086, 0.010489463806152344, 0.011520624160766602, 0.01255178451538086, 0.013582944869995117, 0.014614105224609375, 0.015645265579223633, 0.01667642593383789, 0.01770758628845215, 0.018738746643066406, 0.019769906997680664, 0.020801067352294922, 0.02183222770690918, 0.022863388061523438, 0.023894548416137695, 0.024925708770751953, 0.02595686912536621, 0.02698802947998047, 0.028019189834594727, 0.029050350189208984, 0.030081510543823242, 0.0311126708984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 9.0, 9.0, 8.0, 12.0, 14.0, 22.0, 21.0, 27.0, 18.0, 26.0, 46.0, 61.0, 83.0, 94.0, 225.0, 472.0, 2162.0, 35659.0, 769531.0, 230715.0, 7630.0, 876.0, 306.0, 153.0, 83.0, 60.0, 45.0, 33.0, 24.0, 22.0, 14.0, 13.0, 11.0, 8.0, 13.0, 10.0, 5.0, 6.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1722412109375, -0.1666412353515625, -0.161041259765625, -0.1554412841796875, -0.14984130859375, -0.1442413330078125, -0.138641357421875, -0.1330413818359375, -0.12744140625, -0.1218414306640625, -0.116241455078125, -0.1106414794921875, -0.10504150390625, -0.0994415283203125, -0.093841552734375, -0.0882415771484375, -0.0826416015625, -0.0770416259765625, -0.071441650390625, -0.0658416748046875, -0.06024169921875, -0.0546417236328125, -0.049041748046875, -0.0434417724609375, -0.037841796875, -0.0322418212890625, -0.026641845703125, -0.0210418701171875, -0.01544189453125, -0.0098419189453125, -0.004241943359375, 0.0013580322265625, 0.0069580078125, 0.0125579833984375, 0.018157958984375, 0.0237579345703125, 0.02935791015625, 0.0349578857421875, 0.040557861328125, 0.0461578369140625, 0.0517578125, 0.0573577880859375, 0.062957763671875, 0.0685577392578125, 0.07415771484375, 0.0797576904296875, 0.085357666015625, 0.0909576416015625, 0.0965576171875, 0.1021575927734375, 0.107757568359375, 0.1133575439453125, 0.11895751953125, 0.1245574951171875, 0.130157470703125, 0.1357574462890625, 0.141357421875, 0.1469573974609375, 0.152557373046875, 0.1581573486328125, 0.16375732421875, 0.1693572998046875, 0.174957275390625, 0.1805572509765625, 0.1861572265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 5.0, 7.0, 11.0, 19.0, 15.0, 29.0, 15.0, 31.0, 20.0, 33.0, 36.0, 42.0, 30.0, 35.0, 36.0, 51.0, 47.0, 43.0, 37.0, 31.0, 53.0, 44.0, 47.0, 25.0, 35.0, 18.0, 24.0, 21.0, 27.0, 22.0, 20.0, 9.0, 14.0, 12.0, 11.0, 8.0, 2.0, 5.0, 8.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052001953125, -0.05028820037841797, -0.04857444763183594, -0.046860694885253906, -0.045146942138671875, -0.043433189392089844, -0.04171943664550781, -0.04000568389892578, -0.03829193115234375, -0.03657817840576172, -0.03486442565917969, -0.033150672912597656, -0.031436920166015625, -0.029723167419433594, -0.028009414672851562, -0.02629566192626953, -0.0245819091796875, -0.02286815643310547, -0.021154403686523438, -0.019440650939941406, -0.017726898193359375, -0.016013145446777344, -0.014299392700195312, -0.012585639953613281, -0.01087188720703125, -0.009158134460449219, -0.0074443817138671875, -0.005730628967285156, -0.004016876220703125, -0.0023031234741210938, -0.0005893707275390625, 0.0011243820190429688, 0.002838134765625, 0.004551887512207031, 0.0062656402587890625, 0.007979393005371094, 0.009693145751953125, 0.011406898498535156, 0.013120651245117188, 0.014834403991699219, 0.01654815673828125, 0.01826190948486328, 0.019975662231445312, 0.021689414978027344, 0.023403167724609375, 0.025116920471191406, 0.026830673217773438, 0.02854442596435547, 0.0302581787109375, 0.03197193145751953, 0.03368568420410156, 0.035399436950683594, 0.037113189697265625, 0.038826942443847656, 0.04054069519042969, 0.04225444793701172, 0.04396820068359375, 0.04568195343017578, 0.04739570617675781, 0.049109458923339844, 0.050823211669921875, 0.052536964416503906, 0.05425071716308594, 0.05596446990966797, 0.05767822265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 4.0, 19.0, 17.0, 27.0, 47.0, 87.0, 151.0, 237.0, 435.0, 768.0, 1298.0, 2644.0, 5346.0, 15329.0, 83051.0, 625904.0, 263827.0, 33022.0, 8694.0, 3527.0, 1810.0, 991.0, 568.0, 279.0, 188.0, 109.0, 61.0, 39.0, 23.0, 18.0, 6.0, 10.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0478515625, -0.04643392562866211, -0.04501628875732422, -0.04359865188598633, -0.04218101501464844, -0.04076337814331055, -0.039345741271972656, -0.037928104400634766, -0.036510467529296875, -0.035092830657958984, -0.033675193786621094, -0.0322575569152832, -0.030839920043945312, -0.029422283172607422, -0.02800464630126953, -0.02658700942993164, -0.02516937255859375, -0.02375173568725586, -0.02233409881591797, -0.020916461944580078, -0.019498825073242188, -0.018081188201904297, -0.016663551330566406, -0.015245914459228516, -0.013828277587890625, -0.012410640716552734, -0.010993003845214844, -0.009575366973876953, -0.008157730102539062, -0.006740093231201172, -0.005322456359863281, -0.0039048194885253906, -0.0024871826171875, -0.0010695457458496094, 0.00034809112548828125, 0.0017657279968261719, 0.0031833648681640625, 0.004601001739501953, 0.006018638610839844, 0.007436275482177734, 0.008853912353515625, 0.010271549224853516, 0.011689186096191406, 0.013106822967529297, 0.014524459838867188, 0.015942096710205078, 0.01735973358154297, 0.01877737045288086, 0.02019500732421875, 0.02161264419555664, 0.02303028106689453, 0.024447917938232422, 0.025865554809570312, 0.027283191680908203, 0.028700828552246094, 0.030118465423583984, 0.031536102294921875, 0.032953739166259766, 0.034371376037597656, 0.03578901290893555, 0.03720664978027344, 0.03862428665161133, 0.04004192352294922, 0.04145956039428711, 0.042877197265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 4.0, 8.0, 18.0, 11.0, 29.0, 46.0, 58.0, 84.0, 121.0, 131.0, 112.0, 109.0, 75.0, 53.0, 37.0, 26.0, 15.0, 15.0, 4.0, 12.0, 7.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.872943878173828e-05, -2.7796253561973572e-05, -2.6863068342208862e-05, -2.5929883122444153e-05, -2.4996697902679443e-05, -2.4063512682914734e-05, -2.3130327463150024e-05, -2.2197142243385315e-05, -2.1263957023620605e-05, -2.0330771803855896e-05, -1.9397586584091187e-05, -1.8464401364326477e-05, -1.7531216144561768e-05, -1.6598030924797058e-05, -1.566484570503235e-05, -1.473166048526764e-05, -1.379847526550293e-05, -1.286529004573822e-05, -1.193210482597351e-05, -1.0998919606208801e-05, -1.0065734386444092e-05, -9.132549166679382e-06, -8.199363946914673e-06, -7.266178727149963e-06, -6.332993507385254e-06, -5.3998082876205444e-06, -4.466623067855835e-06, -3.5334378480911255e-06, -2.600252628326416e-06, -1.6670674085617065e-06, -7.338821887969971e-07, 1.993030309677124e-07, 1.1324882507324219e-06, 2.0656734704971313e-06, 2.998858690261841e-06, 3.93204391002655e-06, 4.86522912979126e-06, 5.798414349555969e-06, 6.731599569320679e-06, 7.664784789085388e-06, 8.597970008850098e-06, 9.531155228614807e-06, 1.0464340448379517e-05, 1.1397525668144226e-05, 1.2330710887908936e-05, 1.3263896107673645e-05, 1.4197081327438354e-05, 1.5130266547203064e-05, 1.6063451766967773e-05, 1.6996636986732483e-05, 1.7929822206497192e-05, 1.8863007426261902e-05, 1.979619264602661e-05, 2.072937786579132e-05, 2.166256308555603e-05, 2.259574830532074e-05, 2.352893352508545e-05, 2.446211874485016e-05, 2.5395303964614868e-05, 2.6328489184379578e-05, 2.7261674404144287e-05, 2.8194859623908997e-05, 2.9128044843673706e-05, 3.0061230063438416e-05, 3.0994415283203125e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 7.0, 6.0, 5.0, 20.0, 15.0, 25.0, 28.0, 36.0, 63.0, 128.0, 297.0, 1369.0, 10846.0, 213987.0, 769821.0, 47047.0, 3737.0, 628.0, 183.0, 87.0, 41.0, 46.0, 24.0, 20.0, 17.0, 14.0, 18.0, 5.0, 3.0, 12.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.056854248046875, -0.055242061614990234, -0.05362987518310547, -0.0520176887512207, -0.05040550231933594, -0.04879331588745117, -0.047181129455566406, -0.04556894302368164, -0.043956756591796875, -0.04234457015991211, -0.040732383728027344, -0.03912019729614258, -0.03750801086425781, -0.03589582443237305, -0.03428363800048828, -0.032671451568603516, -0.03105926513671875, -0.029447078704833984, -0.02783489227294922, -0.026222705841064453, -0.024610519409179688, -0.022998332977294922, -0.021386146545410156, -0.01977396011352539, -0.018161773681640625, -0.01654958724975586, -0.014937400817871094, -0.013325214385986328, -0.011713027954101562, -0.010100841522216797, -0.008488655090332031, -0.006876468658447266, -0.0052642822265625, -0.0036520957946777344, -0.0020399093627929688, -0.0004277229309082031, 0.0011844635009765625, 0.002796649932861328, 0.004408836364746094, 0.006021022796630859, 0.007633209228515625, 0.00924539566040039, 0.010857582092285156, 0.012469768524169922, 0.014081954956054688, 0.015694141387939453, 0.01730632781982422, 0.018918514251708984, 0.02053070068359375, 0.022142887115478516, 0.02375507354736328, 0.025367259979248047, 0.026979446411132812, 0.028591632843017578, 0.030203819274902344, 0.03181600570678711, 0.033428192138671875, 0.03504037857055664, 0.036652565002441406, 0.03826475143432617, 0.03987693786621094, 0.0414891242980957, 0.04310131072998047, 0.044713497161865234, 0.04632568359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 5.0, 6.0, 12.0, 22.0, 20.0, 25.0, 45.0, 53.0, 72.0, 68.0, 63.0, 90.0, 89.0, 83.0, 58.0, 65.0, 43.0, 39.0, 31.0, 25.0, 20.0, 10.0, 9.0, 7.0, 7.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01371002197265625, -0.013250470161437988, -0.012790918350219727, -0.012331366539001465, -0.011871814727783203, -0.011412262916564941, -0.01095271110534668, -0.010493159294128418, -0.010033607482910156, -0.009574055671691895, -0.009114503860473633, -0.008654952049255371, -0.00819540023803711, -0.007735848426818848, -0.007276296615600586, -0.006816744804382324, -0.0063571929931640625, -0.005897641181945801, -0.005438089370727539, -0.004978537559509277, -0.004518985748291016, -0.004059433937072754, -0.003599882125854492, -0.0031403303146362305, -0.0026807785034179688, -0.002221226692199707, -0.0017616748809814453, -0.0013021230697631836, -0.0008425712585449219, -0.00038301944732666016, 7.653236389160156e-05, 0.0005360841751098633, 0.000995635986328125, 0.0014551877975463867, 0.0019147396087646484, 0.00237429141998291, 0.002833843231201172, 0.0032933950424194336, 0.0037529468536376953, 0.004212498664855957, 0.004672050476074219, 0.0051316022872924805, 0.005591154098510742, 0.006050705909729004, 0.006510257720947266, 0.006969809532165527, 0.007429361343383789, 0.00788891315460205, 0.008348464965820312, 0.008808016777038574, 0.009267568588256836, 0.009727120399475098, 0.01018667221069336, 0.010646224021911621, 0.011105775833129883, 0.011565327644348145, 0.012024879455566406, 0.012484431266784668, 0.01294398307800293, 0.013403534889221191, 0.013863086700439453, 0.014322638511657715, 0.014782190322875977, 0.015241742134094238, 0.0157012939453125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 19.0, 810.0, 187.0, 4.0], "bins": [-3.9581050872802734, -3.8939833641052246, -3.829861640930176, -3.765740156173706, -3.7016184329986572, -3.6374967098236084, -3.5733749866485596, -3.50925350189209, -3.445131778717041, -3.381010055541992, -3.3168883323669434, -3.2527668476104736, -3.188645124435425, -3.124523401260376, -3.060401678085327, -2.9962801933288574, -2.9321584701538086, -2.8680367469787598, -2.803915023803711, -2.739793539047241, -2.6756718158721924, -2.6115500926971436, -2.5474283695220947, -2.483306884765625, -2.419184923171997, -2.3550631999969482, -2.2909414768218994, -2.2268199920654297, -2.162698268890381, -2.098576545715332, -2.034454822540283, -1.970333218574524, -1.9062117338180542, -1.8420900106430054, -1.777968406677246, -1.7138466835021973, -1.649725079536438, -1.5856033563613892, -1.5214817523956299, -1.457360029220581, -1.3932383060455322, -1.3291165828704834, -1.2649949789047241, -1.2008732557296753, -1.136751651763916, -1.0726299285888672, -1.0085082054138184, -0.9443866014480591, -0.8802649974822998, -0.8161433339118958, -0.7520216703414917, -0.6878999471664429, -0.6237783432006836, -0.5596566200256348, -0.4955349564552307, -0.43141329288482666, -0.3672916293144226, -0.30316996574401855, -0.2390482872724533, -0.17492660880088806, -0.11080494523048401, -0.046683281660079956, 0.017438411712646484, 0.08156007528305054, 0.1456817388534546]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 7.0, 4.0, 7.0, 4.0, 7.0, 14.0, 7.0, 13.0, 17.0, 18.0, 25.0, 21.0, 31.0, 30.0, 46.0, 50.0, 50.0, 47.0, 56.0, 54.0, 57.0, 40.0, 52.0, 40.0, 42.0, 51.0, 40.0, 36.0, 23.0, 18.0, 20.0, 13.0, 6.0, 12.0, 11.0, 15.0, 5.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.237434983253479, -0.23022402822971344, -0.22301305830478668, -0.21580210328102112, -0.20859113335609436, -0.2013801783323288, -0.19416922330856323, -0.18695825338363647, -0.1797472983598709, -0.17253634333610535, -0.1653253734111786, -0.15811441838741302, -0.15090346336364746, -0.1436924934387207, -0.13648153841495514, -0.12927058339118958, -0.12205961346626282, -0.11484865099191666, -0.1076376885175705, -0.10042673349380493, -0.09321577101945877, -0.08600480854511261, -0.07879385352134705, -0.07158289104700089, -0.06437192857265472, -0.05716096609830856, -0.0499500073492527, -0.04273904860019684, -0.03552808612585068, -0.028317123651504517, -0.021106164902448654, -0.013895206153392792, -0.006684243679046631, 0.0005267169326543808, 0.0077376775443553925, 0.014948638156056404, 0.022159598767757416, 0.029370561242103577, 0.03658151999115944, 0.0437924787402153, 0.05100344121456146, 0.05821440368890762, 0.06542536616325378, 0.07263632118701935, 0.07984728366136551, 0.08705824613571167, 0.09426920115947723, 0.1014801636338234, 0.10869112610816956, 0.11590208858251572, 0.12311305105686188, 0.13032400608062744, 0.1375349760055542, 0.14474593102931976, 0.15195688605308533, 0.15916785597801208, 0.16637881100177765, 0.1735897660255432, 0.18080073595046997, 0.18801169097423553, 0.1952226459980011, 0.20243361592292786, 0.20964457094669342, 0.21685552597045898, 0.22406649589538574]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 4.0, 10.0, 9.0, 10.0, 9.0, 45.0, 52.0, 65.0, 96.0, 202.0, 269.0, 500.0, 1053.0, 3140.0, 19286.0, 944540.0, 3173339.0, 44045.0, 4673.0, 1374.0, 630.0, 354.0, 228.0, 106.0, 82.0, 57.0, 29.0, 25.0, 16.0, 12.0, 7.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1881103515625, -0.1833057403564453, -0.17850112915039062, -0.17369651794433594, -0.16889190673828125, -0.16408729553222656, -0.15928268432617188, -0.1544780731201172, -0.1496734619140625, -0.1448688507080078, -0.14006423950195312, -0.13525962829589844, -0.13045501708984375, -0.12565040588378906, -0.12084579467773438, -0.11604118347167969, -0.111236572265625, -0.10643196105957031, -0.10162734985351562, -0.09682273864746094, -0.09201812744140625, -0.08721351623535156, -0.08240890502929688, -0.07760429382324219, -0.0727996826171875, -0.06799507141113281, -0.06319046020507812, -0.05838584899902344, -0.05358123779296875, -0.04877662658691406, -0.043972015380859375, -0.03916740417480469, -0.03436279296875, -0.029558181762695312, -0.024753570556640625, -0.019948959350585938, -0.01514434814453125, -0.010339736938476562, -0.005535125732421875, -0.0007305145263671875, 0.0040740966796875, 0.008878707885742188, 0.013683319091796875, 0.018487930297851562, 0.02329254150390625, 0.028097152709960938, 0.032901763916015625, 0.03770637512207031, 0.042510986328125, 0.04731559753417969, 0.052120208740234375, 0.05692481994628906, 0.06172943115234375, 0.06653404235839844, 0.07133865356445312, 0.07614326477050781, 0.0809478759765625, 0.08575248718261719, 0.09055709838867188, 0.09536170959472656, 0.10016632080078125, 0.10497093200683594, 0.10977554321289062, 0.11458015441894531, 0.119384765625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 7.0, 9.0, 6.0, 18.0, 15.0, 23.0, 19.0, 31.0, 35.0, 32.0, 42.0, 44.0, 36.0, 47.0, 56.0, 58.0, 56.0, 60.0, 58.0, 51.0, 48.0, 44.0, 40.0, 32.0, 26.0, 31.0, 15.0, 6.0, 10.0, 15.0, 9.0, 7.0, 4.0, 3.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037994384765625, -0.03688669204711914, -0.03577899932861328, -0.03467130661010742, -0.03356361389160156, -0.0324559211730957, -0.031348228454589844, -0.030240535736083984, -0.029132843017578125, -0.028025150299072266, -0.026917457580566406, -0.025809764862060547, -0.024702072143554688, -0.023594379425048828, -0.02248668670654297, -0.02137899398803711, -0.02027130126953125, -0.01916360855102539, -0.01805591583251953, -0.016948223114013672, -0.015840530395507812, -0.014732837677001953, -0.013625144958496094, -0.012517452239990234, -0.011409759521484375, -0.010302066802978516, -0.009194374084472656, -0.008086681365966797, -0.0069789886474609375, -0.005871295928955078, -0.004763603210449219, -0.0036559104919433594, -0.0025482177734375, -0.0014405250549316406, -0.00033283233642578125, 0.0007748603820800781, 0.0018825531005859375, 0.002990245819091797, 0.004097938537597656, 0.005205631256103516, 0.006313323974609375, 0.007421016693115234, 0.008528709411621094, 0.009636402130126953, 0.010744094848632812, 0.011851787567138672, 0.012959480285644531, 0.01406717300415039, 0.01517486572265625, 0.01628255844116211, 0.01739025115966797, 0.018497943878173828, 0.019605636596679688, 0.020713329315185547, 0.021821022033691406, 0.022928714752197266, 0.024036407470703125, 0.025144100189208984, 0.026251792907714844, 0.027359485626220703, 0.028467178344726562, 0.029574871063232422, 0.03068256378173828, 0.03179025650024414, 0.03289794921875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 7.0, 5.0, 12.0, 18.0, 17.0, 27.0, 38.0, 66.0, 99.0, 203.0, 378.0, 908.0, 3147.0, 19551.0, 214013.0, 2458593.0, 1375945.0, 106270.0, 11321.0, 2216.0, 706.0, 314.0, 158.0, 107.0, 51.0, 34.0, 18.0, 17.0, 12.0, 11.0, 6.0, 4.0, 5.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.106201171875, -0.1026449203491211, -0.09908866882324219, -0.09553241729736328, -0.09197616577148438, -0.08841991424560547, -0.08486366271972656, -0.08130741119384766, -0.07775115966796875, -0.07419490814208984, -0.07063865661621094, -0.06708240509033203, -0.06352615356445312, -0.05996990203857422, -0.05641365051269531, -0.052857398986816406, -0.0493011474609375, -0.045744895935058594, -0.04218864440917969, -0.03863239288330078, -0.035076141357421875, -0.03151988983154297, -0.027963638305664062, -0.024407386779785156, -0.02085113525390625, -0.017294883728027344, -0.013738632202148438, -0.010182380676269531, -0.006626129150390625, -0.0030698776245117188, 0.0004863739013671875, 0.004042625427246094, 0.007598876953125, 0.011155128479003906, 0.014711380004882812, 0.01826763153076172, 0.021823883056640625, 0.02538013458251953, 0.028936386108398438, 0.032492637634277344, 0.03604888916015625, 0.039605140686035156, 0.04316139221191406, 0.04671764373779297, 0.050273895263671875, 0.05383014678955078, 0.05738639831542969, 0.060942649841308594, 0.0644989013671875, 0.0680551528930664, 0.07161140441894531, 0.07516765594482422, 0.07872390747070312, 0.08228015899658203, 0.08583641052246094, 0.08939266204833984, 0.09294891357421875, 0.09650516510009766, 0.10006141662597656, 0.10361766815185547, 0.10717391967773438, 0.11073017120361328, 0.11428642272949219, 0.1178426742553711, 0.12139892578125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 4.0, 7.0, 10.0, 13.0, 32.0, 44.0, 57.0, 79.0, 108.0, 135.0, 208.0, 279.0, 360.0, 433.0, 590.0, 416.0, 392.0, 235.0, 178.0, 141.0, 108.0, 74.0, 51.0, 44.0, 23.0, 24.0, 9.0, 3.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.060211181640625, -0.058721065521240234, -0.05723094940185547, -0.0557408332824707, -0.05425071716308594, -0.05276060104370117, -0.051270484924316406, -0.04978036880493164, -0.048290252685546875, -0.04680013656616211, -0.045310020446777344, -0.04381990432739258, -0.04232978820800781, -0.04083967208862305, -0.03934955596923828, -0.037859439849853516, -0.03636932373046875, -0.034879207611083984, -0.03338909149169922, -0.03189897537231445, -0.030408859252929688, -0.028918743133544922, -0.027428627014160156, -0.02593851089477539, -0.024448394775390625, -0.02295827865600586, -0.021468162536621094, -0.019978046417236328, -0.018487930297851562, -0.016997814178466797, -0.015507698059082031, -0.014017581939697266, -0.0125274658203125, -0.011037349700927734, -0.009547233581542969, -0.008057117462158203, -0.0065670013427734375, -0.005076885223388672, -0.0035867691040039062, -0.0020966529846191406, -0.000606536865234375, 0.0008835792541503906, 0.0023736953735351562, 0.003863811492919922, 0.0053539276123046875, 0.006844043731689453, 0.008334159851074219, 0.009824275970458984, 0.01131439208984375, 0.012804508209228516, 0.014294624328613281, 0.015784740447998047, 0.017274856567382812, 0.018764972686767578, 0.020255088806152344, 0.02174520492553711, 0.023235321044921875, 0.02472543716430664, 0.026215553283691406, 0.027705669403076172, 0.029195785522460938, 0.030685901641845703, 0.03217601776123047, 0.033666133880615234, 0.03515625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 55.0, 460.0, 443.0, 45.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.057135581970215, -2.017524480819702, -1.9779136180877686, -1.9383025169372559, -1.8986915349960327, -1.8590805530548096, -1.8194695711135864, -1.7798585891723633, -1.7402476072311401, -1.700636625289917, -1.6610256433486938, -1.6214146614074707, -1.581803560256958, -1.5421925783157349, -1.5025815963745117, -1.4629706144332886, -1.4233596324920654, -1.3837486505508423, -1.3441376686096191, -1.3045265674591064, -1.2649155855178833, -1.2253046035766602, -1.185693621635437, -1.1460826396942139, -1.1064715385437012, -1.066860556602478, -1.0272495746612549, -0.987638533115387, -0.9480275511741638, -0.9084165096282959, -0.8688055276870728, -0.8291945457458496, -0.7895836234092712, -0.7499726414680481, -0.7103615999221802, -0.670750617980957, -0.6311396360397339, -0.5915286540985107, -0.5519176125526428, -0.5123066306114197, -0.47269561886787415, -0.4330846071243286, -0.39347362518310547, -0.35386261343955994, -0.3142516016960144, -0.27464061975479126, -0.23502960801124573, -0.19541862607002258, -0.15580761432647705, -0.11619661748409271, -0.07658561319112778, -0.03697460889816284, 0.0026363879442214966, 0.042247384786605835, 0.08185839653015137, 0.12146937847137451, 0.16108039021492004, 0.20069138705730438, 0.24030238389968872, 0.27991339564323425, 0.3195244073867798, 0.35913538932800293, 0.39874640107154846, 0.4383573830127716, 0.47796839475631714]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 6.0, 3.0, 8.0, 12.0, 9.0, 10.0, 15.0, 21.0, 28.0, 35.0, 36.0, 35.0, 37.0, 28.0, 43.0, 45.0, 63.0, 49.0, 45.0, 38.0, 54.0, 57.0, 42.0, 46.0, 36.0, 36.0, 28.0, 23.0, 21.0, 14.0, 17.0, 18.0, 11.0, 5.0, 3.0, 8.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12678438425064087, -0.12213010340929031, -0.11747582256793976, -0.1128215417265892, -0.10816726088523865, -0.1035129725933075, -0.09885869175195694, -0.09420441091060638, -0.08955013006925583, -0.08489584922790527, -0.08024156838655472, -0.07558728754520416, -0.07093299925327301, -0.06627872586250305, -0.0616244375705719, -0.056970156729221344, -0.05231587588787079, -0.04766159504652023, -0.04300731420516968, -0.038353029638528824, -0.03369874879717827, -0.029044467955827713, -0.02439018525183201, -0.019735902547836304, -0.015081621706485748, -0.010427339933812618, -0.005773058161139488, -0.0011187763884663582, 0.003535505384206772, 0.008189786225557327, 0.012844068929553032, 0.017498351633548737, 0.022152632474899292, 0.026806913316249847, 0.0314611941576004, 0.03611547872424126, 0.04076975956559181, 0.04542404040694237, 0.05007832497358322, 0.05473260581493378, 0.05938688665628433, 0.06404116749763489, 0.06869544833898544, 0.073349729180336, 0.07800401747226715, 0.08265829086303711, 0.08731257915496826, 0.09196685999631882, 0.09662114083766937, 0.10127542167901993, 0.10592970252037048, 0.11058398336172104, 0.1152382642030716, 0.11989255249500275, 0.1245468333363533, 0.12920111417770386, 0.133855402469635, 0.13850969076156616, 0.14316396415233612, 0.14781825244426727, 0.15247252583503723, 0.15712681412696838, 0.16178108751773834, 0.1664353758096695, 0.17108964920043945]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 6.0, 3.0, 10.0, 12.0, 22.0, 22.0, 23.0, 48.0, 77.0, 117.0, 183.0, 369.0, 672.0, 1439.0, 2889.0, 6513.0, 15257.0, 44873.0, 185459.0, 498305.0, 211852.0, 50493.0, 16792.0, 6930.0, 3089.0, 1498.0, 704.0, 365.0, 203.0, 112.0, 71.0, 45.0, 25.0, 20.0, 11.0, 9.0, 9.0, 7.0, 3.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09619140625, -0.09269905090332031, -0.08920669555664062, -0.08571434020996094, -0.08222198486328125, -0.07872962951660156, -0.07523727416992188, -0.07174491882324219, -0.0682525634765625, -0.06476020812988281, -0.061267852783203125, -0.05777549743652344, -0.05428314208984375, -0.05079078674316406, -0.047298431396484375, -0.04380607604980469, -0.040313720703125, -0.03682136535644531, -0.033329010009765625, -0.029836654663085938, -0.02634429931640625, -0.022851943969726562, -0.019359588623046875, -0.015867233276367188, -0.0123748779296875, -0.008882522583007812, -0.005390167236328125, -0.0018978118896484375, 0.00159454345703125, 0.0050868988037109375, 0.008579254150390625, 0.012071609497070312, 0.01556396484375, 0.019056320190429688, 0.022548675537109375, 0.026041030883789062, 0.02953338623046875, 0.03302574157714844, 0.036518096923828125, 0.04001045227050781, 0.0435028076171875, 0.04699516296386719, 0.050487518310546875, 0.05397987365722656, 0.05747222900390625, 0.06096458435058594, 0.06445693969726562, 0.06794929504394531, 0.071441650390625, 0.07493400573730469, 0.07842636108398438, 0.08191871643066406, 0.08541107177734375, 0.08890342712402344, 0.09239578247070312, 0.09588813781738281, 0.0993804931640625, 0.10287284851074219, 0.10636520385742188, 0.10985755920410156, 0.11334991455078125, 0.11684226989746094, 0.12033462524414062, 0.12382698059082031, 0.1273193359375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 7.0, 7.0, 13.0, 11.0, 19.0, 24.0, 27.0, 30.0, 35.0, 42.0, 45.0, 49.0, 45.0, 50.0, 64.0, 51.0, 56.0, 65.0, 66.0, 45.0, 36.0, 42.0, 31.0, 28.0, 28.0, 22.0, 9.0, 9.0, 4.0, 14.0, 9.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.04205322265625, -0.04092669486999512, -0.039800167083740234, -0.03867363929748535, -0.03754711151123047, -0.036420583724975586, -0.0352940559387207, -0.03416752815246582, -0.03304100036621094, -0.031914472579956055, -0.030787944793701172, -0.02966141700744629, -0.028534889221191406, -0.027408361434936523, -0.02628183364868164, -0.025155305862426758, -0.024028778076171875, -0.022902250289916992, -0.02177572250366211, -0.020649194717407227, -0.019522666931152344, -0.01839613914489746, -0.017269611358642578, -0.016143083572387695, -0.015016555786132812, -0.01389002799987793, -0.012763500213623047, -0.011636972427368164, -0.010510444641113281, -0.009383916854858398, -0.008257389068603516, -0.007130861282348633, -0.00600433349609375, -0.004877805709838867, -0.0037512779235839844, -0.0026247501373291016, -0.0014982223510742188, -0.00037169456481933594, 0.0007548332214355469, 0.0018813610076904297, 0.0030078887939453125, 0.004134416580200195, 0.005260944366455078, 0.006387472152709961, 0.007513999938964844, 0.008640527725219727, 0.00976705551147461, 0.010893583297729492, 0.012020111083984375, 0.013146638870239258, 0.01427316665649414, 0.015399694442749023, 0.016526222229003906, 0.01765275001525879, 0.018779277801513672, 0.019905805587768555, 0.021032333374023438, 0.02215886116027832, 0.023285388946533203, 0.024411916732788086, 0.02553844451904297, 0.02666497230529785, 0.027791500091552734, 0.028918027877807617, 0.0300445556640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 7.0, 10.0, 13.0, 21.0, 28.0, 35.0, 72.0, 86.0, 163.0, 335.0, 1145.0, 4867.0, 24796.0, 260325.0, 664164.0, 77631.0, 11167.0, 2427.0, 621.0, 255.0, 115.0, 88.0, 56.0, 35.0, 20.0, 23.0, 10.0, 7.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1527099609375, -0.1468963623046875, -0.141082763671875, -0.1352691650390625, -0.12945556640625, -0.1236419677734375, -0.117828369140625, -0.1120147705078125, -0.106201171875, -0.1003875732421875, -0.094573974609375, -0.0887603759765625, -0.08294677734375, -0.0771331787109375, -0.071319580078125, -0.0655059814453125, -0.0596923828125, -0.0538787841796875, -0.048065185546875, -0.0422515869140625, -0.03643798828125, -0.0306243896484375, -0.024810791015625, -0.0189971923828125, -0.01318359375, -0.0073699951171875, -0.001556396484375, 0.0042572021484375, 0.01007080078125, 0.0158843994140625, 0.021697998046875, 0.0275115966796875, 0.0333251953125, 0.0391387939453125, 0.044952392578125, 0.0507659912109375, 0.05657958984375, 0.0623931884765625, 0.068206787109375, 0.0740203857421875, 0.079833984375, 0.0856475830078125, 0.091461181640625, 0.0972747802734375, 0.10308837890625, 0.1089019775390625, 0.114715576171875, 0.1205291748046875, 0.1263427734375, 0.1321563720703125, 0.137969970703125, 0.1437835693359375, 0.14959716796875, 0.1554107666015625, 0.161224365234375, 0.1670379638671875, 0.1728515625, 0.1786651611328125, 0.184478759765625, 0.1902923583984375, 0.19610595703125, 0.2019195556640625, 0.207733154296875, 0.2135467529296875, 0.2193603515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 6.0, 8.0, 8.0, 14.0, 12.0, 13.0, 22.0, 29.0, 18.0, 24.0, 44.0, 51.0, 48.0, 52.0, 41.0, 51.0, 47.0, 60.0, 55.0, 47.0, 41.0, 51.0, 38.0, 32.0, 36.0, 34.0, 28.0, 18.0, 21.0, 12.0, 4.0, 11.0, 7.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.09906005859375, -0.0964365005493164, -0.09381294250488281, -0.09118938446044922, -0.08856582641601562, -0.08594226837158203, -0.08331871032714844, -0.08069515228271484, -0.07807159423828125, -0.07544803619384766, -0.07282447814941406, -0.07020092010498047, -0.06757736206054688, -0.06495380401611328, -0.06233024597167969, -0.059706687927246094, -0.0570831298828125, -0.054459571838378906, -0.05183601379394531, -0.04921245574951172, -0.046588897705078125, -0.04396533966064453, -0.04134178161621094, -0.038718223571777344, -0.03609466552734375, -0.033471107482910156, -0.030847549438476562, -0.02822399139404297, -0.025600433349609375, -0.02297687530517578, -0.020353317260742188, -0.017729759216308594, -0.015106201171875, -0.012482643127441406, -0.009859085083007812, -0.007235527038574219, -0.004611968994140625, -0.0019884109497070312, 0.0006351470947265625, 0.0032587051391601562, 0.00588226318359375, 0.008505821228027344, 0.011129379272460938, 0.013752937316894531, 0.016376495361328125, 0.01900005340576172, 0.021623611450195312, 0.024247169494628906, 0.0268707275390625, 0.029494285583496094, 0.03211784362792969, 0.03474140167236328, 0.037364959716796875, 0.03998851776123047, 0.04261207580566406, 0.045235633850097656, 0.04785919189453125, 0.050482749938964844, 0.05310630798339844, 0.05572986602783203, 0.058353424072265625, 0.06097698211669922, 0.06360054016113281, 0.0662240982055664, 0.06884765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 11.0, 6.0, 9.0, 11.0, 12.0, 22.0, 20.0, 39.0, 46.0, 70.0, 82.0, 112.0, 128.0, 180.0, 298.0, 429.0, 658.0, 956.0, 1527.0, 3006.0, 6015.0, 13584.0, 37940.0, 136662.0, 412000.0, 306545.0, 82224.0, 25023.0, 10083.0, 4516.0, 2316.0, 1361.0, 745.0, 507.0, 362.0, 270.0, 195.0, 136.0, 111.0, 95.0, 66.0, 43.0, 37.0, 28.0, 15.0, 21.0, 14.0, 9.0, 8.0, 6.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.054656982421875, -0.052991390228271484, -0.05132579803466797, -0.04966020584106445, -0.04799461364746094, -0.04632902145385742, -0.044663429260253906, -0.04299783706665039, -0.041332244873046875, -0.03966665267944336, -0.038001060485839844, -0.03633546829223633, -0.03466987609863281, -0.0330042839050293, -0.03133869171142578, -0.029673099517822266, -0.02800750732421875, -0.026341915130615234, -0.02467632293701172, -0.023010730743408203, -0.021345138549804688, -0.019679546356201172, -0.018013954162597656, -0.01634836196899414, -0.014682769775390625, -0.01301717758178711, -0.011351585388183594, -0.009685993194580078, -0.008020401000976562, -0.006354808807373047, -0.004689216613769531, -0.0030236244201660156, -0.0013580322265625, 0.0003075599670410156, 0.0019731521606445312, 0.003638744354248047, 0.0053043365478515625, 0.006969928741455078, 0.008635520935058594, 0.01030111312866211, 0.011966705322265625, 0.01363229751586914, 0.015297889709472656, 0.016963481903076172, 0.018629074096679688, 0.020294666290283203, 0.02196025848388672, 0.023625850677490234, 0.02529144287109375, 0.026957035064697266, 0.02862262725830078, 0.030288219451904297, 0.03195381164550781, 0.03361940383911133, 0.035284996032714844, 0.03695058822631836, 0.038616180419921875, 0.04028177261352539, 0.041947364807128906, 0.04361295700073242, 0.04527854919433594, 0.04694414138793945, 0.04860973358154297, 0.050275325775146484, 0.05194091796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 16.0, 24.0, 24.0, 26.0, 57.0, 93.0, 111.0, 136.0, 127.0, 117.0, 76.0, 52.0, 39.0, 26.0, 20.0, 7.0, 14.0, 8.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.081560134887695e-05, -2.975575625896454e-05, -2.8695911169052124e-05, -2.763606607913971e-05, -2.6576220989227295e-05, -2.551637589931488e-05, -2.4456530809402466e-05, -2.339668571949005e-05, -2.2336840629577637e-05, -2.1276995539665222e-05, -2.0217150449752808e-05, -1.9157305359840393e-05, -1.809746026992798e-05, -1.7037615180015564e-05, -1.597777009010315e-05, -1.4917925000190735e-05, -1.385807991027832e-05, -1.2798234820365906e-05, -1.1738389730453491e-05, -1.0678544640541077e-05, -9.618699550628662e-06, -8.558854460716248e-06, -7.499009370803833e-06, -6.4391642808914185e-06, -5.379319190979004e-06, -4.319474101066589e-06, -3.259629011154175e-06, -2.1997839212417603e-06, -1.1399388313293457e-06, -8.009374141693115e-08, 9.797513484954834e-07, 2.039596438407898e-06, 3.0994415283203125e-06, 4.159286618232727e-06, 5.219131708145142e-06, 6.278976798057556e-06, 7.338821887969971e-06, 8.398666977882385e-06, 9.4585120677948e-06, 1.0518357157707214e-05, 1.1578202247619629e-05, 1.2638047337532043e-05, 1.3697892427444458e-05, 1.4757737517356873e-05, 1.5817582607269287e-05, 1.68774276971817e-05, 1.7937272787094116e-05, 1.899711787700653e-05, 2.0056962966918945e-05, 2.111680805683136e-05, 2.2176653146743774e-05, 2.323649823665619e-05, 2.4296343326568604e-05, 2.5356188416481018e-05, 2.6416033506393433e-05, 2.7475878596305847e-05, 2.8535723686218262e-05, 2.9595568776130676e-05, 3.065541386604309e-05, 3.1715258955955505e-05, 3.277510404586792e-05, 3.3834949135780334e-05, 3.489479422569275e-05, 3.5954639315605164e-05, 3.701448440551758e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 15.0, 17.0, 35.0, 34.0, 73.0, 87.0, 185.0, 289.0, 728.0, 1979.0, 6223.0, 20841.0, 80363.0, 305847.0, 427543.0, 151267.0, 37132.0, 10412.0, 3334.0, 1113.0, 476.0, 201.0, 120.0, 62.0, 36.0, 27.0, 22.0, 17.0, 14.0, 12.0, 6.0, 3.0, 0.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04071044921875, -0.039157867431640625, -0.03760528564453125, -0.036052703857421875, -0.0345001220703125, -0.032947540283203125, -0.03139495849609375, -0.029842376708984375, -0.028289794921875, -0.026737213134765625, -0.02518463134765625, -0.023632049560546875, -0.0220794677734375, -0.020526885986328125, -0.01897430419921875, -0.017421722412109375, -0.015869140625, -0.014316558837890625, -0.01276397705078125, -0.011211395263671875, -0.0096588134765625, -0.008106231689453125, -0.00655364990234375, -0.005001068115234375, -0.003448486328125, -0.001895904541015625, -0.00034332275390625, 0.001209259033203125, 0.0027618408203125, 0.004314422607421875, 0.00586700439453125, 0.007419586181640625, 0.00897216796875, 0.010524749755859375, 0.01207733154296875, 0.013629913330078125, 0.0151824951171875, 0.016735076904296875, 0.01828765869140625, 0.019840240478515625, 0.021392822265625, 0.022945404052734375, 0.02449798583984375, 0.026050567626953125, 0.0276031494140625, 0.029155731201171875, 0.03070831298828125, 0.032260894775390625, 0.0338134765625, 0.035366058349609375, 0.03691864013671875, 0.038471221923828125, 0.0400238037109375, 0.041576385498046875, 0.04312896728515625, 0.044681549072265625, 0.046234130859375, 0.047786712646484375, 0.04933929443359375, 0.050891876220703125, 0.0524444580078125, 0.053997039794921875, 0.05554962158203125, 0.057102203369140625, 0.05865478515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 10.0, 12.0, 16.0, 21.0, 18.0, 26.0, 40.0, 34.0, 48.0, 53.0, 56.0, 67.0, 60.0, 53.0, 54.0, 68.0, 73.0, 43.0, 42.0, 36.0, 30.0, 23.0, 22.0, 12.0, 14.0, 8.0, 9.0, 6.0, 6.0, 6.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.02880859375, -0.02801060676574707, -0.02721261978149414, -0.02641463279724121, -0.02561664581298828, -0.02481865882873535, -0.024020671844482422, -0.023222684860229492, -0.022424697875976562, -0.021626710891723633, -0.020828723907470703, -0.020030736923217773, -0.019232749938964844, -0.018434762954711914, -0.017636775970458984, -0.016838788986206055, -0.016040802001953125, -0.015242815017700195, -0.014444828033447266, -0.013646841049194336, -0.012848854064941406, -0.012050867080688477, -0.011252880096435547, -0.010454893112182617, -0.009656906127929688, -0.008858919143676758, -0.008060932159423828, -0.0072629451751708984, -0.006464958190917969, -0.005666971206665039, -0.004868984222412109, -0.00407099723815918, -0.00327301025390625, -0.0024750232696533203, -0.0016770362854003906, -0.0008790493011474609, -8.106231689453125e-05, 0.0007169246673583984, 0.0015149116516113281, 0.002312898635864258, 0.0031108856201171875, 0.003908872604370117, 0.004706859588623047, 0.0055048465728759766, 0.006302833557128906, 0.007100820541381836, 0.007898807525634766, 0.008696794509887695, 0.009494781494140625, 0.010292768478393555, 0.011090755462646484, 0.011888742446899414, 0.012686729431152344, 0.013484716415405273, 0.014282703399658203, 0.015080690383911133, 0.015878677368164062, 0.016676664352416992, 0.017474651336669922, 0.01827263832092285, 0.01907062530517578, 0.01986861228942871, 0.02066659927368164, 0.02146458625793457, 0.0222625732421875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 32.0, 237.0, 517.0, 192.0, 29.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2299584448337555, -0.19433990120887756, -0.15872135758399963, -0.1231028139591217, -0.08748427033424377, -0.051865726709365845, -0.016247183084487915, 0.019371360540390015, 0.054989904165267944, 0.09060844779014587, 0.1262269914150238, 0.16184553503990173, 0.19746407866477966, 0.2330826222896576, 0.2687011659145355, 0.30431970953941345, 0.3399382531642914, 0.3755567967891693, 0.41117534041404724, 0.44679388403892517, 0.4824124276638031, 0.5180310010910034, 0.5536495447158813, 0.5892680883407593, 0.6248866319656372, 0.6605051755905151, 0.6961237192153931, 0.731742262840271, 0.7673608064651489, 0.8029793500900269, 0.8385978937149048, 0.8742164373397827, 0.9098348617553711, 0.945453405380249, 0.981071949005127, 1.0166904926300049, 1.0523090362548828, 1.0879275798797607, 1.1235461235046387, 1.1591646671295166, 1.1947832107543945, 1.2304017543792725, 1.2660202980041504, 1.3016388416290283, 1.3372573852539062, 1.3728759288787842, 1.408494472503662, 1.44411301612854, 1.479731559753418, 1.515350103378296, 1.5509686470031738, 1.5865871906280518, 1.6222057342529297, 1.6578242778778076, 1.6934428215026855, 1.7290613651275635, 1.7646799087524414, 1.8002984523773193, 1.8359169960021973, 1.8715355396270752, 1.9071540832519531, 1.942772626876831, 1.978391170501709, 2.014009714126587, 2.049628257751465]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 7.0, 9.0, 3.0, 10.0, 13.0, 17.0, 17.0, 17.0, 24.0, 25.0, 27.0, 23.0, 40.0, 32.0, 31.0, 46.0, 41.0, 50.0, 45.0, 25.0, 41.0, 45.0, 38.0, 45.0, 38.0, 35.0, 31.0, 23.0, 33.0, 33.0, 27.0, 12.0, 13.0, 10.0, 14.0, 9.0, 14.0, 9.0, 8.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.17601698637008667, -0.1698697805404663, -0.16372257471084595, -0.15757536888122559, -0.15142816305160522, -0.14528097212314606, -0.1391337662935257, -0.13298656046390533, -0.12683935463428497, -0.12069214880466461, -0.11454494297504425, -0.10839774459600449, -0.10225053876638412, -0.09610333293676376, -0.089956134557724, -0.08380892872810364, -0.07766172289848328, -0.07151451706886292, -0.06536731123924255, -0.05922011286020279, -0.05307290703058243, -0.04692570120096207, -0.040778499096632004, -0.03463129699230194, -0.02848409116268158, -0.022336887195706367, -0.016189683228731155, -0.010042479261755943, -0.003895275294780731, 0.002251928672194481, 0.008399132639169693, 0.014546334743499756, 0.020693540573120117, 0.02684074454009533, 0.03298794850707054, 0.039135150611400604, 0.045282356441020966, 0.05142956227064133, 0.05757676437497139, 0.06372396647930145, 0.06987117230892181, 0.07601837813854218, 0.08216558396816254, 0.0883127823472023, 0.09445998817682266, 0.10060719400644302, 0.10675439238548279, 0.11290159821510315, 0.11904880404472351, 0.12519600987434387, 0.13134321570396423, 0.1374904215335846, 0.14363762736320496, 0.14978481829166412, 0.15593202412128448, 0.16207922995090485, 0.1682264357805252, 0.17437364161014557, 0.18052084743976593, 0.1866680532693863, 0.19281524419784546, 0.19896245002746582, 0.20510965585708618, 0.21125686168670654, 0.2174040675163269]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 11.0, 9.0, 9.0, 9.0, 25.0, 14.0, 33.0, 50.0, 85.0, 106.0, 213.0, 315.0, 531.0, 1132.0, 2257.0, 5155.0, 14901.0, 56554.0, 357227.0, 2078787.0, 1428013.0, 195733.0, 35192.0, 10091.0, 3823.0, 1742.0, 919.0, 497.0, 313.0, 176.0, 104.0, 86.0, 57.0, 28.0, 26.0, 23.0, 13.0, 9.0, 6.0, 6.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.055206298828125, -0.05341672897338867, -0.051627159118652344, -0.049837589263916016, -0.04804801940917969, -0.04625844955444336, -0.04446887969970703, -0.0426793098449707, -0.040889739990234375, -0.03910017013549805, -0.03731060028076172, -0.03552103042602539, -0.03373146057128906, -0.031941890716552734, -0.030152320861816406, -0.028362751007080078, -0.02657318115234375, -0.024783611297607422, -0.022994041442871094, -0.021204471588134766, -0.019414901733398438, -0.01762533187866211, -0.01583576202392578, -0.014046192169189453, -0.012256622314453125, -0.010467052459716797, -0.008677482604980469, -0.006887912750244141, -0.0050983428955078125, -0.0033087730407714844, -0.0015192031860351562, 0.0002703666687011719, 0.0020599365234375, 0.003849506378173828, 0.005639076232910156, 0.007428646087646484, 0.009218215942382812, 0.01100778579711914, 0.012797355651855469, 0.014586925506591797, 0.016376495361328125, 0.018166065216064453, 0.01995563507080078, 0.02174520492553711, 0.023534774780273438, 0.025324344635009766, 0.027113914489746094, 0.028903484344482422, 0.03069305419921875, 0.03248262405395508, 0.034272193908691406, 0.036061763763427734, 0.03785133361816406, 0.03964090347290039, 0.04143047332763672, 0.04322004318237305, 0.045009613037109375, 0.0467991828918457, 0.04858875274658203, 0.05037832260131836, 0.05216789245605469, 0.053957462310791016, 0.055747032165527344, 0.05753660202026367, 0.059326171875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 1.0, 8.0, 5.0, 3.0, 7.0, 14.0, 19.0, 13.0, 24.0, 15.0, 23.0, 36.0, 35.0, 42.0, 35.0, 51.0, 47.0, 58.0, 58.0, 49.0, 40.0, 44.0, 51.0, 55.0, 49.0, 38.0, 32.0, 29.0, 20.0, 20.0, 15.0, 15.0, 11.0, 8.0, 4.0, 6.0, 9.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03167724609375, -0.030663013458251953, -0.029648780822753906, -0.02863454818725586, -0.027620315551757812, -0.026606082916259766, -0.02559185028076172, -0.024577617645263672, -0.023563385009765625, -0.022549152374267578, -0.02153491973876953, -0.020520687103271484, -0.019506454467773438, -0.01849222183227539, -0.017477989196777344, -0.016463756561279297, -0.01544952392578125, -0.014435291290283203, -0.013421058654785156, -0.01240682601928711, -0.011392593383789062, -0.010378360748291016, -0.009364128112792969, -0.008349895477294922, -0.007335662841796875, -0.006321430206298828, -0.005307197570800781, -0.004292964935302734, -0.0032787322998046875, -0.0022644996643066406, -0.0012502670288085938, -0.00023603439331054688, 0.0007781982421875, 0.0017924308776855469, 0.0028066635131835938, 0.0038208961486816406, 0.0048351287841796875, 0.005849361419677734, 0.006863594055175781, 0.007877826690673828, 0.008892059326171875, 0.009906291961669922, 0.010920524597167969, 0.011934757232666016, 0.012948989868164062, 0.01396322250366211, 0.014977455139160156, 0.015991687774658203, 0.01700592041015625, 0.018020153045654297, 0.019034385681152344, 0.02004861831665039, 0.021062850952148438, 0.022077083587646484, 0.02309131622314453, 0.024105548858642578, 0.025119781494140625, 0.026134014129638672, 0.02714824676513672, 0.028162479400634766, 0.029176712036132812, 0.03019094467163086, 0.031205177307128906, 0.03221940994262695, 0.033233642578125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 10.0, 24.0, 19.0, 36.0, 59.0, 63.0, 124.0, 170.0, 252.0, 425.0, 855.0, 1908.0, 6420.0, 31717.0, 210800.0, 1320815.0, 2071272.0, 465308.0, 66743.0, 11653.0, 3003.0, 1092.0, 500.0, 328.0, 212.0, 136.0, 98.0, 70.0, 52.0, 31.0, 24.0, 16.0, 12.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06561279296875, -0.06336593627929688, -0.06111907958984375, -0.058872222900390625, -0.0566253662109375, -0.054378509521484375, -0.05213165283203125, -0.049884796142578125, -0.047637939453125, -0.045391082763671875, -0.04314422607421875, -0.040897369384765625, -0.0386505126953125, -0.036403656005859375, -0.03415679931640625, -0.031909942626953125, -0.0296630859375, -0.027416229248046875, -0.02516937255859375, -0.022922515869140625, -0.0206756591796875, -0.018428802490234375, -0.01618194580078125, -0.013935089111328125, -0.011688232421875, -0.009441375732421875, -0.00719451904296875, -0.004947662353515625, -0.0027008056640625, -0.000453948974609375, 0.00179290771484375, 0.004039764404296875, 0.00628662109375, 0.008533477783203125, 0.01078033447265625, 0.013027191162109375, 0.0152740478515625, 0.017520904541015625, 0.01976776123046875, 0.022014617919921875, 0.024261474609375, 0.026508331298828125, 0.02875518798828125, 0.031002044677734375, 0.0332489013671875, 0.035495758056640625, 0.03774261474609375, 0.039989471435546875, 0.042236328125, 0.044483184814453125, 0.04673004150390625, 0.048976898193359375, 0.0512237548828125, 0.053470611572265625, 0.05571746826171875, 0.057964324951171875, 0.060211181640625, 0.062458038330078125, 0.06470489501953125, 0.06695175170898438, 0.0691986083984375, 0.07144546508789062, 0.07369232177734375, 0.07593917846679688, 0.07818603515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 14.0, 8.0, 10.0, 13.0, 20.0, 18.0, 28.0, 34.0, 49.0, 62.0, 60.0, 85.0, 123.0, 117.0, 142.0, 170.0, 201.0, 226.0, 253.0, 255.0, 275.0, 267.0, 253.0, 246.0, 213.0, 167.0, 128.0, 122.0, 100.0, 86.0, 75.0, 51.0, 46.0, 38.0, 25.0, 26.0, 13.0, 14.0, 9.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.035797119140625, -0.034656524658203125, -0.03351593017578125, -0.032375335693359375, -0.0312347412109375, -0.030094146728515625, -0.02895355224609375, -0.027812957763671875, -0.02667236328125, -0.025531768798828125, -0.02439117431640625, -0.023250579833984375, -0.0221099853515625, -0.020969390869140625, -0.01982879638671875, -0.018688201904296875, -0.017547607421875, -0.016407012939453125, -0.01526641845703125, -0.014125823974609375, -0.0129852294921875, -0.011844635009765625, -0.01070404052734375, -0.009563446044921875, -0.0084228515625, -0.007282257080078125, -0.00614166259765625, -0.005001068115234375, -0.0038604736328125, -0.002719879150390625, -0.00157928466796875, -0.000438690185546875, 0.000701904296875, 0.001842498779296875, 0.00298309326171875, 0.004123687744140625, 0.0052642822265625, 0.006404876708984375, 0.00754547119140625, 0.008686065673828125, 0.00982666015625, 0.010967254638671875, 0.01210784912109375, 0.013248443603515625, 0.0143890380859375, 0.015529632568359375, 0.01667022705078125, 0.017810821533203125, 0.018951416015625, 0.020092010498046875, 0.02123260498046875, 0.022373199462890625, 0.0235137939453125, 0.024654388427734375, 0.02579498291015625, 0.026935577392578125, 0.028076171875, 0.029216766357421875, 0.03035736083984375, 0.031497955322265625, 0.0326385498046875, 0.033779144287109375, 0.03491973876953125, 0.036060333251953125, 0.037200927734375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 19.0, 104.0, 396.0, 395.0, 84.0, 13.0, 3.0, 3.0], "bins": [-1.971421480178833, -1.9379518032073975, -1.9044822454452515, -1.871012568473816, -1.83754301071167, -1.8040733337402344, -1.7706037759780884, -1.7371340990066528, -1.7036645412445068, -1.6701948642730713, -1.6367253065109253, -1.6032556295394897, -1.5697860717773438, -1.5363163948059082, -1.5028468370437622, -1.4693771600723267, -1.4359076023101807, -1.4024379253387451, -1.3689683675765991, -1.3354986906051636, -1.3020291328430176, -1.268559455871582, -1.235089898109436, -1.2016202211380005, -1.168150544166565, -1.1346808671951294, -1.1012113094329834, -1.0677416324615479, -1.0342720746994019, -1.0008023977279663, -0.9673328399658203, -0.9338631629943848, -0.900393545627594, -0.8669239282608032, -0.8334543108940125, -0.7999846935272217, -0.7665150761604309, -0.7330454587936401, -0.6995757818222046, -0.6661062240600586, -0.6326366066932678, -0.599166989326477, -0.5656973719596863, -0.5322277545928955, -0.49875813722610474, -0.46528851985931396, -0.4318188726902008, -0.39834925532341003, -0.3648796081542969, -0.3314099907875061, -0.29794037342071533, -0.26447075605392456, -0.2310011237859726, -0.19753150641918182, -0.16406187415122986, -0.1305922567844391, -0.09712265431880951, -0.06365303695201874, -0.03018341213464737, 0.003286212682723999, 0.03675583004951477, 0.07022544741630554, 0.10369507968425751, 0.13716469705104828, 0.17063431441783905]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 7.0, 16.0, 17.0, 15.0, 13.0, 20.0, 18.0, 33.0, 29.0, 29.0, 35.0, 40.0, 32.0, 45.0, 38.0, 47.0, 41.0, 49.0, 42.0, 41.0, 46.0, 39.0, 29.0, 39.0, 38.0, 33.0, 29.0, 17.0, 20.0, 13.0, 15.0, 15.0, 15.0, 11.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17840546369552612, -0.17300398647785187, -0.1676025092601776, -0.16220103204250336, -0.1567995548248291, -0.15139807760715485, -0.1459966003894806, -0.14059510827064514, -0.13519364595413208, -0.12979216873645782, -0.12439069151878357, -0.11898921430110931, -0.11358773708343506, -0.1081862598657608, -0.10278477519750595, -0.0973832979798317, -0.09198181331157684, -0.08658033609390259, -0.08117885887622833, -0.07577738165855408, -0.07037590444087982, -0.06497442722320557, -0.059572942554950714, -0.05417146533727646, -0.0487699881196022, -0.04336851090192795, -0.03796703368425369, -0.03256555274128914, -0.027164075523614883, -0.021762598305940628, -0.016361117362976074, -0.010959640145301819, -0.0055581629276275635, -0.0001566847786307335, 0.0052447933703660965, 0.010646272450685501, 0.016047749668359756, 0.021449226886034012, 0.026850707828998566, 0.03225218504667282, 0.037653662264347076, 0.04305513948202133, 0.04845661669969559, 0.05385809764266014, 0.059259574860334396, 0.06466105580329895, 0.0700625330209732, 0.07546401023864746, 0.08086548745632172, 0.08626696467399597, 0.09166844189167023, 0.09706991910934448, 0.10247139632701874, 0.107872873544693, 0.11327435821294785, 0.1186758354306221, 0.12407731264829636, 0.1294787973165512, 0.13488027453422546, 0.14028175175189972, 0.14568322896957397, 0.15108470618724823, 0.15648618340492249, 0.16188766062259674, 0.167289137840271]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 5.0, 8.0, 10.0, 14.0, 24.0, 39.0, 41.0, 66.0, 93.0, 122.0, 205.0, 340.0, 610.0, 1265.0, 3055.0, 7724.0, 22146.0, 65656.0, 203690.0, 399396.0, 229339.0, 74750.0, 24648.0, 8862.0, 3357.0, 1446.0, 675.0, 340.0, 188.0, 125.0, 91.0, 54.0, 41.0, 35.0, 25.0, 18.0, 13.0, 7.0, 5.0, 6.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09625244140625, -0.09310245513916016, -0.08995246887207031, -0.08680248260498047, -0.08365249633789062, -0.08050251007080078, -0.07735252380371094, -0.0742025375366211, -0.07105255126953125, -0.0679025650024414, -0.06475257873535156, -0.06160259246826172, -0.058452606201171875, -0.05530261993408203, -0.05215263366699219, -0.049002647399902344, -0.0458526611328125, -0.042702674865722656, -0.03955268859863281, -0.03640270233154297, -0.033252716064453125, -0.03010272979736328, -0.026952743530273438, -0.023802757263183594, -0.02065277099609375, -0.017502784729003906, -0.014352798461914062, -0.011202812194824219, -0.008052825927734375, -0.004902839660644531, -0.0017528533935546875, 0.0013971328735351562, 0.004547119140625, 0.007697105407714844, 0.010847091674804688, 0.013997077941894531, 0.017147064208984375, 0.02029705047607422, 0.023447036743164062, 0.026597023010253906, 0.02974700927734375, 0.032896995544433594, 0.03604698181152344, 0.03919696807861328, 0.042346954345703125, 0.04549694061279297, 0.04864692687988281, 0.051796913146972656, 0.0549468994140625, 0.058096885681152344, 0.06124687194824219, 0.06439685821533203, 0.06754684448242188, 0.07069683074951172, 0.07384681701660156, 0.0769968032836914, 0.08014678955078125, 0.0832967758178711, 0.08644676208496094, 0.08959674835205078, 0.09274673461914062, 0.09589672088623047, 0.09904670715332031, 0.10219669342041016, 0.1053466796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 12.0, 15.0, 14.0, 19.0, 21.0, 25.0, 24.0, 27.0, 44.0, 41.0, 56.0, 62.0, 52.0, 54.0, 70.0, 56.0, 56.0, 55.0, 52.0, 48.0, 35.0, 23.0, 22.0, 25.0, 21.0, 17.0, 13.0, 13.0, 8.0, 2.0, 5.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039306640625, -0.03819990158081055, -0.037093162536621094, -0.03598642349243164, -0.03487968444824219, -0.033772945404052734, -0.03266620635986328, -0.03155946731567383, -0.030452728271484375, -0.029345989227294922, -0.02823925018310547, -0.027132511138916016, -0.026025772094726562, -0.02491903305053711, -0.023812294006347656, -0.022705554962158203, -0.02159881591796875, -0.020492076873779297, -0.019385337829589844, -0.01827859878540039, -0.017171859741210938, -0.016065120697021484, -0.014958381652832031, -0.013851642608642578, -0.012744903564453125, -0.011638164520263672, -0.010531425476074219, -0.009424686431884766, -0.008317947387695312, -0.007211208343505859, -0.006104469299316406, -0.004997730255126953, -0.0038909912109375, -0.002784252166748047, -0.0016775131225585938, -0.0005707740783691406, 0.0005359649658203125, 0.0016427040100097656, 0.0027494430541992188, 0.003856182098388672, 0.004962921142578125, 0.006069660186767578, 0.007176399230957031, 0.008283138275146484, 0.009389877319335938, 0.01049661636352539, 0.011603355407714844, 0.012710094451904297, 0.01381683349609375, 0.014923572540283203, 0.016030311584472656, 0.01713705062866211, 0.018243789672851562, 0.019350528717041016, 0.02045726776123047, 0.021564006805419922, 0.022670745849609375, 0.023777484893798828, 0.02488422393798828, 0.025990962982177734, 0.027097702026367188, 0.02820444107055664, 0.029311180114746094, 0.030417919158935547, 0.031524658203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 10.0, 10.0, 22.0, 27.0, 28.0, 63.0, 102.0, 183.0, 335.0, 776.0, 2057.0, 6646.0, 23283.0, 81558.0, 285109.0, 426326.0, 159914.0, 43772.0, 12490.0, 3660.0, 1135.0, 453.0, 232.0, 135.0, 76.0, 41.0, 30.0, 20.0, 21.0, 10.0, 9.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1431884765625, -0.13923931121826172, -0.13529014587402344, -0.13134098052978516, -0.12739181518554688, -0.1234426498413086, -0.11949348449707031, -0.11554431915283203, -0.11159515380859375, -0.10764598846435547, -0.10369682312011719, -0.0997476577758789, -0.09579849243164062, -0.09184932708740234, -0.08790016174316406, -0.08395099639892578, -0.0800018310546875, -0.07605266571044922, -0.07210350036621094, -0.06815433502197266, -0.06420516967773438, -0.060256004333496094, -0.05630683898925781, -0.05235767364501953, -0.04840850830078125, -0.04445934295654297, -0.04051017761230469, -0.036561012268066406, -0.032611846923828125, -0.028662681579589844, -0.024713516235351562, -0.02076435089111328, -0.016815185546875, -0.012866020202636719, -0.008916854858398438, -0.004967689514160156, -0.001018524169921875, 0.0029306411743164062, 0.0068798065185546875, 0.010828971862792969, 0.01477813720703125, 0.01872730255126953, 0.022676467895507812, 0.026625633239746094, 0.030574798583984375, 0.034523963928222656, 0.03847312927246094, 0.04242229461669922, 0.0463714599609375, 0.05032062530517578, 0.05426979064941406, 0.058218955993652344, 0.062168121337890625, 0.0661172866821289, 0.07006645202636719, 0.07401561737060547, 0.07796478271484375, 0.08191394805908203, 0.08586311340332031, 0.0898122787475586, 0.09376144409179688, 0.09771060943603516, 0.10165977478027344, 0.10560894012451172, 0.10955810546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 6.0, 8.0, 8.0, 11.0, 12.0, 6.0, 18.0, 27.0, 35.0, 27.0, 30.0, 39.0, 39.0, 47.0, 41.0, 60.0, 41.0, 50.0, 49.0, 52.0, 38.0, 37.0, 44.0, 34.0, 47.0, 33.0, 19.0, 22.0, 22.0, 18.0, 17.0, 12.0, 6.0, 16.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06939697265625, -0.0668172836303711, -0.06423759460449219, -0.06165790557861328, -0.059078216552734375, -0.05649852752685547, -0.05391883850097656, -0.051339149475097656, -0.04875946044921875, -0.046179771423339844, -0.04360008239746094, -0.04102039337158203, -0.038440704345703125, -0.03586101531982422, -0.03328132629394531, -0.030701637268066406, -0.0281219482421875, -0.025542259216308594, -0.022962570190429688, -0.02038288116455078, -0.017803192138671875, -0.015223503112792969, -0.012643814086914062, -0.010064125061035156, -0.00748443603515625, -0.004904747009277344, -0.0023250579833984375, 0.00025463104248046875, 0.002834320068359375, 0.005414009094238281, 0.007993698120117188, 0.010573387145996094, 0.013153076171875, 0.015732765197753906, 0.018312454223632812, 0.02089214324951172, 0.023471832275390625, 0.02605152130126953, 0.028631210327148438, 0.031210899353027344, 0.03379058837890625, 0.036370277404785156, 0.03894996643066406, 0.04152965545654297, 0.044109344482421875, 0.04668903350830078, 0.04926872253417969, 0.051848411560058594, 0.0544281005859375, 0.057007789611816406, 0.05958747863769531, 0.06216716766357422, 0.06474685668945312, 0.06732654571533203, 0.06990623474121094, 0.07248592376708984, 0.07506561279296875, 0.07764530181884766, 0.08022499084472656, 0.08280467987060547, 0.08538436889648438, 0.08796405792236328, 0.09054374694824219, 0.0931234359741211, 0.095703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 17.0, 9.0, 13.0, 23.0, 36.0, 38.0, 59.0, 76.0, 131.0, 144.0, 212.0, 323.0, 553.0, 966.0, 1997.0, 5075.0, 17779.0, 78791.0, 334665.0, 437693.0, 129051.0, 27843.0, 7316.0, 2697.0, 1200.0, 635.0, 389.0, 207.0, 170.0, 119.0, 86.0, 60.0, 35.0, 35.0, 25.0, 24.0, 13.0, 9.0, 4.0, 5.0, 8.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.077880859375, -0.07538127899169922, -0.07288169860839844, -0.07038211822509766, -0.06788253784179688, -0.0653829574584961, -0.06288337707519531, -0.06038379669189453, -0.05788421630859375, -0.05538463592529297, -0.05288505554199219, -0.050385475158691406, -0.047885894775390625, -0.045386314392089844, -0.04288673400878906, -0.04038715362548828, -0.0378875732421875, -0.03538799285888672, -0.03288841247558594, -0.030388832092285156, -0.027889251708984375, -0.025389671325683594, -0.022890090942382812, -0.02039051055908203, -0.01789093017578125, -0.015391349792480469, -0.012891769409179688, -0.010392189025878906, -0.007892608642578125, -0.005393028259277344, -0.0028934478759765625, -0.00039386749267578125, 0.002105712890625, 0.004605293273925781, 0.0071048736572265625, 0.009604454040527344, 0.012104034423828125, 0.014603614807128906, 0.017103195190429688, 0.01960277557373047, 0.02210235595703125, 0.02460193634033203, 0.027101516723632812, 0.029601097106933594, 0.032100677490234375, 0.034600257873535156, 0.03709983825683594, 0.03959941864013672, 0.0420989990234375, 0.04459857940673828, 0.04709815979003906, 0.049597740173339844, 0.052097320556640625, 0.054596900939941406, 0.05709648132324219, 0.05959606170654297, 0.06209564208984375, 0.06459522247314453, 0.06709480285644531, 0.0695943832397461, 0.07209396362304688, 0.07459354400634766, 0.07709312438964844, 0.07959270477294922, 0.08209228515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 7.0, 2.0, 8.0, 13.0, 14.0, 21.0, 29.0, 68.0, 81.0, 101.0, 172.0, 159.0, 115.0, 74.0, 49.0, 31.0, 26.0, 14.0, 12.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-05, -4.378892481327057e-05, -4.227831959724426e-05, -4.0767714381217957e-05, -3.925710916519165e-05, -3.7746503949165344e-05, -3.623589873313904e-05, -3.472529351711273e-05, -3.3214688301086426e-05, -3.170408308506012e-05, -3.0193477869033813e-05, -2.8682872653007507e-05, -2.71722674369812e-05, -2.5661662220954895e-05, -2.415105700492859e-05, -2.2640451788902283e-05, -2.1129846572875977e-05, -1.961924135684967e-05, -1.8108636140823364e-05, -1.6598030924797058e-05, -1.5087425708770752e-05, -1.3576820492744446e-05, -1.206621527671814e-05, -1.0555610060691833e-05, -9.045004844665527e-06, -7.534399628639221e-06, -6.023794412612915e-06, -4.513189196586609e-06, -3.0025839805603027e-06, -1.4919787645339966e-06, 1.862645149230957e-08, 1.5292316675186157e-06, 3.039836883544922e-06, 4.550442099571228e-06, 6.061047315597534e-06, 7.57165253162384e-06, 9.082257747650146e-06, 1.0592862963676453e-05, 1.2103468179702759e-05, 1.3614073395729065e-05, 1.5124678611755371e-05, 1.6635283827781677e-05, 1.8145889043807983e-05, 1.965649425983429e-05, 2.1167099475860596e-05, 2.2677704691886902e-05, 2.4188309907913208e-05, 2.5698915123939514e-05, 2.720952033996582e-05, 2.8720125555992126e-05, 3.0230730772018433e-05, 3.174133598804474e-05, 3.3251941204071045e-05, 3.476254642009735e-05, 3.627315163612366e-05, 3.778375685214996e-05, 3.929436206817627e-05, 4.0804967284202576e-05, 4.231557250022888e-05, 4.382617771625519e-05, 4.5336782932281494e-05, 4.68473881483078e-05, 4.8357993364334106e-05, 4.986859858036041e-05, 5.137920379638672e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 10.0, 14.0, 24.0, 16.0, 20.0, 39.0, 74.0, 114.0, 175.0, 377.0, 705.0, 1601.0, 3869.0, 11031.0, 33650.0, 102172.0, 253810.0, 335837.0, 196945.0, 71862.0, 23241.0, 7678.0, 2856.0, 1154.0, 520.0, 301.0, 174.0, 91.0, 71.0, 34.0, 28.0, 15.0, 8.0, 8.0, 7.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043060302734375, -0.0416407585144043, -0.040221214294433594, -0.03880167007446289, -0.03738212585449219, -0.035962581634521484, -0.03454303741455078, -0.03312349319458008, -0.031703948974609375, -0.030284404754638672, -0.02886486053466797, -0.027445316314697266, -0.026025772094726562, -0.02460622787475586, -0.023186683654785156, -0.021767139434814453, -0.02034759521484375, -0.018928050994873047, -0.017508506774902344, -0.01608896255493164, -0.014669418334960938, -0.013249874114990234, -0.011830329895019531, -0.010410785675048828, -0.008991241455078125, -0.007571697235107422, -0.006152153015136719, -0.004732608795166016, -0.0033130645751953125, -0.0018935203552246094, -0.00047397613525390625, 0.0009455680847167969, 0.0023651123046875, 0.003784656524658203, 0.005204200744628906, 0.006623744964599609, 0.008043289184570312, 0.009462833404541016, 0.010882377624511719, 0.012301921844482422, 0.013721466064453125, 0.015141010284423828, 0.01656055450439453, 0.017980098724365234, 0.019399642944335938, 0.02081918716430664, 0.022238731384277344, 0.023658275604248047, 0.02507781982421875, 0.026497364044189453, 0.027916908264160156, 0.02933645248413086, 0.030755996704101562, 0.032175540924072266, 0.03359508514404297, 0.03501462936401367, 0.036434173583984375, 0.03785371780395508, 0.03927326202392578, 0.040692806243896484, 0.04211235046386719, 0.04353189468383789, 0.044951438903808594, 0.0463709831237793, 0.04779052734375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 10.0, 8.0, 9.0, 13.0, 18.0, 16.0, 26.0, 32.0, 34.0, 51.0, 43.0, 45.0, 57.0, 50.0, 50.0, 75.0, 64.0, 63.0, 51.0, 39.0, 32.0, 36.0, 31.0, 31.0, 18.0, 19.0, 15.0, 10.0, 9.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.032501220703125, -0.03159904479980469, -0.030696868896484375, -0.029794692993164062, -0.02889251708984375, -0.027990341186523438, -0.027088165283203125, -0.026185989379882812, -0.0252838134765625, -0.024381637573242188, -0.023479461669921875, -0.022577285766601562, -0.02167510986328125, -0.020772933959960938, -0.019870758056640625, -0.018968582153320312, -0.01806640625, -0.017164230346679688, -0.016262054443359375, -0.015359878540039062, -0.01445770263671875, -0.013555526733398438, -0.012653350830078125, -0.011751174926757812, -0.0108489990234375, -0.009946823120117188, -0.009044647216796875, -0.008142471313476562, -0.00724029541015625, -0.0063381195068359375, -0.005435943603515625, -0.0045337677001953125, -0.003631591796875, -0.0027294158935546875, -0.001827239990234375, -0.0009250640869140625, -2.288818359375e-05, 0.0008792877197265625, 0.001781463623046875, 0.0026836395263671875, 0.0035858154296875, 0.0044879913330078125, 0.005390167236328125, 0.0062923431396484375, 0.00719451904296875, 0.008096694946289062, 0.008998870849609375, 0.009901046752929688, 0.01080322265625, 0.011705398559570312, 0.012607574462890625, 0.013509750366210938, 0.01441192626953125, 0.015314102172851562, 0.016216278076171875, 0.017118453979492188, 0.0180206298828125, 0.018922805786132812, 0.019824981689453125, 0.020727157592773438, 0.02162933349609375, 0.022531509399414062, 0.023433685302734375, 0.024335861206054688, 0.025238037109375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 23.0, 53.0, 124.0, 251.0, 246.0, 173.0, 81.0, 34.0, 11.0, 4.0, 7.0], "bins": [-1.3495289087295532, -1.3259398937225342, -1.3023508787155151, -1.2787617444992065, -1.2551727294921875, -1.2315837144851685, -1.2079946994781494, -1.1844055652618408, -1.1608165502548218, -1.1372275352478027, -1.1136385202407837, -1.090049386024475, -1.066460371017456, -1.042871356010437, -1.019282341003418, -0.9956932663917542, -0.9721041917800903, -0.9485151767730713, -0.9249261021614075, -0.9013370871543884, -0.8777480125427246, -0.8541589975357056, -0.8305699229240417, -0.8069809079170227, -0.7833918929100037, -0.7598028779029846, -0.7362138032913208, -0.7126247882843018, -0.6890357136726379, -0.6654466986656189, -0.6418576240539551, -0.618268609046936, -0.5946794748306274, -0.5710904598236084, -0.5475013852119446, -0.5239123702049255, -0.5003232955932617, -0.4767342507839203, -0.45314520597457886, -0.4295561909675598, -0.40596717596054077, -0.38237813115119934, -0.3587890863418579, -0.3352000415325165, -0.31161099672317505, -0.2880219519138336, -0.2644329071044922, -0.24084387719631195, -0.21725481748580933, -0.1936657726764679, -0.17007672786712646, -0.14648768305778503, -0.1228986456990242, -0.09930960088968277, -0.07572056353092194, -0.052131518721580505, -0.028542473912239075, -0.004953430965542793, 0.018635611981153488, 0.04222465306520462, 0.06581369787454605, 0.08940274268388748, 0.11299178004264832, 0.13658082485198975, 0.16016986966133118]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 4.0, 3.0, 4.0, 6.0, 7.0, 9.0, 13.0, 15.0, 12.0, 28.0, 26.0, 29.0, 42.0, 26.0, 39.0, 53.0, 43.0, 46.0, 44.0, 36.0, 40.0, 46.0, 46.0, 41.0, 56.0, 34.0, 30.0, 33.0, 25.0, 27.0, 31.0, 23.0, 14.0, 23.0, 12.0, 9.0, 6.0, 6.0, 6.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27329468727111816, -0.26509422063827515, -0.25689375400543213, -0.2486932873725891, -0.2404928058385849, -0.23229233920574188, -0.22409187257289886, -0.21589140594005585, -0.20769092440605164, -0.19949045777320862, -0.1912899911403656, -0.18308952450752258, -0.17488904297351837, -0.16668857634067535, -0.15848810970783234, -0.15028764307498932, -0.1420871764421463, -0.13388670980930328, -0.12568624317646027, -0.11748576909303665, -0.10928529500961304, -0.10108482837677002, -0.092884361743927, -0.08468389511108398, -0.07648342102766037, -0.06828295439481735, -0.06008248031139374, -0.05188201367855072, -0.043681543320417404, -0.03548107296228409, -0.02728060632944107, -0.019080135971307755, -0.010879665613174438, -0.002679196186363697, 0.005521273240447044, 0.013721741735935211, 0.021922212094068527, 0.030122682452201843, 0.03832314908504486, 0.04652361944317818, 0.05472408980131149, 0.06292455643415451, 0.07112503051757812, 0.07932549715042114, 0.08752596378326416, 0.09572643786668777, 0.10392690449953079, 0.1121273785829544, 0.12032784521579742, 0.12852831184864044, 0.13672877848148346, 0.14492926001548767, 0.1531297266483307, 0.1613301932811737, 0.16953065991401672, 0.17773112654685974, 0.18593159317970276, 0.19413205981254578, 0.2023325264453888, 0.2105329930782318, 0.21873347461223602, 0.22693394124507904, 0.23513440787792206, 0.24333487451076508, 0.2515353560447693]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 4.0, 6.0, 7.0, 12.0, 11.0, 15.0, 16.0, 23.0, 36.0, 56.0, 81.0, 93.0, 137.0, 161.0, 238.0, 422.0, 1094.0, 3946.0, 27651.0, 562309.0, 3240063.0, 333236.0, 19240.0, 3272.0, 916.0, 379.0, 226.0, 163.0, 116.0, 90.0, 60.0, 58.0, 37.0, 30.0, 12.0, 22.0, 10.0, 7.0, 11.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08868408203125, -0.0858621597290039, -0.08304023742675781, -0.08021831512451172, -0.07739639282226562, -0.07457447052001953, -0.07175254821777344, -0.06893062591552734, -0.06610870361328125, -0.06328678131103516, -0.06046485900878906, -0.05764293670654297, -0.054821014404296875, -0.05199909210205078, -0.04917716979980469, -0.046355247497558594, -0.0435333251953125, -0.040711402893066406, -0.03788948059082031, -0.03506755828857422, -0.032245635986328125, -0.02942371368408203, -0.026601791381835938, -0.023779869079589844, -0.02095794677734375, -0.018136024475097656, -0.015314102172851562, -0.012492179870605469, -0.009670257568359375, -0.006848335266113281, -0.0040264129638671875, -0.0012044906616210938, 0.001617431640625, 0.004439353942871094, 0.0072612762451171875, 0.010083198547363281, 0.012905120849609375, 0.01572704315185547, 0.018548965454101562, 0.021370887756347656, 0.02419281005859375, 0.027014732360839844, 0.029836654663085938, 0.03265857696533203, 0.035480499267578125, 0.03830242156982422, 0.04112434387207031, 0.043946266174316406, 0.0467681884765625, 0.049590110778808594, 0.05241203308105469, 0.05523395538330078, 0.058055877685546875, 0.06087779998779297, 0.06369972229003906, 0.06652164459228516, 0.06934356689453125, 0.07216548919677734, 0.07498741149902344, 0.07780933380126953, 0.08063125610351562, 0.08345317840576172, 0.08627510070800781, 0.0890970230102539, 0.0919189453125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 13.0, 6.0, 13.0, 11.0, 16.0, 14.0, 13.0, 40.0, 31.0, 42.0, 37.0, 39.0, 45.0, 42.0, 36.0, 52.0, 42.0, 66.0, 47.0, 51.0, 44.0, 44.0, 33.0, 40.0, 24.0, 23.0, 15.0, 25.0, 17.0, 12.0, 13.0, 15.0, 11.0, 9.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.032073974609375, -0.031070232391357422, -0.030066490173339844, -0.029062747955322266, -0.028059005737304688, -0.02705526351928711, -0.02605152130126953, -0.025047779083251953, -0.024044036865234375, -0.023040294647216797, -0.02203655242919922, -0.02103281021118164, -0.020029067993164062, -0.019025325775146484, -0.018021583557128906, -0.017017841339111328, -0.01601409912109375, -0.015010356903076172, -0.014006614685058594, -0.013002872467041016, -0.011999130249023438, -0.01099538803100586, -0.009991645812988281, -0.008987903594970703, -0.007984161376953125, -0.006980419158935547, -0.005976676940917969, -0.004972934722900391, -0.0039691925048828125, -0.0029654502868652344, -0.0019617080688476562, -0.0009579658508300781, 4.57763671875e-05, 0.0010495185852050781, 0.0020532608032226562, 0.0030570030212402344, 0.0040607452392578125, 0.005064487457275391, 0.006068229675292969, 0.007071971893310547, 0.008075714111328125, 0.009079456329345703, 0.010083198547363281, 0.01108694076538086, 0.012090682983398438, 0.013094425201416016, 0.014098167419433594, 0.015101909637451172, 0.01610565185546875, 0.017109394073486328, 0.018113136291503906, 0.019116878509521484, 0.020120620727539062, 0.02112436294555664, 0.02212810516357422, 0.023131847381591797, 0.024135589599609375, 0.025139331817626953, 0.02614307403564453, 0.02714681625366211, 0.028150558471679688, 0.029154300689697266, 0.030158042907714844, 0.031161785125732422, 0.03216552734375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 6.0, 9.0, 12.0, 22.0, 33.0, 51.0, 79.0, 136.0, 222.0, 355.0, 676.0, 1909.0, 7756.0, 52249.0, 526207.0, 2563443.0, 931629.0, 93256.0, 11680.0, 2595.0, 900.0, 422.0, 227.0, 146.0, 91.0, 56.0, 37.0, 25.0, 15.0, 10.0, 9.0, 7.0, 2.0, 2.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0643310546875, -0.06171894073486328, -0.05910682678222656, -0.056494712829589844, -0.053882598876953125, -0.051270484924316406, -0.04865837097167969, -0.04604625701904297, -0.04343414306640625, -0.04082202911376953, -0.03820991516113281, -0.035597801208496094, -0.032985687255859375, -0.030373573303222656, -0.027761459350585938, -0.02514934539794922, -0.0225372314453125, -0.01992511749267578, -0.017313003540039062, -0.014700889587402344, -0.012088775634765625, -0.009476661682128906, -0.0068645477294921875, -0.004252433776855469, -0.00164031982421875, 0.0009717941284179688, 0.0035839080810546875, 0.006196022033691406, 0.008808135986328125, 0.011420249938964844, 0.014032363891601562, 0.01664447784423828, 0.019256591796875, 0.02186870574951172, 0.024480819702148438, 0.027092933654785156, 0.029705047607421875, 0.032317161560058594, 0.03492927551269531, 0.03754138946533203, 0.04015350341796875, 0.04276561737060547, 0.04537773132324219, 0.047989845275878906, 0.050601959228515625, 0.053214073181152344, 0.05582618713378906, 0.05843830108642578, 0.0610504150390625, 0.06366252899169922, 0.06627464294433594, 0.06888675689697266, 0.07149887084960938, 0.0741109848022461, 0.07672309875488281, 0.07933521270751953, 0.08194732666015625, 0.08455944061279297, 0.08717155456542969, 0.0897836685180664, 0.09239578247070312, 0.09500789642333984, 0.09762001037597656, 0.10023212432861328, 0.10284423828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 11.0, 6.0, 8.0, 13.0, 10.0, 18.0, 24.0, 25.0, 36.0, 42.0, 58.0, 69.0, 98.0, 118.0, 151.0, 196.0, 222.0, 263.0, 265.0, 280.0, 306.0, 300.0, 285.0, 231.0, 190.0, 186.0, 151.0, 107.0, 88.0, 74.0, 54.0, 63.0, 39.0, 27.0, 13.0, 13.0, 11.0, 12.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0439453125, -0.0427393913269043, -0.041533470153808594, -0.04032754898071289, -0.03912162780761719, -0.037915706634521484, -0.03670978546142578, -0.03550386428833008, -0.034297943115234375, -0.03309202194213867, -0.03188610076904297, -0.030680179595947266, -0.029474258422851562, -0.02826833724975586, -0.027062416076660156, -0.025856494903564453, -0.02465057373046875, -0.023444652557373047, -0.022238731384277344, -0.02103281021118164, -0.019826889038085938, -0.018620967864990234, -0.01741504669189453, -0.016209125518798828, -0.015003204345703125, -0.013797283172607422, -0.012591361999511719, -0.011385440826416016, -0.010179519653320312, -0.00897359848022461, -0.007767677307128906, -0.006561756134033203, -0.0053558349609375, -0.004149913787841797, -0.0029439926147460938, -0.0017380714416503906, -0.0005321502685546875, 0.0006737709045410156, 0.0018796920776367188, 0.003085613250732422, 0.004291534423828125, 0.005497455596923828, 0.006703376770019531, 0.007909297943115234, 0.009115219116210938, 0.01032114028930664, 0.011527061462402344, 0.012732982635498047, 0.01393890380859375, 0.015144824981689453, 0.016350746154785156, 0.01755666732788086, 0.018762588500976562, 0.019968509674072266, 0.02117443084716797, 0.022380352020263672, 0.023586273193359375, 0.024792194366455078, 0.02599811553955078, 0.027204036712646484, 0.028409957885742188, 0.02961587905883789, 0.030821800231933594, 0.0320277214050293, 0.033233642578125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 14.0, 17.0, 25.0, 46.0, 79.0, 111.0, 127.0, 165.0, 131.0, 109.0, 78.0, 47.0, 21.0, 18.0, 9.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4146982431411743, -0.40541550517082214, -0.39613276720046997, -0.3868500292301178, -0.3775672912597656, -0.36828452348709106, -0.3590018153190613, -0.3497190475463867, -0.34043630957603455, -0.3311535716056824, -0.3218708336353302, -0.312588095664978, -0.30330535769462585, -0.2940226197242737, -0.2847398519515991, -0.27545711398124695, -0.2661743760108948, -0.2568916380405426, -0.24760890007019043, -0.23832616209983826, -0.2290434092283249, -0.21976067125797272, -0.21047793328762054, -0.20119518041610718, -0.1919124722480774, -0.18262973427772522, -0.17334699630737305, -0.16406425833702087, -0.1547815054655075, -0.14549876749515533, -0.13621602952480316, -0.1269332766532898, -0.11765053868293762, -0.10836780071258545, -0.09908505529165268, -0.0898023173213005, -0.08051957190036774, -0.07123683393001556, -0.06195409595966339, -0.05267135053873062, -0.04338861256837845, -0.03410587087273598, -0.024823131039738655, -0.015540391206741333, -0.006257649511098862, 0.0030250921845436096, 0.012307830154895782, 0.021590575575828552, 0.030873313546180725, 0.040156055241823196, 0.04943879693746567, 0.05872153490781784, 0.06800428032875061, 0.07728701829910278, 0.08656975626945496, 0.09585250169038773, 0.1051352396607399, 0.11441797763109207, 0.12370072305202484, 0.13298346102237701, 0.1422661989927292, 0.15154895186424255, 0.16083168983459473, 0.1701144278049469, 0.17939716577529907]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 8.0, 7.0, 15.0, 21.0, 21.0, 19.0, 37.0, 17.0, 30.0, 35.0, 29.0, 29.0, 34.0, 45.0, 39.0, 53.0, 33.0, 45.0, 39.0, 48.0, 48.0, 36.0, 28.0, 31.0, 27.0, 31.0, 22.0, 18.0, 23.0, 25.0, 18.0, 11.0, 15.0, 7.0, 7.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14856374263763428, -0.14370004832744598, -0.1388363540172577, -0.1339726597070694, -0.1291089653968811, -0.12424526363611221, -0.11938156187534332, -0.11451786756515503, -0.10965417325496674, -0.10479047894477844, -0.09992678463459015, -0.09506308287382126, -0.09019938856363297, -0.08533569425344467, -0.08047199249267578, -0.07560829818248749, -0.0707446038722992, -0.0658809095621109, -0.06101721152663231, -0.05615351349115372, -0.051289819180965424, -0.04642612487077713, -0.04156242683529854, -0.036698728799819946, -0.03183503448963165, -0.02697133831679821, -0.022107642143964767, -0.017243945971131325, -0.012380249798297882, -0.007516553625464439, -0.0026528574526309967, 0.002210840582847595, 0.007074534893035889, 0.011938231065869331, 0.016801927238702774, 0.021665623411536217, 0.02652931958436966, 0.03139301389455795, 0.036256711930036545, 0.04112040996551514, 0.04598410427570343, 0.050847798585891724, 0.055711496621370316, 0.06057519465684891, 0.0654388889670372, 0.0703025832772255, 0.07516628503799438, 0.08002997934818268, 0.08489367365837097, 0.08975736796855927, 0.09462106227874756, 0.09948476403951645, 0.10434845834970474, 0.10921215265989304, 0.11407585442066193, 0.11893954873085022, 0.12380324304103851, 0.1286669373512268, 0.1335306316614151, 0.1383943259716034, 0.14325803518295288, 0.14812172949314117, 0.15298542380332947, 0.15784911811351776, 0.16271281242370605]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 6.0, 10.0, 8.0, 21.0, 25.0, 35.0, 44.0, 90.0, 121.0, 188.0, 392.0, 810.0, 1793.0, 4556.0, 11778.0, 32618.0, 113697.0, 380665.0, 352613.0, 100803.0, 30072.0, 10832.0, 4120.0, 1665.0, 752.0, 312.0, 175.0, 119.0, 79.0, 41.0, 30.0, 27.0, 21.0, 6.0, 9.0, 10.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1168212890625, -0.11327648162841797, -0.10973167419433594, -0.1061868667602539, -0.10264205932617188, -0.09909725189208984, -0.09555244445800781, -0.09200763702392578, -0.08846282958984375, -0.08491802215576172, -0.08137321472167969, -0.07782840728759766, -0.07428359985351562, -0.0707387924194336, -0.06719398498535156, -0.06364917755126953, -0.0601043701171875, -0.05655956268310547, -0.05301475524902344, -0.049469947814941406, -0.045925140380859375, -0.042380332946777344, -0.03883552551269531, -0.03529071807861328, -0.03174591064453125, -0.02820110321044922, -0.024656295776367188, -0.021111488342285156, -0.017566680908203125, -0.014021873474121094, -0.010477066040039062, -0.006932258605957031, -0.003387451171875, 0.00015735626220703125, 0.0037021636962890625, 0.007246971130371094, 0.010791778564453125, 0.014336585998535156, 0.017881393432617188, 0.02142620086669922, 0.02497100830078125, 0.02851581573486328, 0.03206062316894531, 0.035605430603027344, 0.039150238037109375, 0.042695045471191406, 0.04623985290527344, 0.04978466033935547, 0.0533294677734375, 0.05687427520751953, 0.06041908264160156, 0.0639638900756836, 0.06750869750976562, 0.07105350494384766, 0.07459831237792969, 0.07814311981201172, 0.08168792724609375, 0.08523273468017578, 0.08877754211425781, 0.09232234954833984, 0.09586715698242188, 0.0994119644165039, 0.10295677185058594, 0.10650157928466797, 0.11004638671875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 9.0, 10.0, 18.0, 15.0, 17.0, 23.0, 28.0, 38.0, 35.0, 38.0, 37.0, 42.0, 57.0, 51.0, 56.0, 56.0, 49.0, 60.0, 40.0, 43.0, 45.0, 36.0, 29.0, 34.0, 31.0, 22.0, 16.0, 7.0, 10.0, 11.0, 7.0, 8.0, 3.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0364990234375, -0.035466909408569336, -0.03443479537963867, -0.03340268135070801, -0.032370567321777344, -0.03133845329284668, -0.030306339263916016, -0.02927422523498535, -0.028242111206054688, -0.027209997177124023, -0.02617788314819336, -0.025145769119262695, -0.02411365509033203, -0.023081541061401367, -0.022049427032470703, -0.02101731300354004, -0.019985198974609375, -0.01895308494567871, -0.017920970916748047, -0.016888856887817383, -0.01585674285888672, -0.014824628829956055, -0.01379251480102539, -0.012760400772094727, -0.011728286743164062, -0.010696172714233398, -0.009664058685302734, -0.00863194465637207, -0.007599830627441406, -0.006567716598510742, -0.005535602569580078, -0.004503488540649414, -0.00347137451171875, -0.002439260482788086, -0.0014071464538574219, -0.0003750324249267578, 0.0006570816040039062, 0.0016891956329345703, 0.0027213096618652344, 0.0037534236907958984, 0.0047855377197265625, 0.0058176517486572266, 0.006849765777587891, 0.007881879806518555, 0.008913993835449219, 0.009946107864379883, 0.010978221893310547, 0.012010335922241211, 0.013042449951171875, 0.014074563980102539, 0.015106678009033203, 0.016138792037963867, 0.01717090606689453, 0.018203020095825195, 0.01923513412475586, 0.020267248153686523, 0.021299362182617188, 0.02233147621154785, 0.023363590240478516, 0.02439570426940918, 0.025427818298339844, 0.026459932327270508, 0.027492046356201172, 0.028524160385131836, 0.0295562744140625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 10.0, 9.0, 7.0, 15.0, 21.0, 22.0, 28.0, 52.0, 73.0, 85.0, 111.0, 154.0, 215.0, 336.0, 504.0, 989.0, 1984.0, 4391.0, 10037.0, 24094.0, 59981.0, 148319.0, 289543.0, 277137.0, 135897.0, 55030.0, 21891.0, 9317.0, 4010.0, 1807.0, 918.0, 519.0, 283.0, 200.0, 139.0, 96.0, 77.0, 64.0, 42.0, 38.0, 27.0, 21.0, 16.0, 10.0, 7.0, 7.0, 2.0, 9.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.07745361328125, -0.07502937316894531, -0.07260513305664062, -0.07018089294433594, -0.06775665283203125, -0.06533241271972656, -0.06290817260742188, -0.06048393249511719, -0.0580596923828125, -0.05563545227050781, -0.053211212158203125, -0.05078697204589844, -0.04836273193359375, -0.04593849182128906, -0.043514251708984375, -0.04109001159667969, -0.038665771484375, -0.03624153137207031, -0.033817291259765625, -0.03139305114746094, -0.02896881103515625, -0.026544570922851562, -0.024120330810546875, -0.021696090698242188, -0.0192718505859375, -0.016847610473632812, -0.014423370361328125, -0.011999130249023438, -0.00957489013671875, -0.0071506500244140625, -0.004726409912109375, -0.0023021697998046875, 0.0001220703125, 0.0025463104248046875, 0.004970550537109375, 0.0073947906494140625, 0.00981903076171875, 0.012243270874023438, 0.014667510986328125, 0.017091751098632812, 0.0195159912109375, 0.021940231323242188, 0.024364471435546875, 0.026788711547851562, 0.02921295166015625, 0.03163719177246094, 0.034061431884765625, 0.03648567199707031, 0.038909912109375, 0.04133415222167969, 0.043758392333984375, 0.04618263244628906, 0.04860687255859375, 0.05103111267089844, 0.053455352783203125, 0.05587959289550781, 0.0583038330078125, 0.06072807312011719, 0.06315231323242188, 0.06557655334472656, 0.06800079345703125, 0.07042503356933594, 0.07284927368164062, 0.07527351379394531, 0.07769775390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 13.0, 9.0, 6.0, 8.0, 10.0, 11.0, 10.0, 19.0, 20.0, 13.0, 16.0, 25.0, 43.0, 33.0, 36.0, 40.0, 39.0, 38.0, 32.0, 40.0, 37.0, 37.0, 38.0, 33.0, 42.0, 34.0, 34.0, 28.0, 32.0, 23.0, 28.0, 25.0, 22.0, 20.0, 21.0, 17.0, 11.0, 9.0, 6.0, 6.0, 6.0, 4.0, 8.0, 0.0, 3.0, 5.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.07525634765625, -0.07300090789794922, -0.07074546813964844, -0.06849002838134766, -0.06623458862304688, -0.0639791488647461, -0.06172370910644531, -0.05946826934814453, -0.05721282958984375, -0.05495738983154297, -0.05270195007324219, -0.050446510314941406, -0.048191070556640625, -0.045935630798339844, -0.04368019104003906, -0.04142475128173828, -0.0391693115234375, -0.03691387176513672, -0.03465843200683594, -0.032402992248535156, -0.030147552490234375, -0.027892112731933594, -0.025636672973632812, -0.02338123321533203, -0.02112579345703125, -0.01887035369873047, -0.016614913940429688, -0.014359474182128906, -0.012104034423828125, -0.009848594665527344, -0.0075931549072265625, -0.005337715148925781, -0.003082275390625, -0.0008268356323242188, 0.0014286041259765625, 0.0036840438842773438, 0.005939483642578125, 0.008194923400878906, 0.010450363159179688, 0.012705802917480469, 0.01496124267578125, 0.01721668243408203, 0.019472122192382812, 0.021727561950683594, 0.023983001708984375, 0.026238441467285156, 0.028493881225585938, 0.03074932098388672, 0.0330047607421875, 0.03526020050048828, 0.03751564025878906, 0.039771080017089844, 0.042026519775390625, 0.044281959533691406, 0.04653739929199219, 0.04879283905029297, 0.05104827880859375, 0.05330371856689453, 0.05555915832519531, 0.057814598083496094, 0.060070037841796875, 0.062325477600097656, 0.06458091735839844, 0.06683635711669922, 0.069091796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 11.0, 3.0, 12.0, 20.0, 29.0, 45.0, 75.0, 104.0, 170.0, 315.0, 495.0, 833.0, 1439.0, 2521.0, 4216.0, 7838.0, 13959.0, 26917.0, 55336.0, 116531.0, 210117.0, 249681.0, 176922.0, 90772.0, 42778.0, 21158.0, 11340.0, 6268.0, 3541.0, 2059.0, 1209.0, 696.0, 419.0, 268.0, 161.0, 103.0, 65.0, 42.0, 27.0, 16.0, 11.0, 9.0, 5.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.028045654296875, -0.027150392532348633, -0.026255130767822266, -0.0253598690032959, -0.02446460723876953, -0.023569345474243164, -0.022674083709716797, -0.02177882194519043, -0.020883560180664062, -0.019988298416137695, -0.019093036651611328, -0.01819777488708496, -0.017302513122558594, -0.016407251358032227, -0.01551198959350586, -0.014616727828979492, -0.013721466064453125, -0.012826204299926758, -0.01193094253540039, -0.011035680770874023, -0.010140419006347656, -0.009245157241821289, -0.008349895477294922, -0.007454633712768555, -0.0065593719482421875, -0.00566411018371582, -0.004768848419189453, -0.003873586654663086, -0.0029783248901367188, -0.0020830631256103516, -0.0011878013610839844, -0.0002925395965576172, 0.00060272216796875, 0.0014979839324951172, 0.0023932456970214844, 0.0032885074615478516, 0.004183769226074219, 0.005079030990600586, 0.005974292755126953, 0.00686955451965332, 0.0077648162841796875, 0.008660078048706055, 0.009555339813232422, 0.010450601577758789, 0.011345863342285156, 0.012241125106811523, 0.01313638687133789, 0.014031648635864258, 0.014926910400390625, 0.015822172164916992, 0.01671743392944336, 0.017612695693969727, 0.018507957458496094, 0.01940321922302246, 0.020298480987548828, 0.021193742752075195, 0.022089004516601562, 0.02298426628112793, 0.023879528045654297, 0.024774789810180664, 0.02567005157470703, 0.0265653133392334, 0.027460575103759766, 0.028355836868286133, 0.0292510986328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 3.0, 6.0, 8.0, 6.0, 3.0, 13.0, 7.0, 8.0, 14.0, 16.0, 27.0, 22.0, 38.0, 36.0, 54.0, 62.0, 67.0, 62.0, 58.0, 77.0, 39.0, 41.0, 61.0, 54.0, 26.0, 29.0, 25.0, 24.0, 24.0, 10.0, 19.0, 11.0, 7.0, 8.0, 8.0, 7.0, 4.0, 0.0, 6.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5735626220703125e-05, -1.524016261100769e-05, -1.4744699001312256e-05, -1.4249235391616821e-05, -1.3753771781921387e-05, -1.3258308172225952e-05, -1.2762844562530518e-05, -1.2267380952835083e-05, -1.1771917343139648e-05, -1.1276453733444214e-05, -1.078099012374878e-05, -1.0285526514053345e-05, -9.79006290435791e-06, -9.294599294662476e-06, -8.799135684967041e-06, -8.303672075271606e-06, -7.808208465576172e-06, -7.312744855880737e-06, -6.817281246185303e-06, -6.321817636489868e-06, -5.826354026794434e-06, -5.330890417098999e-06, -4.8354268074035645e-06, -4.33996319770813e-06, -3.844499588012695e-06, -3.3490359783172607e-06, -2.853572368621826e-06, -2.3581087589263916e-06, -1.862645149230957e-06, -1.3671815395355225e-06, -8.717179298400879e-07, -3.762543201446533e-07, 1.1920928955078125e-07, 6.146728992462158e-07, 1.1101365089416504e-06, 1.605600118637085e-06, 2.1010637283325195e-06, 2.596527338027954e-06, 3.0919909477233887e-06, 3.5874545574188232e-06, 4.082918167114258e-06, 4.578381776809692e-06, 5.073845386505127e-06, 5.5693089962005615e-06, 6.064772605895996e-06, 6.560236215591431e-06, 7.055699825286865e-06, 7.5511634349823e-06, 8.046627044677734e-06, 8.542090654373169e-06, 9.037554264068604e-06, 9.533017873764038e-06, 1.0028481483459473e-05, 1.0523945093154907e-05, 1.1019408702850342e-05, 1.1514872312545776e-05, 1.2010335922241211e-05, 1.2505799531936646e-05, 1.300126314163208e-05, 1.3496726751327515e-05, 1.399219036102295e-05, 1.4487653970718384e-05, 1.4983117580413818e-05, 1.5478581190109253e-05, 1.5974044799804688e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 12.0, 8.0, 6.0, 15.0, 25.0, 33.0, 52.0, 78.0, 102.0, 148.0, 263.0, 420.0, 797.0, 1243.0, 2463.0, 4556.0, 9234.0, 19270.0, 45065.0, 114898.0, 251801.0, 300195.0, 173616.0, 69315.0, 28180.0, 13069.0, 6320.0, 3227.0, 1789.0, 942.0, 533.0, 311.0, 181.0, 113.0, 76.0, 61.0, 33.0, 23.0, 23.0, 23.0, 6.0, 7.0, 9.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.030303955078125, -0.029267311096191406, -0.028230667114257812, -0.02719402313232422, -0.026157379150390625, -0.02512073516845703, -0.024084091186523438, -0.023047447204589844, -0.02201080322265625, -0.020974159240722656, -0.019937515258789062, -0.01890087127685547, -0.017864227294921875, -0.01682758331298828, -0.015790939331054688, -0.014754295349121094, -0.0137176513671875, -0.012681007385253906, -0.011644363403320312, -0.010607719421386719, -0.009571075439453125, -0.008534431457519531, -0.0074977874755859375, -0.006461143493652344, -0.00542449951171875, -0.004387855529785156, -0.0033512115478515625, -0.0023145675659179688, -0.001277923583984375, -0.00024127960205078125, 0.0007953643798828125, 0.0018320083618164062, 0.00286865234375, 0.0039052963256835938, 0.0049419403076171875, 0.005978584289550781, 0.007015228271484375, 0.008051872253417969, 0.009088516235351562, 0.010125160217285156, 0.01116180419921875, 0.012198448181152344, 0.013235092163085938, 0.014271736145019531, 0.015308380126953125, 0.01634502410888672, 0.017381668090820312, 0.018418312072753906, 0.0194549560546875, 0.020491600036621094, 0.021528244018554688, 0.02256488800048828, 0.023601531982421875, 0.02463817596435547, 0.025674819946289062, 0.026711463928222656, 0.02774810791015625, 0.028784751892089844, 0.029821395874023438, 0.03085803985595703, 0.031894683837890625, 0.03293132781982422, 0.03396797180175781, 0.035004615783691406, 0.036041259765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 4.0, 6.0, 4.0, 7.0, 8.0, 13.0, 6.0, 18.0, 19.0, 28.0, 26.0, 30.0, 26.0, 51.0, 51.0, 58.0, 64.0, 49.0, 76.0, 52.0, 47.0, 51.0, 51.0, 32.0, 33.0, 21.0, 31.0, 21.0, 18.0, 17.0, 15.0, 18.0, 7.0, 8.0, 5.0, 4.0, 4.0, 3.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.024627685546875, -0.023848295211791992, -0.023068904876708984, -0.022289514541625977, -0.02151012420654297, -0.02073073387145996, -0.019951343536376953, -0.019171953201293945, -0.018392562866210938, -0.01761317253112793, -0.016833782196044922, -0.016054391860961914, -0.015275001525878906, -0.014495611190795898, -0.01371622085571289, -0.012936830520629883, -0.012157440185546875, -0.011378049850463867, -0.01059865951538086, -0.009819269180297852, -0.009039878845214844, -0.008260488510131836, -0.007481098175048828, -0.00670170783996582, -0.0059223175048828125, -0.005142927169799805, -0.004363536834716797, -0.003584146499633789, -0.0028047561645507812, -0.0020253658294677734, -0.0012459754943847656, -0.0004665851593017578, 0.00031280517578125, 0.0010921955108642578, 0.0018715858459472656, 0.0026509761810302734, 0.0034303665161132812, 0.004209756851196289, 0.004989147186279297, 0.005768537521362305, 0.0065479278564453125, 0.00732731819152832, 0.008106708526611328, 0.008886098861694336, 0.009665489196777344, 0.010444879531860352, 0.01122426986694336, 0.012003660202026367, 0.012783050537109375, 0.013562440872192383, 0.01434183120727539, 0.015121221542358398, 0.015900611877441406, 0.016680002212524414, 0.017459392547607422, 0.01823878288269043, 0.019018173217773438, 0.019797563552856445, 0.020576953887939453, 0.02135634422302246, 0.02213573455810547, 0.022915124893188477, 0.023694515228271484, 0.024473905563354492, 0.0252532958984375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 11.0, 39.0, 74.0, 180.0, 254.0, 235.0, 141.0, 54.0, 15.0, 5.0, 5.0, 2.0], "bins": [-1.3594342470169067, -1.3354487419128418, -1.3114632368087769, -1.287477731704712, -1.2634923458099365, -1.2395068407058716, -1.2155213356018066, -1.1915358304977417, -1.1675503253936768, -1.1435648202896118, -1.1195793151855469, -1.095593810081482, -1.0716084241867065, -1.0476229190826416, -1.0236374139785767, -0.9996519088745117, -0.9756664037704468, -0.9516808986663818, -0.9276954531669617, -0.9037099480628967, -0.8797244429588318, -0.8557389378547668, -0.8317534923553467, -0.8077679872512817, -0.7837825417518616, -0.7597970366477966, -0.7358115911483765, -0.7118260860443115, -0.6878405809402466, -0.6638550758361816, -0.6398696303367615, -0.6158841252326965, -0.5918985605239868, -0.5679130554199219, -0.5439276099205017, -0.5199421048164368, -0.4959565997123718, -0.4719711244106293, -0.4479856491088867, -0.4240001440048218, -0.4000146687030792, -0.37602919340133667, -0.35204368829727173, -0.3280582129955292, -0.30407270789146423, -0.2800872325897217, -0.25610172748565674, -0.23211625218391418, -0.20813076198101044, -0.1841452717781067, -0.16015978157520294, -0.1361742913722992, -0.11218880861997604, -0.0882033184170723, -0.06421783566474915, -0.0402323454618454, -0.01624685525894165, 0.007738633081316948, 0.031724121421575546, 0.055709607899188995, 0.07969509810209274, 0.10368058830499649, 0.12766607105731964, 0.1516515612602234, 0.17563705146312714]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 4.0, 6.0, 5.0, 8.0, 10.0, 10.0, 13.0, 23.0, 16.0, 14.0, 30.0, 29.0, 20.0, 43.0, 35.0, 32.0, 49.0, 49.0, 47.0, 62.0, 50.0, 52.0, 40.0, 34.0, 44.0, 27.0, 36.0, 30.0, 28.0, 29.0, 21.0, 20.0, 14.0, 17.0, 13.0, 8.0, 12.0, 9.0, 9.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.309553861618042, -0.3011791706085205, -0.29280444979667664, -0.28442972898483276, -0.2760550379753113, -0.2676803469657898, -0.2593056261539459, -0.25093090534210205, -0.24255621433258057, -0.2341815084218979, -0.2258068025112152, -0.21743209660053253, -0.20905739068984985, -0.20068268477916718, -0.1923079788684845, -0.18393327295780182, -0.17555856704711914, -0.16718386113643646, -0.15880915522575378, -0.1504344493150711, -0.14205974340438843, -0.13368503749370575, -0.12531033158302307, -0.1169356256723404, -0.10856091976165771, -0.10018621385097504, -0.09181150794029236, -0.08343680202960968, -0.075062096118927, -0.06668739020824432, -0.058312684297561646, -0.04993797838687897, -0.04156327247619629, -0.03318856656551361, -0.024813860654830933, -0.016439154744148254, -0.008064448833465576, 0.00031025707721710205, 0.00868496298789978, 0.01705966889858246, 0.025434374809265137, 0.033809080719947815, 0.04218378663063049, 0.05055849254131317, 0.05893319845199585, 0.06730790436267853, 0.0756826102733612, 0.08405731618404388, 0.09243202209472656, 0.10080672800540924, 0.10918143391609192, 0.1175561398267746, 0.12593084573745728, 0.13430555164813995, 0.14268025755882263, 0.1510549634695053, 0.159429669380188, 0.16780437529087067, 0.17617908120155334, 0.18455378711223602, 0.1929284930229187, 0.20130319893360138, 0.20967790484428406, 0.21805261075496674, 0.22642731666564941]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 12.0, 15.0, 18.0, 26.0, 31.0, 56.0, 89.0, 142.0, 206.0, 366.0, 686.0, 1379.0, 3392.0, 9229.0, 29643.0, 128808.0, 763541.0, 2142959.0, 909036.0, 152981.0, 34142.0, 10434.0, 3679.0, 1521.0, 759.0, 439.0, 221.0, 127.0, 107.0, 80.0, 47.0, 31.0, 24.0, 14.0, 18.0, 4.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.05206298828125, -0.05051136016845703, -0.04895973205566406, -0.047408103942871094, -0.045856475830078125, -0.044304847717285156, -0.04275321960449219, -0.04120159149169922, -0.03964996337890625, -0.03809833526611328, -0.03654670715332031, -0.034995079040527344, -0.033443450927734375, -0.031891822814941406, -0.030340194702148438, -0.02878856658935547, -0.0272369384765625, -0.02568531036376953, -0.024133682250976562, -0.022582054138183594, -0.021030426025390625, -0.019478797912597656, -0.017927169799804688, -0.01637554168701172, -0.01482391357421875, -0.013272285461425781, -0.011720657348632812, -0.010169029235839844, -0.008617401123046875, -0.007065773010253906, -0.0055141448974609375, -0.003962516784667969, -0.002410888671875, -0.0008592605590820312, 0.0006923675537109375, 0.0022439956665039062, 0.003795623779296875, 0.005347251892089844, 0.0068988800048828125, 0.008450508117675781, 0.01000213623046875, 0.011553764343261719, 0.013105392456054688, 0.014657020568847656, 0.016208648681640625, 0.017760276794433594, 0.019311904907226562, 0.02086353302001953, 0.0224151611328125, 0.02396678924560547, 0.025518417358398438, 0.027070045471191406, 0.028621673583984375, 0.030173301696777344, 0.03172492980957031, 0.03327655792236328, 0.03482818603515625, 0.03637981414794922, 0.03793144226074219, 0.039483070373535156, 0.041034698486328125, 0.042586326599121094, 0.04413795471191406, 0.04568958282470703, 0.0472412109375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 9.0, 3.0, 7.0, 18.0, 19.0, 17.0, 20.0, 29.0, 24.0, 28.0, 29.0, 31.0, 37.0, 45.0, 44.0, 49.0, 55.0, 39.0, 33.0, 56.0, 38.0, 44.0, 41.0, 39.0, 24.0, 37.0, 25.0, 25.0, 15.0, 19.0, 16.0, 10.0, 16.0, 14.0, 6.0, 5.0, 6.0, 9.0, 7.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.02825927734375, -0.027347564697265625, -0.02643585205078125, -0.025524139404296875, -0.0246124267578125, -0.023700714111328125, -0.02278900146484375, -0.021877288818359375, -0.020965576171875, -0.020053863525390625, -0.01914215087890625, -0.018230438232421875, -0.0173187255859375, -0.016407012939453125, -0.01549530029296875, -0.014583587646484375, -0.013671875, -0.012760162353515625, -0.01184844970703125, -0.010936737060546875, -0.0100250244140625, -0.009113311767578125, -0.00820159912109375, -0.007289886474609375, -0.006378173828125, -0.005466461181640625, -0.00455474853515625, -0.003643035888671875, -0.0027313232421875, -0.001819610595703125, -0.00090789794921875, 3.814697265625e-06, 0.00091552734375, 0.001827239990234375, 0.00273895263671875, 0.003650665283203125, 0.0045623779296875, 0.005474090576171875, 0.00638580322265625, 0.007297515869140625, 0.008209228515625, 0.009120941162109375, 0.01003265380859375, 0.010944366455078125, 0.0118560791015625, 0.012767791748046875, 0.01367950439453125, 0.014591217041015625, 0.0155029296875, 0.016414642333984375, 0.01732635498046875, 0.018238067626953125, 0.0191497802734375, 0.020061492919921875, 0.02097320556640625, 0.021884918212890625, 0.022796630859375, 0.023708343505859375, 0.02462005615234375, 0.025531768798828125, 0.0264434814453125, 0.027355194091796875, 0.02826690673828125, 0.029178619384765625, 0.03009033203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 14.0, 19.0, 39.0, 70.0, 142.0, 289.0, 769.0, 4011.0, 78167.0, 2733496.0, 1343081.0, 30780.0, 2343.0, 564.0, 239.0, 106.0, 61.0, 45.0, 12.0, 16.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1072998046875, -0.10280418395996094, -0.09830856323242188, -0.09381294250488281, -0.08931732177734375, -0.08482170104980469, -0.08032608032226562, -0.07583045959472656, -0.0713348388671875, -0.06683921813964844, -0.062343597412109375, -0.05784797668457031, -0.05335235595703125, -0.04885673522949219, -0.044361114501953125, -0.03986549377441406, -0.035369873046875, -0.030874252319335938, -0.026378631591796875, -0.021883010864257812, -0.01738739013671875, -0.012891769409179688, -0.008396148681640625, -0.0039005279541015625, 0.0005950927734375, 0.0050907135009765625, 0.009586334228515625, 0.014081954956054688, 0.01857757568359375, 0.023073196411132812, 0.027568817138671875, 0.03206443786621094, 0.03656005859375, 0.04105567932128906, 0.045551300048828125, 0.05004692077636719, 0.05454254150390625, 0.05903816223144531, 0.06353378295898438, 0.06802940368652344, 0.0725250244140625, 0.07702064514160156, 0.08151626586914062, 0.08601188659667969, 0.09050750732421875, 0.09500312805175781, 0.09949874877929688, 0.10399436950683594, 0.108489990234375, 0.11298561096191406, 0.11748123168945312, 0.12197685241699219, 0.12647247314453125, 0.1309680938720703, 0.13546371459960938, 0.13995933532714844, 0.1444549560546875, 0.14895057678222656, 0.15344619750976562, 0.1579418182373047, 0.16243743896484375, 0.1669330596923828, 0.17142868041992188, 0.17592430114746094, 0.180419921875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 23.0, 27.0, 46.0, 56.0, 88.0, 148.0, 232.0, 298.0, 419.0, 478.0, 550.0, 490.0, 338.0, 290.0, 238.0, 123.0, 82.0, 53.0, 38.0, 18.0, 14.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0775146484375, -0.075439453125, -0.0733642578125, -0.0712890625, -0.0692138671875, -0.067138671875, -0.0650634765625, -0.06298828125, -0.0609130859375, -0.058837890625, -0.0567626953125, -0.0546875, -0.0526123046875, -0.050537109375, -0.0484619140625, -0.04638671875, -0.0443115234375, -0.042236328125, -0.0401611328125, -0.0380859375, -0.0360107421875, -0.033935546875, -0.0318603515625, -0.02978515625, -0.0277099609375, -0.025634765625, -0.0235595703125, -0.021484375, -0.0194091796875, -0.017333984375, -0.0152587890625, -0.01318359375, -0.0111083984375, -0.009033203125, -0.0069580078125, -0.0048828125, -0.0028076171875, -0.000732421875, 0.0013427734375, 0.00341796875, 0.0054931640625, 0.007568359375, 0.0096435546875, 0.01171875, 0.0137939453125, 0.015869140625, 0.0179443359375, 0.02001953125, 0.0220947265625, 0.024169921875, 0.0262451171875, 0.0283203125, 0.0303955078125, 0.032470703125, 0.0345458984375, 0.03662109375, 0.0386962890625, 0.040771484375, 0.0428466796875, 0.044921875, 0.0469970703125, 0.049072265625, 0.0511474609375, 0.05322265625, 0.0552978515625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 11.0, 19.0, 28.0, 58.0, 111.0, 146.0, 175.0, 180.0, 117.0, 55.0, 50.0, 18.0, 20.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4937243163585663, -0.481842964887619, -0.46996158361434937, -0.4580802321434021, -0.44619888067245483, -0.43431752920150757, -0.4224361479282379, -0.41055479645729065, -0.398673415184021, -0.38679206371307373, -0.3749106824398041, -0.3630293309688568, -0.35114797949790955, -0.3392665982246399, -0.3273852467536926, -0.31550389528274536, -0.3036225438117981, -0.29174119234085083, -0.2798598110675812, -0.2679784595966339, -0.25609710812568665, -0.24421574175357819, -0.23233437538146973, -0.22045302391052246, -0.208571657538414, -0.19669029116630554, -0.18480893969535828, -0.17292757332324982, -0.16104620695114136, -0.1491648554801941, -0.13728348910808563, -0.12540212273597717, -0.11352074146270752, -0.10163938254117966, -0.0897580236196518, -0.07787665724754333, -0.06599529832601547, -0.05411393940448761, -0.04223257303237915, -0.030351214110851288, -0.018469855189323425, -0.0065884944051504135, 0.005292866379022598, 0.01717422902584076, 0.029055587947368622, 0.040936946868896484, 0.052818313241004944, 0.0646996721625328, 0.07658103108406067, 0.08846239000558853, 0.1003437489271164, 0.11222511529922485, 0.12410647422075272, 0.13598783314228058, 0.14786919951438904, 0.1597505509853363, 0.17163191735744476, 0.18351328372955322, 0.1953946352005005, 0.20727600157260895, 0.2191573679447174, 0.23103871941566467, 0.24292008578777313, 0.2548014521598816, 0.26668280363082886]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 4.0, 7.0, 4.0, 12.0, 22.0, 12.0, 11.0, 13.0, 18.0, 15.0, 23.0, 39.0, 29.0, 43.0, 42.0, 36.0, 38.0, 32.0, 36.0, 39.0, 45.0, 40.0, 44.0, 41.0, 41.0, 33.0, 34.0, 33.0, 23.0, 29.0, 28.0, 15.0, 19.0, 11.0, 10.0, 12.0, 16.0, 11.0, 3.0, 7.0, 13.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.14827698469161987, -0.1432119905948639, -0.1381469964981079, -0.13308200240135193, -0.12801700830459595, -0.12295201420783997, -0.11788702756166458, -0.1128220334649086, -0.10775703936815262, -0.10269204527139664, -0.09762705117464066, -0.09256205707788467, -0.08749707043170929, -0.08243207633495331, -0.07736708223819733, -0.07230208814144135, -0.06723709404468536, -0.06217209994792938, -0.0571071058511734, -0.05204211547970772, -0.046977121382951736, -0.041912127286195755, -0.03684713691473007, -0.03178214281797409, -0.02671714872121811, -0.021652154624462128, -0.016587162390351295, -0.011522169224917889, -0.006457176059484482, -0.0013921819627285004, 0.003672810271382332, 0.008737802505493164, 0.013802796602249146, 0.018867790699005127, 0.02393278293311596, 0.02899777516722679, 0.03406276926398277, 0.039127763360738754, 0.04419275373220444, 0.04925774782896042, 0.0543227419257164, 0.05938773602247238, 0.06445273011922836, 0.06951772421598434, 0.07458271086215973, 0.07964770495891571, 0.08471269905567169, 0.08977769315242767, 0.09484268724918365, 0.09990768134593964, 0.10497267544269562, 0.1100376695394516, 0.11510266363620758, 0.12016765773296356, 0.12523265182971954, 0.13029763102531433, 0.1353626251220703, 0.1404276192188263, 0.14549261331558228, 0.15055760741233826, 0.15562260150909424, 0.16068759560585022, 0.1657525897026062, 0.17081758379936218, 0.17588257789611816]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 6.0, 7.0, 11.0, 12.0, 24.0, 22.0, 41.0, 52.0, 68.0, 82.0, 129.0, 228.0, 395.0, 704.0, 1423.0, 3023.0, 6623.0, 16036.0, 40259.0, 105128.0, 260436.0, 334109.0, 170449.0, 64996.0, 25245.0, 10189.0, 4461.0, 2022.0, 980.0, 504.0, 315.0, 180.0, 109.0, 80.0, 69.0, 34.0, 22.0, 19.0, 11.0, 19.0, 9.0, 6.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07879638671875, -0.07627487182617188, -0.07375335693359375, -0.07123184204101562, -0.0687103271484375, -0.06618881225585938, -0.06366729736328125, -0.061145782470703125, -0.058624267578125, -0.056102752685546875, -0.05358123779296875, -0.051059722900390625, -0.0485382080078125, -0.046016693115234375, -0.04349517822265625, -0.040973663330078125, -0.0384521484375, -0.035930633544921875, -0.03340911865234375, -0.030887603759765625, -0.0283660888671875, -0.025844573974609375, -0.02332305908203125, -0.020801544189453125, -0.018280029296875, -0.015758514404296875, -0.01323699951171875, -0.010715484619140625, -0.0081939697265625, -0.005672454833984375, -0.00315093994140625, -0.000629425048828125, 0.00189208984375, 0.004413604736328125, 0.00693511962890625, 0.009456634521484375, 0.0119781494140625, 0.014499664306640625, 0.01702117919921875, 0.019542694091796875, 0.022064208984375, 0.024585723876953125, 0.02710723876953125, 0.029628753662109375, 0.0321502685546875, 0.034671783447265625, 0.03719329833984375, 0.039714813232421875, 0.042236328125, 0.044757843017578125, 0.04727935791015625, 0.049800872802734375, 0.0523223876953125, 0.054843902587890625, 0.05736541748046875, 0.059886932373046875, 0.062408447265625, 0.06492996215820312, 0.06745147705078125, 0.06997299194335938, 0.0724945068359375, 0.07501602172851562, 0.07753753662109375, 0.08005905151367188, 0.08258056640625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 6.0, 7.0, 10.0, 15.0, 23.0, 19.0, 24.0, 28.0, 32.0, 34.0, 42.0, 42.0, 28.0, 47.0, 60.0, 58.0, 48.0, 46.0, 53.0, 45.0, 46.0, 37.0, 46.0, 31.0, 31.0, 19.0, 16.0, 25.0, 11.0, 15.0, 7.0, 10.0, 9.0, 10.0, 9.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0299224853515625, -0.02894425392150879, -0.027966022491455078, -0.026987791061401367, -0.026009559631347656, -0.025031328201293945, -0.024053096771240234, -0.023074865341186523, -0.022096633911132812, -0.0211184024810791, -0.02014017105102539, -0.01916193962097168, -0.01818370819091797, -0.017205476760864258, -0.016227245330810547, -0.015249013900756836, -0.014270782470703125, -0.013292551040649414, -0.012314319610595703, -0.011336088180541992, -0.010357856750488281, -0.00937962532043457, -0.00840139389038086, -0.0074231624603271484, -0.0064449310302734375, -0.0054666996002197266, -0.004488468170166016, -0.0035102367401123047, -0.0025320053100585938, -0.0015537738800048828, -0.0005755424499511719, 0.00040268898010253906, 0.00138092041015625, 0.002359151840209961, 0.003337383270263672, 0.004315614700317383, 0.005293846130371094, 0.006272077560424805, 0.007250308990478516, 0.008228540420532227, 0.009206771850585938, 0.010185003280639648, 0.01116323471069336, 0.01214146614074707, 0.013119697570800781, 0.014097929000854492, 0.015076160430908203, 0.016054391860961914, 0.017032623291015625, 0.018010854721069336, 0.018989086151123047, 0.019967317581176758, 0.02094554901123047, 0.02192378044128418, 0.02290201187133789, 0.0238802433013916, 0.024858474731445312, 0.025836706161499023, 0.026814937591552734, 0.027793169021606445, 0.028771400451660156, 0.029749631881713867, 0.030727863311767578, 0.03170609474182129, 0.032684326171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 7.0, 8.0, 9.0, 11.0, 14.0, 19.0, 24.0, 39.0, 53.0, 78.0, 135.0, 257.0, 617.0, 1749.0, 5154.0, 15737.0, 46790.0, 128381.0, 292782.0, 319264.0, 152119.0, 55943.0, 19425.0, 6320.0, 2030.0, 793.0, 320.0, 151.0, 77.0, 67.0, 33.0, 23.0, 22.0, 19.0, 18.0, 17.0, 8.0, 8.0, 8.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08404541015625, -0.0812520980834961, -0.07845878601074219, -0.07566547393798828, -0.07287216186523438, -0.07007884979248047, -0.06728553771972656, -0.06449222564697266, -0.06169891357421875, -0.058905601501464844, -0.05611228942871094, -0.05331897735595703, -0.050525665283203125, -0.04773235321044922, -0.04493904113769531, -0.042145729064941406, -0.0393524169921875, -0.036559104919433594, -0.03376579284667969, -0.03097248077392578, -0.028179168701171875, -0.02538585662841797, -0.022592544555664062, -0.019799232482910156, -0.01700592041015625, -0.014212608337402344, -0.011419296264648438, -0.008625984191894531, -0.005832672119140625, -0.0030393600463867188, -0.0002460479736328125, 0.0025472640991210938, 0.005340576171875, 0.008133888244628906, 0.010927200317382812, 0.013720512390136719, 0.016513824462890625, 0.01930713653564453, 0.022100448608398438, 0.024893760681152344, 0.02768707275390625, 0.030480384826660156, 0.03327369689941406, 0.03606700897216797, 0.038860321044921875, 0.04165363311767578, 0.04444694519042969, 0.047240257263183594, 0.0500335693359375, 0.052826881408691406, 0.05562019348144531, 0.05841350555419922, 0.061206817626953125, 0.06400012969970703, 0.06679344177246094, 0.06958675384521484, 0.07238006591796875, 0.07517337799072266, 0.07796669006347656, 0.08076000213623047, 0.08355331420898438, 0.08634662628173828, 0.08913993835449219, 0.0919332504272461, 0.0947265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 9.0, 7.0, 9.0, 8.0, 11.0, 17.0, 11.0, 17.0, 20.0, 17.0, 32.0, 28.0, 26.0, 37.0, 36.0, 36.0, 45.0, 42.0, 42.0, 37.0, 38.0, 47.0, 46.0, 42.0, 45.0, 38.0, 39.0, 30.0, 26.0, 32.0, 18.0, 25.0, 17.0, 11.0, 11.0, 14.0, 9.0, 7.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.090087890625, -0.08753395080566406, -0.08498001098632812, -0.08242607116699219, -0.07987213134765625, -0.07731819152832031, -0.07476425170898438, -0.07221031188964844, -0.0696563720703125, -0.06710243225097656, -0.06454849243164062, -0.06199455261230469, -0.05944061279296875, -0.05688667297363281, -0.054332733154296875, -0.05177879333496094, -0.049224853515625, -0.04667091369628906, -0.044116973876953125, -0.04156303405761719, -0.03900909423828125, -0.03645515441894531, -0.033901214599609375, -0.03134727478027344, -0.0287933349609375, -0.026239395141601562, -0.023685455322265625, -0.021131515502929688, -0.01857757568359375, -0.016023635864257812, -0.013469696044921875, -0.010915756225585938, -0.00836181640625, -0.0058078765869140625, -0.003253936767578125, -0.0006999969482421875, 0.00185394287109375, 0.0044078826904296875, 0.006961822509765625, 0.009515762329101562, 0.0120697021484375, 0.014623641967773438, 0.017177581787109375, 0.019731521606445312, 0.02228546142578125, 0.024839401245117188, 0.027393341064453125, 0.029947280883789062, 0.032501220703125, 0.03505516052246094, 0.037609100341796875, 0.04016304016113281, 0.04271697998046875, 0.04527091979980469, 0.047824859619140625, 0.05037879943847656, 0.0529327392578125, 0.05548667907714844, 0.058040618896484375, 0.06059455871582031, 0.06314849853515625, 0.06570243835449219, 0.06825637817382812, 0.07081031799316406, 0.0733642578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 15.0, 28.0, 54.0, 57.0, 82.0, 94.0, 165.0, 242.0, 365.0, 468.0, 760.0, 1231.0, 1941.0, 3180.0, 5172.0, 8726.0, 15180.0, 26385.0, 45840.0, 77841.0, 123483.0, 168467.0, 179385.0, 146387.0, 99410.0, 60171.0, 34827.0, 19873.0, 11395.0, 6510.0, 3941.0, 2506.0, 1468.0, 986.0, 615.0, 444.0, 309.0, 175.0, 121.0, 75.0, 58.0, 33.0, 22.0, 15.0, 16.0, 8.0, 8.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.020111083984375, -0.019487380981445312, -0.018863677978515625, -0.018239974975585938, -0.01761627197265625, -0.016992568969726562, -0.016368865966796875, -0.015745162963867188, -0.0151214599609375, -0.014497756958007812, -0.013874053955078125, -0.013250350952148438, -0.01262664794921875, -0.012002944946289062, -0.011379241943359375, -0.010755538940429688, -0.0101318359375, -0.009508132934570312, -0.008884429931640625, -0.008260726928710938, -0.00763702392578125, -0.0070133209228515625, -0.006389617919921875, -0.0057659149169921875, -0.0051422119140625, -0.0045185089111328125, -0.003894805908203125, -0.0032711029052734375, -0.00264739990234375, -0.0020236968994140625, -0.001399993896484375, -0.0007762908935546875, -0.000152587890625, 0.0004711151123046875, 0.001094818115234375, 0.0017185211181640625, 0.00234222412109375, 0.0029659271240234375, 0.003589630126953125, 0.0042133331298828125, 0.0048370361328125, 0.0054607391357421875, 0.006084442138671875, 0.0067081451416015625, 0.00733184814453125, 0.007955551147460938, 0.008579254150390625, 0.009202957153320312, 0.00982666015625, 0.010450363159179688, 0.011074066162109375, 0.011697769165039062, 0.01232147216796875, 0.012945175170898438, 0.013568878173828125, 0.014192581176757812, 0.0148162841796875, 0.015439987182617188, 0.016063690185546875, 0.016687393188476562, 0.01731109619140625, 0.017934799194335938, 0.018558502197265625, 0.019182205200195312, 0.019805908203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 2.0, 4.0, 9.0, 5.0, 12.0, 13.0, 15.0, 20.0, 24.0, 35.0, 25.0, 38.0, 39.0, 51.0, 54.0, 73.0, 83.0, 71.0, 66.0, 59.0, 65.0, 42.0, 27.0, 30.0, 32.0, 16.0, 14.0, 14.0, 14.0, 19.0, 6.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5795230865478516e-05, -1.5161000192165375e-05, -1.4526769518852234e-05, -1.3892538845539093e-05, -1.3258308172225952e-05, -1.2624077498912811e-05, -1.198984682559967e-05, -1.135561615228653e-05, -1.0721385478973389e-05, -1.0087154805660248e-05, -9.452924132347107e-06, -8.818693459033966e-06, -8.184462785720825e-06, -7.550232112407684e-06, -6.9160014390945435e-06, -6.281770765781403e-06, -5.647540092468262e-06, -5.013309419155121e-06, -4.37907874584198e-06, -3.744848072528839e-06, -3.1106173992156982e-06, -2.4763867259025574e-06, -1.8421560525894165e-06, -1.2079253792762756e-06, -5.736947059631348e-07, 6.05359673500061e-08, 6.94766640663147e-07, 1.3289973139762878e-06, 1.9632279872894287e-06, 2.5974586606025696e-06, 3.2316893339157104e-06, 3.865920007228851e-06, 4.500150680541992e-06, 5.134381353855133e-06, 5.768612027168274e-06, 6.402842700481415e-06, 7.037073373794556e-06, 7.671304047107697e-06, 8.305534720420837e-06, 8.939765393733978e-06, 9.573996067047119e-06, 1.020822674036026e-05, 1.0842457413673401e-05, 1.1476688086986542e-05, 1.2110918760299683e-05, 1.2745149433612823e-05, 1.3379380106925964e-05, 1.4013610780239105e-05, 1.4647841453552246e-05, 1.5282072126865387e-05, 1.5916302800178528e-05, 1.655053347349167e-05, 1.718476414680481e-05, 1.781899482011795e-05, 1.845322549343109e-05, 1.9087456166744232e-05, 1.9721686840057373e-05, 2.0355917513370514e-05, 2.0990148186683655e-05, 2.1624378859996796e-05, 2.2258609533309937e-05, 2.2892840206623077e-05, 2.3527070879936218e-05, 2.416130155324936e-05, 2.47955322265625e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 24.0, 27.0, 54.0, 72.0, 103.0, 215.0, 352.0, 683.0, 1375.0, 2888.0, 5930.0, 13083.0, 28832.0, 62676.0, 129098.0, 218101.0, 246140.0, 171289.0, 89379.0, 42221.0, 19260.0, 8586.0, 4006.0, 1978.0, 974.0, 511.0, 262.0, 168.0, 77.0, 53.0, 37.0, 24.0, 18.0, 10.0, 4.0, 3.0, 3.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0267333984375, -0.025952577590942383, -0.025171756744384766, -0.02439093589782715, -0.02361011505126953, -0.022829294204711914, -0.022048473358154297, -0.02126765251159668, -0.020486831665039062, -0.019706010818481445, -0.018925189971923828, -0.01814436912536621, -0.017363548278808594, -0.016582727432250977, -0.01580190658569336, -0.015021085739135742, -0.014240264892578125, -0.013459444046020508, -0.01267862319946289, -0.011897802352905273, -0.011116981506347656, -0.010336160659790039, -0.009555339813232422, -0.008774518966674805, -0.007993698120117188, -0.00721287727355957, -0.006432056427001953, -0.005651235580444336, -0.004870414733886719, -0.0040895938873291016, -0.0033087730407714844, -0.002527952194213867, -0.00174713134765625, -0.0009663105010986328, -0.00018548965454101562, 0.0005953311920166016, 0.0013761520385742188, 0.002156972885131836, 0.002937793731689453, 0.0037186145782470703, 0.0044994354248046875, 0.005280256271362305, 0.006061077117919922, 0.006841897964477539, 0.007622718811035156, 0.008403539657592773, 0.00918436050415039, 0.009965181350708008, 0.010746002197265625, 0.011526823043823242, 0.01230764389038086, 0.013088464736938477, 0.013869285583496094, 0.014650106430053711, 0.015430927276611328, 0.016211748123168945, 0.016992568969726562, 0.01777338981628418, 0.018554210662841797, 0.019335031509399414, 0.02011585235595703, 0.02089667320251465, 0.021677494049072266, 0.022458314895629883, 0.0232391357421875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 10.0, 7.0, 10.0, 14.0, 13.0, 16.0, 21.0, 27.0, 34.0, 34.0, 30.0, 44.0, 47.0, 46.0, 57.0, 48.0, 50.0, 57.0, 49.0, 57.0, 36.0, 49.0, 40.0, 34.0, 25.0, 30.0, 27.0, 25.0, 11.0, 11.0, 6.0, 4.0, 5.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0201416015625, -0.019455671310424805, -0.01876974105834961, -0.018083810806274414, -0.01739788055419922, -0.016711950302124023, -0.016026020050048828, -0.015340089797973633, -0.014654159545898438, -0.013968229293823242, -0.013282299041748047, -0.012596368789672852, -0.011910438537597656, -0.011224508285522461, -0.010538578033447266, -0.00985264778137207, -0.009166717529296875, -0.00848078727722168, -0.007794857025146484, -0.007108926773071289, -0.006422996520996094, -0.0057370662689208984, -0.005051136016845703, -0.004365205764770508, -0.0036792755126953125, -0.002993345260620117, -0.002307415008544922, -0.0016214847564697266, -0.0009355545043945312, -0.00024962425231933594, 0.0004363059997558594, 0.0011222362518310547, 0.00180816650390625, 0.0024940967559814453, 0.0031800270080566406, 0.003865957260131836, 0.004551887512207031, 0.0052378177642822266, 0.005923748016357422, 0.006609678268432617, 0.0072956085205078125, 0.007981538772583008, 0.008667469024658203, 0.009353399276733398, 0.010039329528808594, 0.010725259780883789, 0.011411190032958984, 0.01209712028503418, 0.012783050537109375, 0.01346898078918457, 0.014154911041259766, 0.014840841293334961, 0.015526771545410156, 0.01621270179748535, 0.016898632049560547, 0.017584562301635742, 0.018270492553710938, 0.018956422805786133, 0.019642353057861328, 0.020328283309936523, 0.02101421356201172, 0.021700143814086914, 0.02238607406616211, 0.023072004318237305, 0.0237579345703125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 10.0, 17.0, 30.0, 31.0, 56.0, 80.0, 101.0, 109.0, 102.0, 120.0, 100.0, 62.0, 60.0, 52.0, 27.0, 21.0, 8.0, 8.0, 6.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4090379476547241, -0.3979947566986084, -0.3869515657424927, -0.37590837478637695, -0.36486518383026123, -0.3538219928741455, -0.3427788019180298, -0.33173561096191406, -0.32069242000579834, -0.3096492290496826, -0.2986060380935669, -0.28756284713745117, -0.27651965618133545, -0.2654764652252197, -0.254433274269104, -0.2433900684118271, -0.23234686255455017, -0.22130367159843445, -0.21026048064231873, -0.199217289686203, -0.18817409873008728, -0.17713090777397156, -0.16608770191669464, -0.15504451096057892, -0.1440013200044632, -0.13295812904834747, -0.12191493809223175, -0.11087173968553543, -0.09982854872941971, -0.08878535777330399, -0.07774215936660767, -0.06669896841049194, -0.05565577745437622, -0.0446125864982605, -0.03356939181685448, -0.022526197135448456, -0.011483006179332733, -0.0004398152232170105, 0.010603383183479309, 0.021646574139595032, 0.032689765095710754, 0.04373295605182648, 0.0547761507332325, 0.06581934541463852, 0.07686253637075424, 0.08790572732686996, 0.09894892573356628, 0.109992116689682, 0.12103530764579773, 0.13207849860191345, 0.14312168955802917, 0.1541648805141449, 0.16520807147026062, 0.17625126242637634, 0.18729446828365326, 0.19833765923976898, 0.2093808501958847, 0.22042404115200043, 0.23146723210811615, 0.24251043796539307, 0.2535536289215088, 0.2645968198776245, 0.27564001083374023, 0.28668320178985596, 0.2977263927459717]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 8.0, 2.0, 4.0, 11.0, 6.0, 12.0, 17.0, 11.0, 16.0, 20.0, 29.0, 25.0, 23.0, 27.0, 28.0, 29.0, 46.0, 34.0, 36.0, 44.0, 38.0, 43.0, 31.0, 35.0, 40.0, 42.0, 22.0, 41.0, 35.0, 35.0, 26.0, 19.0, 26.0, 21.0, 17.0, 22.0, 5.0, 10.0, 15.0, 7.0, 9.0, 11.0, 6.0, 10.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21515154838562012, -0.20781943202018738, -0.20048733055591583, -0.1931552141904831, -0.18582309782505035, -0.1784909963607788, -0.17115887999534607, -0.16382676362991333, -0.1564946472644806, -0.14916253089904785, -0.1418304294347763, -0.13449831306934357, -0.12716619670391083, -0.11983408778905869, -0.11250197887420654, -0.1051698625087738, -0.09783776104450226, -0.09050565212965012, -0.08317353576421738, -0.07584142684936523, -0.0685093104839325, -0.06117720156908035, -0.05384509265422821, -0.04651298001408577, -0.03918086737394333, -0.03184875473380089, -0.024516643956303596, -0.017184533178806305, -0.009852420538663864, -0.0025203078985214233, 0.004811801016330719, 0.01214391365647316, 0.0194760262966156, 0.02680813893675804, 0.03414025157690048, 0.041472360491752625, 0.048804473131895065, 0.056136585772037506, 0.06346869468688965, 0.07080081105232239, 0.07813291996717453, 0.08546502888202667, 0.09279714524745941, 0.10012925416231155, 0.1074613630771637, 0.11479347944259644, 0.12212558835744858, 0.12945769727230072, 0.13678981363773346, 0.1441219300031662, 0.15145403146743774, 0.15878614783287048, 0.16611826419830322, 0.17345038056373596, 0.1807824820280075, 0.18811459839344025, 0.1954466998577118, 0.20277881622314453, 0.21011091768741608, 0.21744303405284882, 0.22477515041828156, 0.2321072518825531, 0.23943936824798584, 0.24677148461341858, 0.2541036009788513]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 9.0, 10.0, 4.0, 5.0, 10.0, 15.0, 15.0, 33.0, 51.0, 53.0, 68.0, 137.0, 210.0, 393.0, 695.0, 1469.0, 3268.0, 8211.0, 25182.0, 106060.0, 685932.0, 2305118.0, 877819.0, 132674.0, 29845.0, 9591.0, 3701.0, 1679.0, 803.0, 424.0, 278.0, 154.0, 92.0, 54.0, 48.0, 40.0, 27.0, 25.0, 24.0, 17.0, 15.0, 7.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04876708984375, -0.046998023986816406, -0.04522895812988281, -0.04345989227294922, -0.041690826416015625, -0.03992176055908203, -0.03815269470214844, -0.036383628845214844, -0.03461456298828125, -0.032845497131347656, -0.031076431274414062, -0.02930736541748047, -0.027538299560546875, -0.02576923370361328, -0.024000167846679688, -0.022231101989746094, -0.0204620361328125, -0.018692970275878906, -0.016923904418945312, -0.015154838562011719, -0.013385772705078125, -0.011616706848144531, -0.009847640991210938, -0.008078575134277344, -0.00630950927734375, -0.004540443420410156, -0.0027713775634765625, -0.0010023117065429688, 0.000766754150390625, 0.0025358200073242188, 0.0043048858642578125, 0.006073951721191406, 0.007843017578125, 0.009612083435058594, 0.011381149291992188, 0.013150215148925781, 0.014919281005859375, 0.01668834686279297, 0.018457412719726562, 0.020226478576660156, 0.02199554443359375, 0.023764610290527344, 0.025533676147460938, 0.02730274200439453, 0.029071807861328125, 0.03084087371826172, 0.03260993957519531, 0.034379005432128906, 0.0361480712890625, 0.037917137145996094, 0.03968620300292969, 0.04145526885986328, 0.043224334716796875, 0.04499340057373047, 0.04676246643066406, 0.048531532287597656, 0.05030059814453125, 0.052069664001464844, 0.05383872985839844, 0.05560779571533203, 0.057376861572265625, 0.05914592742919922, 0.06091499328613281, 0.0626840591430664, 0.064453125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 8.0, 10.0, 5.0, 5.0, 18.0, 21.0, 26.0, 26.0, 22.0, 38.0, 34.0, 45.0, 35.0, 55.0, 57.0, 40.0, 49.0, 38.0, 59.0, 65.0, 56.0, 41.0, 34.0, 34.0, 31.0, 23.0, 23.0, 24.0, 18.0, 12.0, 6.0, 7.0, 13.0, 6.0, 9.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.039093017578125, -0.038010358810424805, -0.03692770004272461, -0.035845041275024414, -0.03476238250732422, -0.03367972373962402, -0.03259706497192383, -0.03151440620422363, -0.030431747436523438, -0.029349088668823242, -0.028266429901123047, -0.02718377113342285, -0.026101112365722656, -0.02501845359802246, -0.023935794830322266, -0.02285313606262207, -0.021770477294921875, -0.02068781852722168, -0.019605159759521484, -0.01852250099182129, -0.017439842224121094, -0.0163571834564209, -0.015274524688720703, -0.014191865921020508, -0.013109207153320312, -0.012026548385620117, -0.010943889617919922, -0.009861230850219727, -0.008778572082519531, -0.007695913314819336, -0.006613254547119141, -0.005530595779418945, -0.00444793701171875, -0.0033652782440185547, -0.0022826194763183594, -0.001199960708618164, -0.00011730194091796875, 0.0009653568267822266, 0.002048015594482422, 0.003130674362182617, 0.0042133331298828125, 0.005295991897583008, 0.006378650665283203, 0.0074613094329833984, 0.008543968200683594, 0.009626626968383789, 0.010709285736083984, 0.01179194450378418, 0.012874603271484375, 0.01395726203918457, 0.015039920806884766, 0.01612257957458496, 0.017205238342285156, 0.01828789710998535, 0.019370555877685547, 0.020453214645385742, 0.021535873413085938, 0.022618532180786133, 0.023701190948486328, 0.024783849716186523, 0.02586650848388672, 0.026949167251586914, 0.02803182601928711, 0.029114484786987305, 0.0301971435546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 9.0, 13.0, 10.0, 27.0, 49.0, 64.0, 143.0, 224.0, 766.0, 3040.0, 27156.0, 591889.0, 3257651.0, 293748.0, 16181.0, 2134.0, 631.0, 228.0, 130.0, 77.0, 40.0, 29.0, 16.0, 14.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10247802734375, -0.09859561920166016, -0.09471321105957031, -0.09083080291748047, -0.08694839477539062, -0.08306598663330078, -0.07918357849121094, -0.0753011703491211, -0.07141876220703125, -0.0675363540649414, -0.06365394592285156, -0.05977153778076172, -0.055889129638671875, -0.05200672149658203, -0.04812431335449219, -0.044241905212402344, -0.0403594970703125, -0.036477088928222656, -0.03259468078613281, -0.02871227264404297, -0.024829864501953125, -0.02094745635986328, -0.017065048217773438, -0.013182640075683594, -0.00930023193359375, -0.005417823791503906, -0.0015354156494140625, 0.0023469924926757812, 0.006229400634765625, 0.010111808776855469, 0.013994216918945312, 0.017876625061035156, 0.021759033203125, 0.025641441345214844, 0.029523849487304688, 0.03340625762939453, 0.037288665771484375, 0.04117107391357422, 0.04505348205566406, 0.048935890197753906, 0.05281829833984375, 0.056700706481933594, 0.06058311462402344, 0.06446552276611328, 0.06834793090820312, 0.07223033905029297, 0.07611274719238281, 0.07999515533447266, 0.0838775634765625, 0.08775997161865234, 0.09164237976074219, 0.09552478790283203, 0.09940719604492188, 0.10328960418701172, 0.10717201232910156, 0.1110544204711914, 0.11493682861328125, 0.1188192367553711, 0.12270164489746094, 0.12658405303955078, 0.13046646118164062, 0.13434886932373047, 0.1382312774658203, 0.14211368560791016, 0.14599609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 6.0, 7.0, 15.0, 25.0, 23.0, 41.0, 62.0, 101.0, 127.0, 176.0, 223.0, 314.0, 397.0, 425.0, 466.0, 404.0, 351.0, 278.0, 193.0, 142.0, 80.0, 54.0, 50.0, 27.0, 25.0, 15.0, 11.0, 12.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.056549072265625, -0.0549015998840332, -0.053254127502441406, -0.05160665512084961, -0.04995918273925781, -0.048311710357666016, -0.04666423797607422, -0.04501676559448242, -0.043369293212890625, -0.04172182083129883, -0.04007434844970703, -0.038426876068115234, -0.03677940368652344, -0.03513193130493164, -0.033484458923339844, -0.03183698654174805, -0.03018951416015625, -0.028542041778564453, -0.026894569396972656, -0.02524709701538086, -0.023599624633789062, -0.021952152252197266, -0.02030467987060547, -0.018657207489013672, -0.017009735107421875, -0.015362262725830078, -0.013714790344238281, -0.012067317962646484, -0.010419845581054688, -0.00877237319946289, -0.007124900817871094, -0.005477428436279297, -0.0038299560546875, -0.002182483673095703, -0.0005350112915039062, 0.0011124610900878906, 0.0027599334716796875, 0.004407405853271484, 0.006054878234863281, 0.007702350616455078, 0.009349822998046875, 0.010997295379638672, 0.012644767761230469, 0.014292240142822266, 0.015939712524414062, 0.01758718490600586, 0.019234657287597656, 0.020882129669189453, 0.02252960205078125, 0.024177074432373047, 0.025824546813964844, 0.02747201919555664, 0.029119491577148438, 0.030766963958740234, 0.03241443634033203, 0.03406190872192383, 0.035709381103515625, 0.03735685348510742, 0.03900432586669922, 0.040651798248291016, 0.04229927062988281, 0.04394674301147461, 0.045594215393066406, 0.0472416877746582, 0.04888916015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 5.0, 8.0, 8.0, 19.0, 28.0, 59.0, 84.0, 128.0, 184.0, 173.0, 131.0, 91.0, 57.0, 22.0, 11.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17561709880828857, -0.16230110824108124, -0.1489851176738739, -0.13566912710666656, -0.12235313653945923, -0.10903714597225189, -0.09572115540504456, -0.08240516483783722, -0.06908917427062988, -0.055773183703422546, -0.04245719313621521, -0.029141202569007874, -0.015825212001800537, -0.0025092214345932007, 0.010806769132614136, 0.024122759699821472, 0.03743875026702881, 0.050754740834236145, 0.06407073140144348, 0.07738672196865082, 0.09070271253585815, 0.10401870310306549, 0.11733469367027283, 0.13065068423748016, 0.1439666748046875, 0.15728266537189484, 0.17059865593910217, 0.1839146465063095, 0.19723063707351685, 0.21054662764072418, 0.22386261820793152, 0.23717860877513885, 0.2504945993423462, 0.26381057500839233, 0.27712658047676086, 0.2904425859451294, 0.30375856161117554, 0.3170745372772217, 0.3303905427455902, 0.34370654821395874, 0.3570225238800049, 0.370338499546051, 0.38365450501441956, 0.3969705104827881, 0.41028648614883423, 0.42360246181488037, 0.4369184672832489, 0.45023447275161743, 0.4635504484176636, 0.4768664240837097, 0.49018242955207825, 0.5034984350204468, 0.5168144106864929, 0.5301303863525391, 0.54344642162323, 0.5567623972892761, 0.5700783729553223, 0.5833943486213684, 0.5967103242874146, 0.6100263595581055, 0.6233423352241516, 0.6366583108901978, 0.6499743461608887, 0.6632903218269348, 0.676606297492981]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 8.0, 3.0, 5.0, 3.0, 8.0, 8.0, 9.0, 9.0, 21.0, 13.0, 12.0, 21.0, 18.0, 13.0, 21.0, 27.0, 27.0, 44.0, 23.0, 32.0, 38.0, 30.0, 21.0, 37.0, 41.0, 37.0, 35.0, 30.0, 28.0, 42.0, 44.0, 37.0, 22.0, 30.0, 29.0, 22.0, 28.0, 16.0, 20.0, 13.0, 13.0, 10.0, 12.0, 12.0, 8.0, 6.0, 9.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.15889489650726318, -0.15409672260284424, -0.1492985635995865, -0.14450040459632874, -0.1397022306919098, -0.13490405678749084, -0.1301058977842331, -0.12530773878097534, -0.1205095648765564, -0.11571139842271805, -0.1109132319688797, -0.10611506551504135, -0.101316899061203, -0.09651873260736465, -0.0917205661535263, -0.08692239969968796, -0.08212423324584961, -0.07732606679201126, -0.07252790033817291, -0.06772973388433456, -0.06293156743049622, -0.05813340097665787, -0.05333523452281952, -0.04853706806898117, -0.04373890161514282, -0.038940735161304474, -0.034142568707466125, -0.029344402253627777, -0.02454623579978943, -0.01974806934595108, -0.014949902892112732, -0.010151736438274384, -0.005353569984436035, -0.0005554035305976868, 0.004242762923240662, 0.00904092937707901, 0.013839095830917358, 0.018637262284755707, 0.023435428738594055, 0.028233595192432404, 0.03303176164627075, 0.0378299281001091, 0.04262809455394745, 0.0474262610077858, 0.052224427461624146, 0.057022593915462494, 0.06182076036930084, 0.06661892682313919, 0.07141709327697754, 0.07621525973081589, 0.08101342618465424, 0.08581159263849258, 0.09060975909233093, 0.09540792554616928, 0.10020609200000763, 0.10500425845384598, 0.10980242490768433, 0.11460059136152267, 0.11939875781536102, 0.12419692426919937, 0.12899509072303772, 0.13379326462745667, 0.13859142363071442, 0.14338958263397217, 0.1481877565383911]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 5.0, 2.0, 9.0, 5.0, 9.0, 19.0, 24.0, 31.0, 49.0, 65.0, 110.0, 169.0, 291.0, 507.0, 939.0, 1887.0, 3841.0, 8241.0, 19076.0, 46606.0, 120248.0, 268463.0, 310230.0, 159461.0, 62402.0, 25175.0, 10892.0, 4820.0, 2332.0, 1110.0, 596.0, 340.0, 194.0, 125.0, 86.0, 47.0, 47.0, 28.0, 23.0, 15.0, 9.0, 8.0, 9.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1103515625, -0.10613250732421875, -0.1019134521484375, -0.09769439697265625, -0.093475341796875, -0.08925628662109375, -0.0850372314453125, -0.08081817626953125, -0.07659912109375, -0.07238006591796875, -0.0681610107421875, -0.06394195556640625, -0.059722900390625, -0.05550384521484375, -0.0512847900390625, -0.04706573486328125, -0.0428466796875, -0.03862762451171875, -0.0344085693359375, -0.03018951416015625, -0.025970458984375, -0.02175140380859375, -0.0175323486328125, -0.01331329345703125, -0.00909423828125, -0.00487518310546875, -0.0006561279296875, 0.00356292724609375, 0.007781982421875, 0.01200103759765625, 0.0162200927734375, 0.02043914794921875, 0.024658203125, 0.02887725830078125, 0.0330963134765625, 0.03731536865234375, 0.041534423828125, 0.04575347900390625, 0.0499725341796875, 0.05419158935546875, 0.05841064453125, 0.06262969970703125, 0.0668487548828125, 0.07106781005859375, 0.075286865234375, 0.07950592041015625, 0.0837249755859375, 0.08794403076171875, 0.0921630859375, 0.09638214111328125, 0.1006011962890625, 0.10482025146484375, 0.109039306640625, 0.11325836181640625, 0.1174774169921875, 0.12169647216796875, 0.12591552734375, 0.13013458251953125, 0.1343536376953125, 0.13857269287109375, 0.142791748046875, 0.14701080322265625, 0.1512298583984375, 0.15544891357421875, 0.15966796875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 3.0, 2.0, 8.0, 12.0, 16.0, 18.0, 18.0, 27.0, 30.0, 32.0, 28.0, 38.0, 44.0, 45.0, 48.0, 50.0, 63.0, 43.0, 53.0, 56.0, 65.0, 40.0, 42.0, 32.0, 31.0, 28.0, 29.0, 14.0, 16.0, 15.0, 10.0, 6.0, 12.0, 10.0, 5.0, 4.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03411865234375, -0.03310227394104004, -0.03208589553833008, -0.031069517135620117, -0.030053138732910156, -0.029036760330200195, -0.028020381927490234, -0.027004003524780273, -0.025987625122070312, -0.02497124671936035, -0.02395486831665039, -0.02293848991394043, -0.02192211151123047, -0.020905733108520508, -0.019889354705810547, -0.018872976303100586, -0.017856597900390625, -0.016840219497680664, -0.015823841094970703, -0.014807462692260742, -0.013791084289550781, -0.01277470588684082, -0.01175832748413086, -0.010741949081420898, -0.009725570678710938, -0.008709192276000977, -0.007692813873291016, -0.006676435470581055, -0.005660057067871094, -0.004643678665161133, -0.003627300262451172, -0.002610921859741211, -0.00159454345703125, -0.0005781650543212891, 0.0004382133483886719, 0.0014545917510986328, 0.0024709701538085938, 0.0034873485565185547, 0.004503726959228516, 0.0055201053619384766, 0.0065364837646484375, 0.0075528621673583984, 0.00856924057006836, 0.00958561897277832, 0.010601997375488281, 0.011618375778198242, 0.012634754180908203, 0.013651132583618164, 0.014667510986328125, 0.015683889389038086, 0.016700267791748047, 0.017716646194458008, 0.01873302459716797, 0.01974940299987793, 0.02076578140258789, 0.02178215980529785, 0.022798538208007812, 0.023814916610717773, 0.024831295013427734, 0.025847673416137695, 0.026864051818847656, 0.027880430221557617, 0.028896808624267578, 0.02991318702697754, 0.0309295654296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 6.0, 10.0, 21.0, 26.0, 36.0, 66.0, 80.0, 171.0, 278.0, 479.0, 979.0, 2343.0, 6070.0, 17717.0, 56492.0, 166606.0, 332603.0, 285735.0, 119550.0, 38776.0, 12578.0, 4449.0, 1784.0, 764.0, 372.0, 207.0, 97.0, 83.0, 51.0, 41.0, 33.0, 20.0, 12.0, 5.0, 8.0, 0.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.1671142578125, -0.16302204132080078, -0.15892982482910156, -0.15483760833740234, -0.15074539184570312, -0.1466531753540039, -0.1425609588623047, -0.13846874237060547, -0.13437652587890625, -0.13028430938720703, -0.1261920928955078, -0.1220998764038086, -0.11800765991210938, -0.11391544342041016, -0.10982322692871094, -0.10573101043701172, -0.1016387939453125, -0.09754657745361328, -0.09345436096191406, -0.08936214447021484, -0.08526992797851562, -0.0811777114868164, -0.07708549499511719, -0.07299327850341797, -0.06890106201171875, -0.06480884552001953, -0.06071662902832031, -0.056624412536621094, -0.052532196044921875, -0.048439979553222656, -0.04434776306152344, -0.04025554656982422, -0.036163330078125, -0.03207111358642578, -0.027978897094726562, -0.023886680603027344, -0.019794464111328125, -0.015702247619628906, -0.011610031127929688, -0.007517814636230469, -0.00342559814453125, 0.0006666183471679688, 0.0047588348388671875, 0.008851051330566406, 0.012943267822265625, 0.017035484313964844, 0.021127700805664062, 0.02521991729736328, 0.0293121337890625, 0.03340435028076172, 0.03749656677246094, 0.041588783264160156, 0.045680999755859375, 0.049773216247558594, 0.05386543273925781, 0.05795764923095703, 0.06204986572265625, 0.06614208221435547, 0.07023429870605469, 0.0743265151977539, 0.07841873168945312, 0.08251094818115234, 0.08660316467285156, 0.09069538116455078, 0.09478759765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 15.0, 4.0, 5.0, 16.0, 9.0, 15.0, 17.0, 25.0, 30.0, 35.0, 30.0, 47.0, 48.0, 39.0, 55.0, 49.0, 51.0, 48.0, 54.0, 45.0, 53.0, 46.0, 49.0, 44.0, 25.0, 28.0, 19.0, 23.0, 15.0, 11.0, 8.0, 17.0, 7.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1005859375, -0.09747123718261719, -0.09435653686523438, -0.09124183654785156, -0.08812713623046875, -0.08501243591308594, -0.08189773559570312, -0.07878303527832031, -0.0756683349609375, -0.07255363464355469, -0.06943893432617188, -0.06632423400878906, -0.06320953369140625, -0.06009483337402344, -0.056980133056640625, -0.05386543273925781, -0.050750732421875, -0.04763603210449219, -0.044521331787109375, -0.04140663146972656, -0.03829193115234375, -0.03517723083496094, -0.032062530517578125, -0.028947830200195312, -0.0258331298828125, -0.022718429565429688, -0.019603729248046875, -0.016489028930664062, -0.01337432861328125, -0.010259628295898438, -0.007144927978515625, -0.0040302276611328125, -0.00091552734375, 0.0021991729736328125, 0.005313873291015625, 0.008428573608398438, 0.01154327392578125, 0.014657974243164062, 0.017772674560546875, 0.020887374877929688, 0.0240020751953125, 0.027116775512695312, 0.030231475830078125, 0.03334617614746094, 0.03646087646484375, 0.03957557678222656, 0.042690277099609375, 0.04580497741699219, 0.048919677734375, 0.05203437805175781, 0.055149078369140625, 0.05826377868652344, 0.06137847900390625, 0.06449317932128906, 0.06760787963867188, 0.07072257995605469, 0.0738372802734375, 0.07695198059082031, 0.08006668090820312, 0.08318138122558594, 0.08629608154296875, 0.08941078186035156, 0.09252548217773438, 0.09564018249511719, 0.0987548828125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 5.0, 4.0, 5.0, 3.0, 17.0, 18.0, 22.0, 40.0, 70.0, 91.0, 120.0, 225.0, 339.0, 562.0, 868.0, 1495.0, 2458.0, 4200.0, 7252.0, 12461.0, 22877.0, 42947.0, 80073.0, 142297.0, 210437.0, 208964.0, 139401.0, 77819.0, 41489.0, 22455.0, 12368.0, 7017.0, 4006.0, 2399.0, 1394.0, 894.0, 506.0, 334.0, 232.0, 120.0, 92.0, 57.0, 41.0, 35.0, 15.0, 9.0, 13.0, 9.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.032379150390625, -0.031221866607666016, -0.03006458282470703, -0.028907299041748047, -0.027750015258789062, -0.026592731475830078, -0.025435447692871094, -0.02427816390991211, -0.023120880126953125, -0.02196359634399414, -0.020806312561035156, -0.019649028778076172, -0.018491744995117188, -0.017334461212158203, -0.01617717742919922, -0.015019893646240234, -0.01386260986328125, -0.012705326080322266, -0.011548042297363281, -0.010390758514404297, -0.009233474731445312, -0.008076190948486328, -0.006918907165527344, -0.005761623382568359, -0.004604339599609375, -0.0034470558166503906, -0.0022897720336914062, -0.0011324882507324219, 2.47955322265625e-05, 0.0011820793151855469, 0.0023393630981445312, 0.0034966468811035156, 0.0046539306640625, 0.005811214447021484, 0.006968498229980469, 0.008125782012939453, 0.009283065795898438, 0.010440349578857422, 0.011597633361816406, 0.01275491714477539, 0.013912200927734375, 0.01506948471069336, 0.016226768493652344, 0.017384052276611328, 0.018541336059570312, 0.019698619842529297, 0.02085590362548828, 0.022013187408447266, 0.02317047119140625, 0.024327754974365234, 0.02548503875732422, 0.026642322540283203, 0.027799606323242188, 0.028956890106201172, 0.030114173889160156, 0.03127145767211914, 0.032428741455078125, 0.03358602523803711, 0.034743309020996094, 0.03590059280395508, 0.03705787658691406, 0.03821516036987305, 0.03937244415283203, 0.040529727935791016, 0.04168701171875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 2.0, 4.0, 7.0, 11.0, 10.0, 7.0, 20.0, 24.0, 25.0, 21.0, 46.0, 41.0, 44.0, 44.0, 43.0, 53.0, 62.0, 55.0, 58.0, 57.0, 45.0, 51.0, 53.0, 32.0, 32.0, 37.0, 22.0, 25.0, 21.0, 11.0, 3.0, 6.0, 8.0, 9.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.390146255493164e-05, -2.3244880139827728e-05, -2.2588297724723816e-05, -2.1931715309619904e-05, -2.127513289451599e-05, -2.061855047941208e-05, -1.9961968064308167e-05, -1.9305385649204254e-05, -1.8648803234100342e-05, -1.799222081899643e-05, -1.7335638403892517e-05, -1.6679055988788605e-05, -1.6022473573684692e-05, -1.536589115858078e-05, -1.4709308743476868e-05, -1.4052726328372955e-05, -1.3396143913269043e-05, -1.273956149816513e-05, -1.2082979083061218e-05, -1.1426396667957306e-05, -1.0769814252853394e-05, -1.0113231837749481e-05, -9.456649422645569e-06, -8.800067007541656e-06, -8.143484592437744e-06, -7.486902177333832e-06, -6.8303197622299194e-06, -6.173737347126007e-06, -5.517154932022095e-06, -4.860572516918182e-06, -4.20399010181427e-06, -3.5474076867103577e-06, -2.8908252716064453e-06, -2.234242856502533e-06, -1.5776604413986206e-06, -9.210780262947083e-07, -2.644956111907959e-07, 3.9208680391311646e-07, 1.0486692190170288e-06, 1.7052516341209412e-06, 2.3618340492248535e-06, 3.018416464328766e-06, 3.6749988794326782e-06, 4.3315812945365906e-06, 4.988163709640503e-06, 5.644746124744415e-06, 6.301328539848328e-06, 6.95791095495224e-06, 7.614493370056152e-06, 8.271075785160065e-06, 8.927658200263977e-06, 9.58424061536789e-06, 1.0240823030471802e-05, 1.0897405445575714e-05, 1.1553987860679626e-05, 1.2210570275783539e-05, 1.2867152690887451e-05, 1.3523735105991364e-05, 1.4180317521095276e-05, 1.4836899936199188e-05, 1.54934823513031e-05, 1.6150064766407013e-05, 1.6806647181510925e-05, 1.7463229596614838e-05, 1.811981201171875e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 5.0, 6.0, 15.0, 18.0, 21.0, 23.0, 44.0, 73.0, 116.0, 168.0, 289.0, 537.0, 912.0, 1641.0, 3144.0, 6080.0, 12085.0, 25627.0, 56941.0, 128963.0, 253922.0, 275981.0, 153796.0, 68291.0, 30607.0, 14353.0, 7034.0, 3511.0, 1876.0, 1004.0, 591.0, 334.0, 184.0, 123.0, 83.0, 49.0, 27.0, 29.0, 15.0, 12.0, 6.0, 9.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.04736328125, -0.0459747314453125, -0.044586181640625, -0.0431976318359375, -0.04180908203125, -0.0404205322265625, -0.039031982421875, -0.0376434326171875, -0.0362548828125, -0.0348663330078125, -0.033477783203125, -0.0320892333984375, -0.03070068359375, -0.0293121337890625, -0.027923583984375, -0.0265350341796875, -0.025146484375, -0.0237579345703125, -0.022369384765625, -0.0209808349609375, -0.01959228515625, -0.0182037353515625, -0.016815185546875, -0.0154266357421875, -0.0140380859375, -0.0126495361328125, -0.011260986328125, -0.0098724365234375, -0.00848388671875, -0.0070953369140625, -0.005706787109375, -0.0043182373046875, -0.0029296875, -0.0015411376953125, -0.000152587890625, 0.0012359619140625, 0.00262451171875, 0.0040130615234375, 0.005401611328125, 0.0067901611328125, 0.0081787109375, 0.0095672607421875, 0.010955810546875, 0.0123443603515625, 0.01373291015625, 0.0151214599609375, 0.016510009765625, 0.0178985595703125, 0.019287109375, 0.0206756591796875, 0.022064208984375, 0.0234527587890625, 0.02484130859375, 0.0262298583984375, 0.027618408203125, 0.0290069580078125, 0.0303955078125, 0.0317840576171875, 0.033172607421875, 0.0345611572265625, 0.03594970703125, 0.0373382568359375, 0.038726806640625, 0.0401153564453125, 0.04150390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 4.0, 6.0, 5.0, 5.0, 14.0, 12.0, 15.0, 19.0, 32.0, 31.0, 29.0, 42.0, 44.0, 50.0, 59.0, 72.0, 69.0, 85.0, 67.0, 61.0, 52.0, 36.0, 35.0, 22.0, 20.0, 26.0, 16.0, 19.0, 11.0, 8.0, 6.0, 6.0, 6.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035552978515625, -0.03443002700805664, -0.03330707550048828, -0.03218412399291992, -0.031061172485351562, -0.029938220977783203, -0.028815269470214844, -0.027692317962646484, -0.026569366455078125, -0.025446414947509766, -0.024323463439941406, -0.023200511932373047, -0.022077560424804688, -0.020954608917236328, -0.01983165740966797, -0.01870870590209961, -0.01758575439453125, -0.01646280288696289, -0.015339851379394531, -0.014216899871826172, -0.013093948364257812, -0.011970996856689453, -0.010848045349121094, -0.009725093841552734, -0.008602142333984375, -0.007479190826416016, -0.006356239318847656, -0.005233287811279297, -0.0041103363037109375, -0.002987384796142578, -0.0018644332885742188, -0.0007414817810058594, 0.0003814697265625, 0.0015044212341308594, 0.0026273727416992188, 0.003750324249267578, 0.0048732757568359375, 0.005996227264404297, 0.007119178771972656, 0.008242130279541016, 0.009365081787109375, 0.010488033294677734, 0.011610984802246094, 0.012733936309814453, 0.013856887817382812, 0.014979839324951172, 0.01610279083251953, 0.01722574234008789, 0.01834869384765625, 0.01947164535522461, 0.02059459686279297, 0.021717548370361328, 0.022840499877929688, 0.023963451385498047, 0.025086402893066406, 0.026209354400634766, 0.027332305908203125, 0.028455257415771484, 0.029578208923339844, 0.030701160430908203, 0.03182411193847656, 0.03294706344604492, 0.03407001495361328, 0.03519296646118164, 0.03631591796875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 10.0, 16.0, 34.0, 58.0, 76.0, 108.0, 145.0, 150.0, 128.0, 106.0, 86.0, 46.0, 28.0, 11.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4259274899959564, -0.403861939907074, -0.38179636001586914, -0.3597308099269867, -0.33766525983810425, -0.3155997097492218, -0.29353415966033936, -0.2714685797691345, -0.24940302968025208, -0.22733747959136963, -0.205271914601326, -0.18320634961128235, -0.1611407995223999, -0.13907524943351746, -0.11700968444347382, -0.09494411945343018, -0.07287856936454773, -0.050813011825084686, -0.028747454285621643, -0.0066818967461586, 0.015383660793304443, 0.03744921833276749, 0.05951477587223053, 0.08158034086227417, 0.10364589095115662, 0.12571144104003906, 0.1477770060300827, 0.16984257102012634, 0.1919081211090088, 0.21397367119789124, 0.23603923618793488, 0.2581048011779785, 0.2801703214645386, 0.302235871553421, 0.32430142164230347, 0.3463670015335083, 0.36843255162239075, 0.3904981017112732, 0.412563681602478, 0.4346292316913605, 0.4566947817802429, 0.47876033186912537, 0.5008258819580078, 0.5228914618492126, 0.5449570417404175, 0.5670225620269775, 0.5890881419181824, 0.6111537218093872, 0.6332192420959473, 0.6552848219871521, 0.6773503422737122, 0.699415922164917, 0.721481442451477, 0.7435470223426819, 0.7656126022338867, 0.7876781225204468, 0.8097437024116516, 0.8318092823028564, 0.8538748025894165, 0.8759403824806213, 0.8980059623718262, 0.9200714826583862, 0.9421370625495911, 0.9642026424407959, 0.986268162727356]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 7.0, 6.0, 9.0, 11.0, 10.0, 10.0, 13.0, 15.0, 20.0, 18.0, 31.0, 17.0, 34.0, 23.0, 32.0, 22.0, 30.0, 35.0, 52.0, 35.0, 40.0, 41.0, 48.0, 42.0, 41.0, 32.0, 38.0, 27.0, 39.0, 31.0, 32.0, 23.0, 24.0, 22.0, 14.0, 17.0, 15.0, 9.0, 8.0, 8.0, 3.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2940804362297058, -0.284506618976593, -0.2749328017234802, -0.2653590142726898, -0.255785197019577, -0.24621137976646423, -0.23663756251335144, -0.22706376016139984, -0.21748995780944824, -0.20791614055633545, -0.19834233820438385, -0.18876852095127106, -0.17919471859931946, -0.16962090134620667, -0.16004708409309387, -0.15047328174114227, -0.14089946448802948, -0.1313256472349167, -0.12175184488296509, -0.1121780276298523, -0.1026042252779007, -0.0930304080247879, -0.0834565982222557, -0.07388278841972351, -0.06430897861719131, -0.05473516881465912, -0.04516135901212692, -0.03558754548430443, -0.026013735681772232, -0.016439925879240036, -0.0068661123514175415, 0.0027076974511146545, 0.01228150725364685, 0.021855317056179047, 0.03142912685871124, 0.04100294038653374, 0.05057675018906593, 0.06015055999159813, 0.06972437351942062, 0.07929818332195282, 0.08887199312448502, 0.09844580292701721, 0.10801961272954941, 0.1175934225320816, 0.1271672397851944, 0.136741042137146, 0.1463148593902588, 0.15588867664337158, 0.16546247899532318, 0.17503629624843597, 0.18461009860038757, 0.19418391585350037, 0.20375771820545197, 0.21333153545856476, 0.22290533781051636, 0.23247915506362915, 0.24205297231674194, 0.25162678956985474, 0.26120060682296753, 0.27077439427375793, 0.2803482115268707, 0.2899220287799835, 0.2994958460330963, 0.3090696334838867, 0.3186434507369995]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 11.0, 15.0, 31.0, 36.0, 54.0, 95.0, 201.0, 321.0, 577.0, 1145.0, 2594.0, 6256.0, 17891.0, 64532.0, 342740.0, 1864379.0, 1554466.0, 261003.0, 52496.0, 15135.0, 5460.0, 2390.0, 1081.0, 550.0, 343.0, 161.0, 112.0, 72.0, 33.0, 25.0, 13.0, 17.0, 12.0, 10.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047332763671875, -0.04517412185668945, -0.043015480041503906, -0.04085683822631836, -0.03869819641113281, -0.036539554595947266, -0.03438091278076172, -0.03222227096557617, -0.030063629150390625, -0.027904987335205078, -0.02574634552001953, -0.023587703704833984, -0.021429061889648438, -0.01927042007446289, -0.017111778259277344, -0.014953136444091797, -0.01279449462890625, -0.010635852813720703, -0.008477210998535156, -0.006318569183349609, -0.0041599273681640625, -0.0020012855529785156, 0.00015735626220703125, 0.002315998077392578, 0.004474639892578125, 0.006633281707763672, 0.008791923522949219, 0.010950565338134766, 0.013109207153320312, 0.01526784896850586, 0.017426490783691406, 0.019585132598876953, 0.0217437744140625, 0.023902416229248047, 0.026061058044433594, 0.02821969985961914, 0.030378341674804688, 0.032536983489990234, 0.03469562530517578, 0.03685426712036133, 0.039012908935546875, 0.04117155075073242, 0.04333019256591797, 0.045488834381103516, 0.04764747619628906, 0.04980611801147461, 0.051964759826660156, 0.0541234016418457, 0.05628204345703125, 0.0584406852722168, 0.060599327087402344, 0.06275796890258789, 0.06491661071777344, 0.06707525253295898, 0.06923389434814453, 0.07139253616333008, 0.07355117797851562, 0.07570981979370117, 0.07786846160888672, 0.08002710342407227, 0.08218574523925781, 0.08434438705444336, 0.0865030288696289, 0.08866167068481445, 0.0908203125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 7.0, 3.0, 4.0, 3.0, 9.0, 5.0, 19.0, 11.0, 15.0, 23.0, 24.0, 25.0, 28.0, 33.0, 41.0, 47.0, 35.0, 46.0, 39.0, 45.0, 47.0, 58.0, 44.0, 41.0, 53.0, 50.0, 45.0, 26.0, 28.0, 24.0, 26.0, 12.0, 12.0, 10.0, 15.0, 17.0, 6.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03082275390625, -0.02970266342163086, -0.02858257293701172, -0.027462482452392578, -0.026342391967773438, -0.025222301483154297, -0.024102210998535156, -0.022982120513916016, -0.021862030029296875, -0.020741939544677734, -0.019621849060058594, -0.018501758575439453, -0.017381668090820312, -0.016261577606201172, -0.015141487121582031, -0.01402139663696289, -0.01290130615234375, -0.01178121566772461, -0.010661125183105469, -0.009541034698486328, -0.008420944213867188, -0.007300853729248047, -0.006180763244628906, -0.005060672760009766, -0.003940582275390625, -0.0028204917907714844, -0.0017004013061523438, -0.0005803108215332031, 0.0005397796630859375, 0.0016598701477050781, 0.0027799606323242188, 0.0039000511169433594, 0.0050201416015625, 0.006140232086181641, 0.007260322570800781, 0.008380413055419922, 0.009500503540039062, 0.010620594024658203, 0.011740684509277344, 0.012860774993896484, 0.013980865478515625, 0.015100955963134766, 0.016221046447753906, 0.017341136932373047, 0.018461227416992188, 0.019581317901611328, 0.02070140838623047, 0.02182149887084961, 0.02294158935546875, 0.02406167984008789, 0.02518177032470703, 0.026301860809326172, 0.027421951293945312, 0.028542041778564453, 0.029662132263183594, 0.030782222747802734, 0.031902313232421875, 0.033022403717041016, 0.034142494201660156, 0.0352625846862793, 0.03638267517089844, 0.03750276565551758, 0.03862285614013672, 0.03974294662475586, 0.040863037109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 6.0, 8.0, 7.0, 16.0, 28.0, 40.0, 55.0, 76.0, 132.0, 237.0, 406.0, 708.0, 1402.0, 2852.0, 6013.0, 14167.0, 37261.0, 113530.0, 404040.0, 1357324.0, 1546317.0, 498215.0, 137323.0, 44149.0, 16317.0, 7006.0, 3165.0, 1559.0, 822.0, 428.0, 264.0, 147.0, 93.0, 52.0, 41.0, 26.0, 15.0, 13.0, 8.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.06268310546875, -0.06078815460205078, -0.05889320373535156, -0.056998252868652344, -0.055103302001953125, -0.053208351135253906, -0.05131340026855469, -0.04941844940185547, -0.04752349853515625, -0.04562854766845703, -0.04373359680175781, -0.041838645935058594, -0.039943695068359375, -0.038048744201660156, -0.03615379333496094, -0.03425884246826172, -0.0323638916015625, -0.03046894073486328, -0.028573989868164062, -0.026679039001464844, -0.024784088134765625, -0.022889137268066406, -0.020994186401367188, -0.01909923553466797, -0.01720428466796875, -0.015309333801269531, -0.013414382934570312, -0.011519432067871094, -0.009624481201171875, -0.007729530334472656, -0.0058345794677734375, -0.003939628601074219, -0.002044677734375, -0.00014972686767578125, 0.0017452239990234375, 0.0036401748657226562, 0.005535125732421875, 0.007430076599121094, 0.009325027465820312, 0.011219978332519531, 0.01311492919921875, 0.015009880065917969, 0.016904830932617188, 0.018799781799316406, 0.020694732666015625, 0.022589683532714844, 0.024484634399414062, 0.02637958526611328, 0.0282745361328125, 0.03016948699951172, 0.03206443786621094, 0.033959388732910156, 0.035854339599609375, 0.037749290466308594, 0.03964424133300781, 0.04153919219970703, 0.04343414306640625, 0.04532909393310547, 0.04722404479980469, 0.049118995666503906, 0.051013946533203125, 0.052908897399902344, 0.05480384826660156, 0.05669879913330078, 0.05859375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 6.0, 9.0, 8.0, 11.0, 18.0, 21.0, 44.0, 41.0, 83.0, 113.0, 144.0, 215.0, 298.0, 370.0, 480.0, 503.0, 450.0, 329.0, 248.0, 212.0, 120.0, 94.0, 75.0, 47.0, 26.0, 33.0, 15.0, 12.0, 15.0, 2.0, 10.0, 7.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05072021484375, -0.04864501953125, -0.04656982421875, -0.04449462890625, -0.04241943359375, -0.04034423828125, -0.03826904296875, -0.03619384765625, -0.03411865234375, -0.03204345703125, -0.02996826171875, -0.02789306640625, -0.02581787109375, -0.02374267578125, -0.02166748046875, -0.01959228515625, -0.01751708984375, -0.01544189453125, -0.01336669921875, -0.01129150390625, -0.00921630859375, -0.00714111328125, -0.00506591796875, -0.00299072265625, -0.00091552734375, 0.00115966796875, 0.00323486328125, 0.00531005859375, 0.00738525390625, 0.00946044921875, 0.01153564453125, 0.01361083984375, 0.01568603515625, 0.01776123046875, 0.01983642578125, 0.02191162109375, 0.02398681640625, 0.02606201171875, 0.02813720703125, 0.03021240234375, 0.03228759765625, 0.03436279296875, 0.03643798828125, 0.03851318359375, 0.04058837890625, 0.04266357421875, 0.04473876953125, 0.04681396484375, 0.04888916015625, 0.05096435546875, 0.05303955078125, 0.05511474609375, 0.05718994140625, 0.05926513671875, 0.06134033203125, 0.06341552734375, 0.06549072265625, 0.06756591796875, 0.06964111328125, 0.07171630859375, 0.07379150390625, 0.07586669921875, 0.07794189453125, 0.08001708984375, 0.08209228515625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 19.0, 25.0, 44.0, 57.0, 71.0, 92.0, 111.0, 150.0, 132.0, 104.0, 73.0, 48.0, 31.0, 17.0, 8.0, 8.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5389519929885864, -0.5237274765968323, -0.5085029006004333, -0.4932783544063568, -0.4780538082122803, -0.46282926201820374, -0.4476047158241272, -0.43238019943237305, -0.4171556234359741, -0.4019310772418976, -0.38670653104782104, -0.3714819848537445, -0.35625743865966797, -0.34103289246559143, -0.3258083462715149, -0.31058382987976074, -0.2953592836856842, -0.28013473749160767, -0.26491019129753113, -0.2496856451034546, -0.23446109890937805, -0.2192365527153015, -0.20401202142238617, -0.18878747522830963, -0.1735629290342331, -0.15833838284015656, -0.14311383664608002, -0.12788930535316467, -0.11266475170850754, -0.097440205514431, -0.08221566677093506, -0.06699112057685852, -0.05176657438278198, -0.036542028188705444, -0.021317485719919205, -0.006092943251132965, 0.009131602942943573, 0.02435614913702011, 0.03958068788051605, 0.05480523407459259, 0.07002978026866913, 0.08525432646274567, 0.1004788726568222, 0.11570341140031815, 0.1309279501438141, 0.14615249633789062, 0.16137704253196716, 0.1766015887260437, 0.19182613492012024, 0.20705068111419678, 0.22227522730827332, 0.23749977350234985, 0.2527243196964264, 0.26794886589050293, 0.2831733822822571, 0.298397958278656, 0.31362247467041016, 0.3288470208644867, 0.34407156705856323, 0.35929611325263977, 0.3745206594467163, 0.38974520564079285, 0.4049697518348694, 0.42019426822662354, 0.43541884422302246]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 5.0, 6.0, 6.0, 3.0, 7.0, 12.0, 9.0, 8.0, 11.0, 16.0, 14.0, 24.0, 24.0, 20.0, 31.0, 30.0, 32.0, 39.0, 38.0, 44.0, 33.0, 39.0, 41.0, 42.0, 41.0, 34.0, 43.0, 23.0, 34.0, 37.0, 39.0, 16.0, 36.0, 23.0, 17.0, 15.0, 15.0, 22.0, 14.0, 7.0, 10.0, 10.0, 5.0, 4.0, 7.0, 5.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.20167559385299683, -0.19519001245498657, -0.1887044459581375, -0.18221886456012726, -0.1757332980632782, -0.16924771666526794, -0.1627621352672577, -0.15627656877040863, -0.14979100227355957, -0.14330542087554932, -0.13681985437870026, -0.13033427298069, -0.12384870648384094, -0.11736312508583069, -0.11087755113840103, -0.10439197719097137, -0.09790639579296112, -0.09142082184553146, -0.0849352478981018, -0.07844966650009155, -0.07196410000324249, -0.06547851860523224, -0.05899294465780258, -0.052507370710372925, -0.04602179676294327, -0.03953622281551361, -0.033050648868083954, -0.026565071195364, -0.02007949724793434, -0.013593923300504684, -0.007108345627784729, -0.000622771680355072, 0.005862802267074585, 0.012348377145826817, 0.018833952024579048, 0.025319527834653854, 0.03180510178208351, 0.03829067572951317, 0.044776253402233124, 0.05126182734966278, 0.05774740129709244, 0.0642329752445221, 0.07071854919195175, 0.07720412313938141, 0.08368970453739166, 0.09017527103424072, 0.09666085243225098, 0.10314642637968063, 0.10963200032711029, 0.11611757427453995, 0.1226031482219696, 0.12908872961997986, 0.13557429611682892, 0.14205987751483917, 0.14854544401168823, 0.1550310254096985, 0.16151660680770874, 0.168002188205719, 0.17448775470256805, 0.1809733361005783, 0.18745890259742737, 0.19394448399543762, 0.20043006539344788, 0.20691563189029694, 0.213401198387146]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 6.0, 3.0, 3.0, 10.0, 12.0, 20.0, 18.0, 34.0, 56.0, 63.0, 123.0, 195.0, 343.0, 617.0, 1081.0, 2151.0, 4310.0, 8835.0, 18203.0, 38262.0, 88308.0, 239093.0, 355258.0, 169347.0, 64686.0, 29339.0, 13884.0, 6982.0, 3328.0, 1787.0, 894.0, 536.0, 301.0, 175.0, 102.0, 61.0, 34.0, 21.0, 22.0, 13.0, 20.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.11053466796875, -0.10700607299804688, -0.10347747802734375, -0.09994888305664062, -0.0964202880859375, -0.09289169311523438, -0.08936309814453125, -0.08583450317382812, -0.082305908203125, -0.07877731323242188, -0.07524871826171875, -0.07172012329101562, -0.0681915283203125, -0.06466293334960938, -0.06113433837890625, -0.057605743408203125, -0.0540771484375, -0.050548553466796875, -0.04701995849609375, -0.043491363525390625, -0.0399627685546875, -0.036434173583984375, -0.03290557861328125, -0.029376983642578125, -0.025848388671875, -0.022319793701171875, -0.01879119873046875, -0.015262603759765625, -0.0117340087890625, -0.008205413818359375, -0.00467681884765625, -0.001148223876953125, 0.00238037109375, 0.005908966064453125, 0.00943756103515625, 0.012966156005859375, 0.0164947509765625, 0.020023345947265625, 0.02355194091796875, 0.027080535888671875, 0.030609130859375, 0.034137725830078125, 0.03766632080078125, 0.041194915771484375, 0.0447235107421875, 0.048252105712890625, 0.05178070068359375, 0.055309295654296875, 0.058837890625, 0.062366485595703125, 0.06589508056640625, 0.06942367553710938, 0.0729522705078125, 0.07648086547851562, 0.08000946044921875, 0.08353805541992188, 0.087066650390625, 0.09059524536132812, 0.09412384033203125, 0.09765243530273438, 0.1011810302734375, 0.10470962524414062, 0.10823822021484375, 0.11176681518554688, 0.11529541015625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 11.0, 8.0, 8.0, 15.0, 11.0, 17.0, 17.0, 26.0, 33.0, 34.0, 23.0, 32.0, 27.0, 45.0, 39.0, 61.0, 50.0, 45.0, 51.0, 45.0, 55.0, 49.0, 28.0, 37.0, 40.0, 26.0, 35.0, 24.0, 22.0, 14.0, 12.0, 15.0, 6.0, 11.0, 7.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0343017578125, -0.03318500518798828, -0.03206825256347656, -0.030951499938964844, -0.029834747314453125, -0.028717994689941406, -0.027601242065429688, -0.02648448944091797, -0.02536773681640625, -0.02425098419189453, -0.023134231567382812, -0.022017478942871094, -0.020900726318359375, -0.019783973693847656, -0.018667221069335938, -0.01755046844482422, -0.0164337158203125, -0.015316963195800781, -0.014200210571289062, -0.013083457946777344, -0.011966705322265625, -0.010849952697753906, -0.009733200073242188, -0.008616447448730469, -0.00749969482421875, -0.006382942199707031, -0.0052661895751953125, -0.004149436950683594, -0.003032684326171875, -0.0019159317016601562, -0.0007991790771484375, 0.00031757354736328125, 0.001434326171875, 0.0025510787963867188, 0.0036678314208984375, 0.004784584045410156, 0.005901336669921875, 0.007018089294433594, 0.008134841918945312, 0.009251594543457031, 0.01036834716796875, 0.011485099792480469, 0.012601852416992188, 0.013718605041503906, 0.014835357666015625, 0.015952110290527344, 0.017068862915039062, 0.01818561553955078, 0.0193023681640625, 0.02041912078857422, 0.021535873413085938, 0.022652626037597656, 0.023769378662109375, 0.024886131286621094, 0.026002883911132812, 0.02711963653564453, 0.02823638916015625, 0.02935314178466797, 0.030469894409179688, 0.031586647033691406, 0.032703399658203125, 0.033820152282714844, 0.03493690490722656, 0.03605365753173828, 0.03717041015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 5.0, 12.0, 13.0, 24.0, 25.0, 36.0, 56.0, 65.0, 88.0, 126.0, 182.0, 310.0, 546.0, 1196.0, 3002.0, 8800.0, 24908.0, 73308.0, 243665.0, 431739.0, 176054.0, 54541.0, 18642.0, 6558.0, 2375.0, 960.0, 456.0, 269.0, 156.0, 114.0, 94.0, 50.0, 40.0, 37.0, 18.0, 29.0, 10.0, 11.0, 5.0, 5.0, 5.0, 7.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.140869140625, -0.13677024841308594, -0.13267135620117188, -0.1285724639892578, -0.12447357177734375, -0.12037467956542969, -0.11627578735351562, -0.11217689514160156, -0.1080780029296875, -0.10397911071777344, -0.09988021850585938, -0.09578132629394531, -0.09168243408203125, -0.08758354187011719, -0.08348464965820312, -0.07938575744628906, -0.075286865234375, -0.07118797302246094, -0.06708908081054688, -0.06299018859863281, -0.05889129638671875, -0.05479240417480469, -0.050693511962890625, -0.04659461975097656, -0.0424957275390625, -0.03839683532714844, -0.034297943115234375, -0.030199050903320312, -0.02610015869140625, -0.022001266479492188, -0.017902374267578125, -0.013803482055664062, -0.00970458984375, -0.0056056976318359375, -0.001506805419921875, 0.0025920867919921875, 0.00669097900390625, 0.010789871215820312, 0.014888763427734375, 0.018987655639648438, 0.0230865478515625, 0.027185440063476562, 0.031284332275390625, 0.03538322448730469, 0.03948211669921875, 0.04358100891113281, 0.047679901123046875, 0.05177879333496094, 0.055877685546875, 0.05997657775878906, 0.06407546997070312, 0.06817436218261719, 0.07227325439453125, 0.07637214660644531, 0.08047103881835938, 0.08456993103027344, 0.0886688232421875, 0.09276771545410156, 0.09686660766601562, 0.10096549987792969, 0.10506439208984375, 0.10916328430175781, 0.11326217651367188, 0.11736106872558594, 0.1214599609375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 5.0, 6.0, 7.0, 9.0, 15.0, 15.0, 15.0, 20.0, 23.0, 21.0, 18.0, 43.0, 37.0, 39.0, 37.0, 31.0, 54.0, 45.0, 42.0, 35.0, 42.0, 35.0, 53.0, 35.0, 26.0, 37.0, 33.0, 20.0, 32.0, 25.0, 14.0, 22.0, 14.0, 11.0, 18.0, 8.0, 11.0, 7.0, 8.0, 5.0, 5.0, 2.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.093994140625, -0.09104251861572266, -0.08809089660644531, -0.08513927459716797, -0.08218765258789062, -0.07923603057861328, -0.07628440856933594, -0.0733327865600586, -0.07038116455078125, -0.0674295425415039, -0.06447792053222656, -0.06152629852294922, -0.058574676513671875, -0.05562305450439453, -0.05267143249511719, -0.049719810485839844, -0.0467681884765625, -0.043816566467285156, -0.04086494445800781, -0.03791332244873047, -0.034961700439453125, -0.03201007843017578, -0.029058456420898438, -0.026106834411621094, -0.02315521240234375, -0.020203590393066406, -0.017251968383789062, -0.014300346374511719, -0.011348724365234375, -0.008397102355957031, -0.0054454803466796875, -0.0024938583374023438, 0.000457763671875, 0.0034093856811523438, 0.0063610076904296875, 0.009312629699707031, 0.012264251708984375, 0.015215873718261719, 0.018167495727539062, 0.021119117736816406, 0.02407073974609375, 0.027022361755371094, 0.029973983764648438, 0.03292560577392578, 0.035877227783203125, 0.03882884979248047, 0.04178047180175781, 0.044732093811035156, 0.0476837158203125, 0.050635337829589844, 0.05358695983886719, 0.05653858184814453, 0.059490203857421875, 0.06244182586669922, 0.06539344787597656, 0.0683450698852539, 0.07129669189453125, 0.0742483139038086, 0.07719993591308594, 0.08015155792236328, 0.08310317993164062, 0.08605480194091797, 0.08900642395019531, 0.09195804595947266, 0.09490966796875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 13.0, 11.0, 11.0, 30.0, 53.0, 53.0, 116.0, 200.0, 319.0, 537.0, 900.0, 1618.0, 2742.0, 4713.0, 8522.0, 15038.0, 27363.0, 51121.0, 102868.0, 206272.0, 266692.0, 177388.0, 85297.0, 43348.0, 23088.0, 13099.0, 7331.0, 4156.0, 2389.0, 1285.0, 774.0, 458.0, 295.0, 168.0, 105.0, 54.0, 57.0, 23.0, 17.0, 9.0, 9.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.050140380859375, -0.048761844635009766, -0.04738330841064453, -0.0460047721862793, -0.04462623596191406, -0.04324769973754883, -0.041869163513183594, -0.04049062728881836, -0.039112091064453125, -0.03773355484008789, -0.036355018615722656, -0.03497648239135742, -0.03359794616699219, -0.03221940994262695, -0.03084087371826172, -0.029462337493896484, -0.02808380126953125, -0.026705265045166016, -0.02532672882080078, -0.023948192596435547, -0.022569656372070312, -0.021191120147705078, -0.019812583923339844, -0.01843404769897461, -0.017055511474609375, -0.01567697525024414, -0.014298439025878906, -0.012919902801513672, -0.011541366577148438, -0.010162830352783203, -0.008784294128417969, -0.007405757904052734, -0.0060272216796875, -0.004648685455322266, -0.0032701492309570312, -0.0018916130065917969, -0.0005130767822265625, 0.0008654594421386719, 0.0022439956665039062, 0.0036225318908691406, 0.005001068115234375, 0.006379604339599609, 0.007758140563964844, 0.009136676788330078, 0.010515213012695312, 0.011893749237060547, 0.013272285461425781, 0.014650821685791016, 0.01602935791015625, 0.017407894134521484, 0.01878643035888672, 0.020164966583251953, 0.021543502807617188, 0.022922039031982422, 0.024300575256347656, 0.02567911148071289, 0.027057647705078125, 0.02843618392944336, 0.029814720153808594, 0.031193256378173828, 0.03257179260253906, 0.0339503288269043, 0.03532886505126953, 0.036707401275634766, 0.0380859375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 6.0, 8.0, 10.0, 9.0, 14.0, 7.0, 20.0, 17.0, 21.0, 25.0, 29.0, 28.0, 37.0, 35.0, 41.0, 36.0, 56.0, 50.0, 58.0, 49.0, 55.0, 55.0, 37.0, 35.0, 43.0, 31.0, 25.0, 20.0, 29.0, 17.0, 23.0, 14.0, 8.0, 4.0, 15.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.9669532775878906e-05, -1.907162368297577e-05, -1.8473714590072632e-05, -1.7875805497169495e-05, -1.7277896404266357e-05, -1.667998731136322e-05, -1.6082078218460083e-05, -1.5484169125556946e-05, -1.4886260032653809e-05, -1.4288350939750671e-05, -1.3690441846847534e-05, -1.3092532753944397e-05, -1.249462366104126e-05, -1.1896714568138123e-05, -1.1298805475234985e-05, -1.0700896382331848e-05, -1.0102987289428711e-05, -9.505078196525574e-06, -8.907169103622437e-06, -8.3092600107193e-06, -7.711350917816162e-06, -7.113441824913025e-06, -6.515532732009888e-06, -5.9176236391067505e-06, -5.319714546203613e-06, -4.721805453300476e-06, -4.123896360397339e-06, -3.5259872674942017e-06, -2.9280781745910645e-06, -2.3301690816879272e-06, -1.73225998878479e-06, -1.1343508958816528e-06, -5.364418029785156e-07, 6.146728992462158e-08, 6.593763828277588e-07, 1.257285475730896e-06, 1.8551945686340332e-06, 2.4531036615371704e-06, 3.0510127544403076e-06, 3.648921847343445e-06, 4.246830940246582e-06, 4.844740033149719e-06, 5.4426491260528564e-06, 6.040558218955994e-06, 6.638467311859131e-06, 7.236376404762268e-06, 7.834285497665405e-06, 8.432194590568542e-06, 9.03010368347168e-06, 9.628012776374817e-06, 1.0225921869277954e-05, 1.0823830962181091e-05, 1.1421740055084229e-05, 1.2019649147987366e-05, 1.2617558240890503e-05, 1.321546733379364e-05, 1.3813376426696777e-05, 1.4411285519599915e-05, 1.5009194612503052e-05, 1.560710370540619e-05, 1.6205012798309326e-05, 1.6802921891212463e-05, 1.74008309841156e-05, 1.7998740077018738e-05, 1.8596649169921875e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 4.0, 3.0, 7.0, 15.0, 15.0, 17.0, 35.0, 47.0, 75.0, 142.0, 201.0, 401.0, 925.0, 2273.0, 6303.0, 17477.0, 48374.0, 153924.0, 436613.0, 263439.0, 75454.0, 26842.0, 9743.0, 3520.0, 1356.0, 617.0, 274.0, 157.0, 102.0, 61.0, 50.0, 23.0, 21.0, 16.0, 6.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060272216796875, -0.05817270278930664, -0.05607318878173828, -0.05397367477416992, -0.05187416076660156, -0.0497746467590332, -0.047675132751464844, -0.045575618743896484, -0.043476104736328125, -0.041376590728759766, -0.039277076721191406, -0.03717756271362305, -0.03507804870605469, -0.03297853469848633, -0.03087902069091797, -0.02877950668334961, -0.02667999267578125, -0.02458047866821289, -0.02248096466064453, -0.020381450653076172, -0.018281936645507812, -0.016182422637939453, -0.014082908630371094, -0.011983394622802734, -0.009883880615234375, -0.007784366607666016, -0.005684852600097656, -0.003585338592529297, -0.0014858245849609375, 0.0006136894226074219, 0.0027132034301757812, 0.004812717437744141, 0.0069122314453125, 0.00901174545288086, 0.011111259460449219, 0.013210773468017578, 0.015310287475585938, 0.017409801483154297, 0.019509315490722656, 0.021608829498291016, 0.023708343505859375, 0.025807857513427734, 0.027907371520996094, 0.030006885528564453, 0.03210639953613281, 0.03420591354370117, 0.03630542755126953, 0.03840494155883789, 0.04050445556640625, 0.04260396957397461, 0.04470348358154297, 0.04680299758911133, 0.04890251159667969, 0.05100202560424805, 0.053101539611816406, 0.055201053619384766, 0.057300567626953125, 0.059400081634521484, 0.061499595642089844, 0.0635991096496582, 0.06569862365722656, 0.06779813766479492, 0.06989765167236328, 0.07199716567993164, 0.0740966796875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 13.0, 10.0, 12.0, 18.0, 29.0, 38.0, 37.0, 51.0, 82.0, 93.0, 109.0, 89.0, 96.0, 53.0, 61.0, 41.0, 35.0, 32.0, 15.0, 7.0, 5.0, 10.0, 14.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.070068359375, -0.0682682991027832, -0.0664682388305664, -0.06466817855834961, -0.06286811828613281, -0.061068058013916016, -0.05926799774169922, -0.05746793746948242, -0.055667877197265625, -0.05386781692504883, -0.05206775665283203, -0.050267696380615234, -0.04846763610839844, -0.04666757583618164, -0.044867515563964844, -0.04306745529174805, -0.04126739501953125, -0.03946733474731445, -0.037667274475097656, -0.03586721420288086, -0.03406715393066406, -0.032267093658447266, -0.03046703338623047, -0.028666973114013672, -0.026866912841796875, -0.025066852569580078, -0.02326679229736328, -0.021466732025146484, -0.019666671752929688, -0.01786661148071289, -0.016066551208496094, -0.014266490936279297, -0.0124664306640625, -0.010666370391845703, -0.008866310119628906, -0.007066249847412109, -0.0052661895751953125, -0.0034661293029785156, -0.0016660690307617188, 0.00013399124145507812, 0.001934051513671875, 0.003734111785888672, 0.005534172058105469, 0.007334232330322266, 0.009134292602539062, 0.01093435287475586, 0.012734413146972656, 0.014534473419189453, 0.01633453369140625, 0.018134593963623047, 0.019934654235839844, 0.02173471450805664, 0.023534774780273438, 0.025334835052490234, 0.02713489532470703, 0.028934955596923828, 0.030735015869140625, 0.03253507614135742, 0.03433513641357422, 0.036135196685791016, 0.03793525695800781, 0.03973531723022461, 0.041535377502441406, 0.0433354377746582, 0.045135498046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 9.0, 8.0, 22.0, 40.0, 78.0, 114.0, 157.0, 172.0, 155.0, 123.0, 66.0, 41.0, 17.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39134979248046875, -0.3651254177093506, -0.3389010429382324, -0.31267666816711426, -0.2864522933959961, -0.26022791862487793, -0.23400357365608215, -0.207779198884964, -0.18155482411384583, -0.15533044934272766, -0.1291060745716095, -0.10288171470165253, -0.07665733993053436, -0.0504329651594162, -0.02420860528945923, 0.0020157694816589355, 0.0282401442527771, 0.054464515298604965, 0.08068888634443283, 0.1069132536649704, 0.13313762843608856, 0.15936200320720673, 0.1855863630771637, 0.21181073784828186, 0.23803511261940002, 0.2642594873905182, 0.29048386216163635, 0.31670820713043213, 0.3429325819015503, 0.36915695667266846, 0.3953813314437866, 0.4216057062149048, 0.44783008098602295, 0.4740544557571411, 0.5002788305282593, 0.5265032052993774, 0.5527275800704956, 0.5789519548416138, 0.6051763296127319, 0.6314007043838501, 0.6576250791549683, 0.6838494539260864, 0.7100738286972046, 0.7362982034683228, 0.7625225782394409, 0.7887469530105591, 0.8149713277816772, 0.8411957025527954, 0.8674200177192688, 0.893644392490387, 0.9198687672615051, 0.9460931420326233, 0.9723175168037415, 0.9985418915748596, 1.024766206741333, 1.0509905815124512, 1.0772149562835693, 1.1034393310546875, 1.1296637058258057, 1.1558880805969238, 1.182112455368042, 1.2083368301391602, 1.2345612049102783, 1.2607855796813965, 1.2870099544525146]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 2.0, 3.0, 11.0, 10.0, 11.0, 16.0, 11.0, 11.0, 20.0, 21.0, 22.0, 21.0, 27.0, 28.0, 42.0, 39.0, 40.0, 37.0, 41.0, 32.0, 52.0, 42.0, 43.0, 32.0, 33.0, 34.0, 37.0, 37.0, 35.0, 26.0, 19.0, 19.0, 33.0, 10.0, 15.0, 14.0, 11.0, 14.0, 9.0, 12.0, 7.0, 3.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2768786549568176, -0.2682494819164276, -0.2596203088760376, -0.25099116563796997, -0.24236199259757996, -0.23373281955718994, -0.22510364651679993, -0.2164744734764099, -0.2078453153371811, -0.19921614229679108, -0.19058698415756226, -0.18195781111717224, -0.17332863807678223, -0.1646994799375534, -0.1560703068971634, -0.14744114875793457, -0.13881197571754456, -0.13018280267715454, -0.12155364453792572, -0.1129244714975357, -0.10429530590772629, -0.09566614031791687, -0.08703696727752686, -0.07840780168771744, -0.06977863609790802, -0.0611494705080986, -0.052520301192998886, -0.04389113187789917, -0.03526196628808975, -0.026632800698280334, -0.01800363138318062, -0.009374462068080902, -0.0007452964782714844, 0.007883870974183083, 0.01651303842663765, 0.025142205879092216, 0.03377137333154678, 0.0424005389213562, 0.05102970823645592, 0.059658877551555634, 0.06828804314136505, 0.07691720873117447, 0.08554637432098389, 0.0941755473613739, 0.10280471295118332, 0.11143387854099274, 0.12006305158138275, 0.12869220972061157, 0.1373213827610016, 0.1459505558013916, 0.15457971394062042, 0.16320888698101044, 0.17183804512023926, 0.18046721816062927, 0.1890963912010193, 0.1977255642414093, 0.20635472238063812, 0.21498389542102814, 0.22361305356025696, 0.23224222660064697, 0.240871399641037, 0.2495005577802658, 0.25812971591949463, 0.26675888895988464, 0.27538806200027466]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 11.0, 12.0, 23.0, 26.0, 45.0, 62.0, 76.0, 129.0, 198.0, 285.0, 444.0, 822.0, 1328.0, 2439.0, 4614.0, 10117.0, 24535.0, 73138.0, 271383.0, 1083172.0, 1805478.0, 670795.0, 163289.0, 48158.0, 17358.0, 7612.0, 3705.0, 1946.0, 1140.0, 701.0, 402.0, 288.0, 197.0, 129.0, 80.0, 34.0, 25.0, 25.0, 21.0, 6.0, 7.0, 1.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.05401611328125, -0.052173614501953125, -0.05033111572265625, -0.048488616943359375, -0.0466461181640625, -0.044803619384765625, -0.04296112060546875, -0.041118621826171875, -0.039276123046875, -0.037433624267578125, -0.03559112548828125, -0.033748626708984375, -0.0319061279296875, -0.030063629150390625, -0.02822113037109375, -0.026378631591796875, -0.0245361328125, -0.022693634033203125, -0.02085113525390625, -0.019008636474609375, -0.0171661376953125, -0.015323638916015625, -0.01348114013671875, -0.011638641357421875, -0.009796142578125, -0.007953643798828125, -0.00611114501953125, -0.004268646240234375, -0.0024261474609375, -0.000583648681640625, 0.00125885009765625, 0.003101348876953125, 0.00494384765625, 0.006786346435546875, 0.00862884521484375, 0.010471343994140625, 0.0123138427734375, 0.014156341552734375, 0.01599884033203125, 0.017841339111328125, 0.019683837890625, 0.021526336669921875, 0.02336883544921875, 0.025211334228515625, 0.0270538330078125, 0.028896331787109375, 0.03073883056640625, 0.032581329345703125, 0.034423828125, 0.036266326904296875, 0.03810882568359375, 0.039951324462890625, 0.0417938232421875, 0.043636322021484375, 0.04547882080078125, 0.047321319580078125, 0.049163818359375, 0.051006317138671875, 0.05284881591796875, 0.054691314697265625, 0.0565338134765625, 0.058376312255859375, 0.06021881103515625, 0.062061309814453125, 0.06390380859375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 2.0, 6.0, 7.0, 11.0, 7.0, 7.0, 11.0, 10.0, 12.0, 16.0, 15.0, 14.0, 20.0, 22.0, 40.0, 35.0, 36.0, 32.0, 34.0, 31.0, 36.0, 36.0, 33.0, 45.0, 37.0, 30.0, 53.0, 30.0, 43.0, 28.0, 33.0, 24.0, 27.0, 33.0, 11.0, 19.0, 20.0, 20.0, 11.0, 14.0, 10.0, 8.0, 3.0, 3.0, 1.0, 7.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.030609130859375, -0.029625892639160156, -0.028642654418945312, -0.02765941619873047, -0.026676177978515625, -0.02569293975830078, -0.024709701538085938, -0.023726463317871094, -0.02274322509765625, -0.021759986877441406, -0.020776748657226562, -0.01979351043701172, -0.018810272216796875, -0.01782703399658203, -0.016843795776367188, -0.015860557556152344, -0.0148773193359375, -0.013894081115722656, -0.012910842895507812, -0.011927604675292969, -0.010944366455078125, -0.009961128234863281, -0.008977890014648438, -0.007994651794433594, -0.00701141357421875, -0.006028175354003906, -0.0050449371337890625, -0.004061698913574219, -0.003078460693359375, -0.0020952224731445312, -0.0011119842529296875, -0.00012874603271484375, 0.0008544921875, 0.0018377304077148438, 0.0028209686279296875, 0.0038042068481445312, 0.004787445068359375, 0.005770683288574219, 0.0067539215087890625, 0.007737159729003906, 0.00872039794921875, 0.009703636169433594, 0.010686874389648438, 0.011670112609863281, 0.012653350830078125, 0.013636589050292969, 0.014619827270507812, 0.015603065490722656, 0.0165863037109375, 0.017569541931152344, 0.018552780151367188, 0.01953601837158203, 0.020519256591796875, 0.02150249481201172, 0.022485733032226562, 0.023468971252441406, 0.02445220947265625, 0.025435447692871094, 0.026418685913085938, 0.02740192413330078, 0.028385162353515625, 0.02936840057373047, 0.030351638793945312, 0.031334877014160156, 0.032318115234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 9.0, 7.0, 5.0, 19.0, 25.0, 31.0, 36.0, 65.0, 90.0, 149.0, 227.0, 355.0, 542.0, 905.0, 1607.0, 2812.0, 5612.0, 11148.0, 23741.0, 56362.0, 150706.0, 436464.0, 1145730.0, 1394684.0, 614124.0, 211772.0, 76381.0, 31340.0, 14053.0, 6868.0, 3602.0, 1950.0, 1100.0, 636.0, 409.0, 242.0, 152.0, 98.0, 75.0, 42.0, 35.0, 20.0, 21.0, 13.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.058441162109375, -0.05656576156616211, -0.05469036102294922, -0.05281496047973633, -0.05093955993652344, -0.04906415939331055, -0.047188758850097656, -0.045313358306884766, -0.043437957763671875, -0.041562557220458984, -0.039687156677246094, -0.0378117561340332, -0.03593635559082031, -0.03406095504760742, -0.03218555450439453, -0.03031015396118164, -0.02843475341796875, -0.02655935287475586, -0.02468395233154297, -0.022808551788330078, -0.020933151245117188, -0.019057750701904297, -0.017182350158691406, -0.015306949615478516, -0.013431549072265625, -0.011556148529052734, -0.009680747985839844, -0.007805347442626953, -0.0059299468994140625, -0.004054546356201172, -0.0021791458129882812, -0.0003037452697753906, 0.0015716552734375, 0.0034470558166503906, 0.005322456359863281, 0.007197856903076172, 0.009073257446289062, 0.010948657989501953, 0.012824058532714844, 0.014699459075927734, 0.016574859619140625, 0.018450260162353516, 0.020325660705566406, 0.022201061248779297, 0.024076461791992188, 0.025951862335205078, 0.02782726287841797, 0.02970266342163086, 0.03157806396484375, 0.03345346450805664, 0.03532886505126953, 0.03720426559448242, 0.03907966613769531, 0.0409550666809082, 0.042830467224121094, 0.044705867767333984, 0.046581268310546875, 0.048456668853759766, 0.050332069396972656, 0.05220746994018555, 0.05408287048339844, 0.05595827102661133, 0.05783367156982422, 0.05970907211303711, 0.06158447265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 5.0, 7.0, 12.0, 13.0, 15.0, 26.0, 50.0, 67.0, 94.0, 111.0, 209.0, 264.0, 405.0, 463.0, 522.0, 497.0, 369.0, 269.0, 191.0, 147.0, 104.0, 75.0, 42.0, 38.0, 20.0, 15.0, 7.0, 10.0, 4.0, 11.0, 2.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07647705078125, -0.073883056640625, -0.0712890625, -0.068695068359375, -0.06610107421875, -0.063507080078125, -0.0609130859375, -0.058319091796875, -0.05572509765625, -0.053131103515625, -0.050537109375, -0.047943115234375, -0.04534912109375, -0.042755126953125, -0.0401611328125, -0.037567138671875, -0.03497314453125, -0.032379150390625, -0.02978515625, -0.027191162109375, -0.02459716796875, -0.022003173828125, -0.0194091796875, -0.016815185546875, -0.01422119140625, -0.011627197265625, -0.009033203125, -0.006439208984375, -0.00384521484375, -0.001251220703125, 0.0013427734375, 0.003936767578125, 0.00653076171875, 0.009124755859375, 0.01171875, 0.014312744140625, 0.01690673828125, 0.019500732421875, 0.0220947265625, 0.024688720703125, 0.02728271484375, 0.029876708984375, 0.032470703125, 0.035064697265625, 0.03765869140625, 0.040252685546875, 0.0428466796875, 0.045440673828125, 0.04803466796875, 0.050628662109375, 0.05322265625, 0.055816650390625, 0.05841064453125, 0.061004638671875, 0.0635986328125, 0.066192626953125, 0.06878662109375, 0.071380615234375, 0.073974609375, 0.076568603515625, 0.07916259765625, 0.081756591796875, 0.0843505859375, 0.086944580078125, 0.08953857421875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 12.0, 16.0, 12.0, 22.0, 41.0, 42.0, 54.0, 53.0, 70.0, 86.0, 86.0, 85.0, 67.0, 64.0, 79.0, 57.0, 41.0, 36.0, 25.0, 21.0, 14.0, 6.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3076535761356354, -0.29612085223197937, -0.28458812832832336, -0.27305540442466736, -0.26152268052101135, -0.24998995661735535, -0.23845724761486053, -0.22692452371120453, -0.21539179980754852, -0.20385907590389252, -0.1923263520002365, -0.1807936429977417, -0.1692609190940857, -0.1577281951904297, -0.14619547128677368, -0.13466274738311768, -0.12313002347946167, -0.11159729957580566, -0.10006457567214966, -0.08853185921907425, -0.07699913531541824, -0.06546641141176224, -0.05393369495868683, -0.04240097105503082, -0.030868247151374817, -0.01933552511036396, -0.007802803069353104, 0.0037299171090126038, 0.01526264101266861, 0.026795364916324615, 0.038328081369400024, 0.04986080527305603, 0.061393558979034424, 0.07292628288269043, 0.08445900678634644, 0.09599172323942184, 0.10752444714307785, 0.11905717104673386, 0.13058988749980927, 0.14212261140346527, 0.15365533530712128, 0.16518805921077728, 0.1767207831144333, 0.1882534921169281, 0.1997862160205841, 0.2113189399242401, 0.22285166382789612, 0.23438438773155212, 0.24591711163520813, 0.25744983553886414, 0.26898255944252014, 0.28051528334617615, 0.29204800724983215, 0.30358073115348816, 0.3151134252548218, 0.3266461491584778, 0.3381788730621338, 0.3497115969657898, 0.3612443208694458, 0.3727770447731018, 0.3843097686767578, 0.3958424925804138, 0.4073752164840698, 0.41890794038772583, 0.43044066429138184]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 11.0, 10.0, 6.0, 6.0, 11.0, 15.0, 14.0, 10.0, 13.0, 16.0, 22.0, 19.0, 30.0, 29.0, 39.0, 43.0, 32.0, 41.0, 44.0, 50.0, 41.0, 31.0, 39.0, 41.0, 34.0, 38.0, 36.0, 35.0, 32.0, 23.0, 25.0, 18.0, 29.0, 19.0, 23.0, 26.0, 12.0, 10.0, 9.0, 4.0, 6.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26994889974594116, -0.2614332139492035, -0.25291749835014343, -0.24440179765224457, -0.2358860969543457, -0.22737041115760803, -0.21885471045970917, -0.2103390097618103, -0.20182330906391144, -0.19330760836601257, -0.1847919076681137, -0.17627620697021484, -0.16776052117347717, -0.15924480557441711, -0.15072911977767944, -0.14221341907978058, -0.1336977183818817, -0.12518201768398285, -0.11666631698608398, -0.10815062373876572, -0.09963492304086685, -0.09111922234296799, -0.08260352909564972, -0.07408782839775085, -0.06557212769985199, -0.057056427001953125, -0.04854073002934456, -0.04002503305673599, -0.03150933235883713, -0.022993631660938263, -0.014477934688329697, -0.00596223771572113, 0.0025534629821777344, 0.01106916181743145, 0.019584860652685165, 0.02810055948793888, 0.036616258323192596, 0.04513195902109146, 0.05364765599370003, 0.062163352966308594, 0.07067905366420746, 0.07919475436210632, 0.08771045506000519, 0.09622614830732346, 0.10474184900522232, 0.11325754970312119, 0.12177324295043945, 0.13028894364833832, 0.13880464434623718, 0.14732034504413605, 0.1558360457420349, 0.16435174643993378, 0.17286744713783264, 0.1813831329345703, 0.18989883363246918, 0.19841453433036804, 0.2069302350282669, 0.21544593572616577, 0.22396163642406464, 0.2324773371219635, 0.24099302291870117, 0.24950873851776123, 0.2580244243144989, 0.2665401101112366, 0.27505582571029663]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 9.0, 12.0, 9.0, 10.0, 23.0, 39.0, 58.0, 77.0, 108.0, 181.0, 287.0, 536.0, 1012.0, 1845.0, 3573.0, 6844.0, 13267.0, 25527.0, 49403.0, 98168.0, 194092.0, 272675.0, 187579.0, 94502.0, 47299.0, 24533.0, 12765.0, 6601.0, 3411.0, 1813.0, 893.0, 552.0, 300.0, 191.0, 110.0, 70.0, 52.0, 26.0, 21.0, 20.0, 16.0, 12.0, 13.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08734130859375, -0.08416175842285156, -0.08098220825195312, -0.07780265808105469, -0.07462310791015625, -0.07144355773925781, -0.06826400756835938, -0.06508445739746094, -0.0619049072265625, -0.05872535705566406, -0.055545806884765625, -0.05236625671386719, -0.04918670654296875, -0.04600715637207031, -0.042827606201171875, -0.03964805603027344, -0.036468505859375, -0.03328895568847656, -0.030109405517578125, -0.026929855346679688, -0.02375030517578125, -0.020570755004882812, -0.017391204833984375, -0.014211654663085938, -0.0110321044921875, -0.007852554321289062, -0.004673004150390625, -0.0014934539794921875, 0.00168609619140625, 0.0048656463623046875, 0.008045196533203125, 0.011224746704101562, 0.014404296875, 0.017583847045898438, 0.020763397216796875, 0.023942947387695312, 0.02712249755859375, 0.030302047729492188, 0.033481597900390625, 0.03666114807128906, 0.0398406982421875, 0.04302024841308594, 0.046199798583984375, 0.04937934875488281, 0.05255889892578125, 0.05573844909667969, 0.058917999267578125, 0.06209754943847656, 0.065277099609375, 0.06845664978027344, 0.07163619995117188, 0.07481575012207031, 0.07799530029296875, 0.08117485046386719, 0.08435440063476562, 0.08753395080566406, 0.0907135009765625, 0.09389305114746094, 0.09707260131835938, 0.10025215148925781, 0.10343170166015625, 0.10661125183105469, 0.10979080200195312, 0.11297035217285156, 0.11614990234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 9.0, 9.0, 10.0, 10.0, 16.0, 19.0, 19.0, 23.0, 32.0, 23.0, 33.0, 41.0, 30.0, 41.0, 35.0, 42.0, 49.0, 30.0, 38.0, 46.0, 40.0, 45.0, 36.0, 45.0, 24.0, 38.0, 31.0, 17.0, 29.0, 18.0, 23.0, 11.0, 12.0, 18.0, 14.0, 7.0, 7.0, 3.0, 2.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.037811279296875, -0.03671073913574219, -0.035610198974609375, -0.03450965881347656, -0.03340911865234375, -0.03230857849121094, -0.031208038330078125, -0.030107498168945312, -0.0290069580078125, -0.027906417846679688, -0.026805877685546875, -0.025705337524414062, -0.02460479736328125, -0.023504257202148438, -0.022403717041015625, -0.021303176879882812, -0.02020263671875, -0.019102096557617188, -0.018001556396484375, -0.016901016235351562, -0.01580047607421875, -0.014699935913085938, -0.013599395751953125, -0.012498855590820312, -0.0113983154296875, -0.010297775268554688, -0.009197235107421875, -0.008096694946289062, -0.00699615478515625, -0.0058956146240234375, -0.004795074462890625, -0.0036945343017578125, -0.002593994140625, -0.0014934539794921875, -0.000392913818359375, 0.0007076263427734375, 0.00180816650390625, 0.0029087066650390625, 0.004009246826171875, 0.0051097869873046875, 0.0062103271484375, 0.0073108673095703125, 0.008411407470703125, 0.009511947631835938, 0.01061248779296875, 0.011713027954101562, 0.012813568115234375, 0.013914108276367188, 0.0150146484375, 0.016115188598632812, 0.017215728759765625, 0.018316268920898438, 0.01941680908203125, 0.020517349243164062, 0.021617889404296875, 0.022718429565429688, 0.0238189697265625, 0.024919509887695312, 0.026020050048828125, 0.027120590209960938, 0.02822113037109375, 0.029321670532226562, 0.030422210693359375, 0.03152275085449219, 0.032623291015625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 6.0, 6.0, 7.0, 11.0, 15.0, 30.0, 28.0, 50.0, 80.0, 128.0, 172.0, 433.0, 927.0, 2554.0, 7489.0, 22874.0, 69710.0, 220402.0, 430903.0, 197752.0, 63350.0, 20829.0, 6724.0, 2279.0, 826.0, 375.0, 198.0, 129.0, 78.0, 46.0, 40.0, 43.0, 22.0, 15.0, 10.0, 7.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152587890625, -0.14740753173828125, -0.1422271728515625, -0.13704681396484375, -0.131866455078125, -0.12668609619140625, -0.1215057373046875, -0.11632537841796875, -0.11114501953125, -0.10596466064453125, -0.1007843017578125, -0.09560394287109375, -0.090423583984375, -0.08524322509765625, -0.0800628662109375, -0.07488250732421875, -0.0697021484375, -0.06452178955078125, -0.0593414306640625, -0.05416107177734375, -0.048980712890625, -0.04380035400390625, -0.0386199951171875, -0.03343963623046875, -0.02825927734375, -0.02307891845703125, -0.0178985595703125, -0.01271820068359375, -0.007537841796875, -0.00235748291015625, 0.0028228759765625, 0.00800323486328125, 0.01318359375, 0.01836395263671875, 0.0235443115234375, 0.02872467041015625, 0.033905029296875, 0.03908538818359375, 0.0442657470703125, 0.04944610595703125, 0.05462646484375, 0.05980682373046875, 0.0649871826171875, 0.07016754150390625, 0.075347900390625, 0.08052825927734375, 0.0857086181640625, 0.09088897705078125, 0.0960693359375, 0.10124969482421875, 0.1064300537109375, 0.11161041259765625, 0.116790771484375, 0.12197113037109375, 0.1271514892578125, 0.13233184814453125, 0.13751220703125, 0.14269256591796875, 0.1478729248046875, 0.15305328369140625, 0.158233642578125, 0.16341400146484375, 0.1685943603515625, 0.17377471923828125, 0.178955078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 10.0, 11.0, 14.0, 14.0, 18.0, 24.0, 27.0, 24.0, 26.0, 31.0, 48.0, 50.0, 46.0, 44.0, 41.0, 44.0, 46.0, 48.0, 40.0, 47.0, 47.0, 42.0, 33.0, 30.0, 27.0, 23.0, 25.0, 22.0, 12.0, 12.0, 8.0, 9.0, 5.0, 5.0, 9.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1080322265625, -0.1042633056640625, -0.100494384765625, -0.0967254638671875, -0.09295654296875, -0.0891876220703125, -0.085418701171875, -0.0816497802734375, -0.077880859375, -0.0741119384765625, -0.070343017578125, -0.0665740966796875, -0.06280517578125, -0.0590362548828125, -0.055267333984375, -0.0514984130859375, -0.0477294921875, -0.0439605712890625, -0.040191650390625, -0.0364227294921875, -0.03265380859375, -0.0288848876953125, -0.025115966796875, -0.0213470458984375, -0.017578125, -0.0138092041015625, -0.010040283203125, -0.0062713623046875, -0.00250244140625, 0.0012664794921875, 0.005035400390625, 0.0088043212890625, 0.0125732421875, 0.0163421630859375, 0.020111083984375, 0.0238800048828125, 0.02764892578125, 0.0314178466796875, 0.035186767578125, 0.0389556884765625, 0.042724609375, 0.0464935302734375, 0.050262451171875, 0.0540313720703125, 0.05780029296875, 0.0615692138671875, 0.065338134765625, 0.0691070556640625, 0.0728759765625, 0.0766448974609375, 0.080413818359375, 0.0841827392578125, 0.08795166015625, 0.0917205810546875, 0.095489501953125, 0.0992584228515625, 0.10302734375, 0.1067962646484375, 0.110565185546875, 0.1143341064453125, 0.11810302734375, 0.1218719482421875, 0.125640869140625, 0.1294097900390625, 0.1331787109375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 17.0, 23.0, 50.0, 81.0, 111.0, 184.0, 357.0, 780.0, 1454.0, 3336.0, 7140.0, 16120.0, 38689.0, 94801.0, 236249.0, 342132.0, 182004.0, 71832.0, 29528.0, 12783.0, 5638.0, 2612.0, 1230.0, 626.0, 309.0, 185.0, 127.0, 46.0, 33.0, 28.0, 13.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0673828125, -0.06516265869140625, -0.0629425048828125, -0.06072235107421875, -0.058502197265625, -0.05628204345703125, -0.0540618896484375, -0.05184173583984375, -0.04962158203125, -0.04740142822265625, -0.0451812744140625, -0.04296112060546875, -0.040740966796875, -0.03852081298828125, -0.0363006591796875, -0.03408050537109375, -0.0318603515625, -0.02964019775390625, -0.0274200439453125, -0.02519989013671875, -0.022979736328125, -0.02075958251953125, -0.0185394287109375, -0.01631927490234375, -0.01409912109375, -0.01187896728515625, -0.0096588134765625, -0.00743865966796875, -0.005218505859375, -0.00299835205078125, -0.0007781982421875, 0.00144195556640625, 0.003662109375, 0.00588226318359375, 0.0081024169921875, 0.01032257080078125, 0.012542724609375, 0.01476287841796875, 0.0169830322265625, 0.01920318603515625, 0.02142333984375, 0.02364349365234375, 0.0258636474609375, 0.02808380126953125, 0.030303955078125, 0.03252410888671875, 0.0347442626953125, 0.03696441650390625, 0.0391845703125, 0.04140472412109375, 0.0436248779296875, 0.04584503173828125, 0.048065185546875, 0.05028533935546875, 0.0525054931640625, 0.05472564697265625, 0.05694580078125, 0.05916595458984375, 0.0613861083984375, 0.06360626220703125, 0.065826416015625, 0.06804656982421875, 0.0702667236328125, 0.07248687744140625, 0.07470703125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 1.0, 1.0, 8.0, 12.0, 6.0, 7.0, 16.0, 8.0, 17.0, 14.0, 20.0, 15.0, 30.0, 41.0, 38.0, 32.0, 36.0, 38.0, 41.0, 43.0, 42.0, 55.0, 43.0, 57.0, 52.0, 35.0, 28.0, 34.0, 35.0, 25.0, 33.0, 19.0, 21.0, 16.0, 12.0, 13.0, 11.0, 7.0, 4.0, 1.0, 8.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.531839370727539e-05, -1.4839693903923035e-05, -1.4360994100570679e-05, -1.3882294297218323e-05, -1.3403594493865967e-05, -1.292489469051361e-05, -1.2446194887161255e-05, -1.1967495083808899e-05, -1.1488795280456543e-05, -1.1010095477104187e-05, -1.0531395673751831e-05, -1.0052695870399475e-05, -9.573996067047119e-06, -9.095296263694763e-06, -8.616596460342407e-06, -8.137896656990051e-06, -7.659196853637695e-06, -7.180497050285339e-06, -6.701797246932983e-06, -6.2230974435806274e-06, -5.7443976402282715e-06, -5.2656978368759155e-06, -4.7869980335235596e-06, -4.308298230171204e-06, -3.829598426818848e-06, -3.3508986234664917e-06, -2.8721988201141357e-06, -2.3934990167617798e-06, -1.914799213409424e-06, -1.4360994100570679e-06, -9.57399606704712e-07, -4.78699803352356e-07, 0.0, 4.78699803352356e-07, 9.57399606704712e-07, 1.4360994100570679e-06, 1.914799213409424e-06, 2.3934990167617798e-06, 2.8721988201141357e-06, 3.3508986234664917e-06, 3.829598426818848e-06, 4.308298230171204e-06, 4.7869980335235596e-06, 5.2656978368759155e-06, 5.7443976402282715e-06, 6.2230974435806274e-06, 6.701797246932983e-06, 7.180497050285339e-06, 7.659196853637695e-06, 8.137896656990051e-06, 8.616596460342407e-06, 9.095296263694763e-06, 9.573996067047119e-06, 1.0052695870399475e-05, 1.0531395673751831e-05, 1.1010095477104187e-05, 1.1488795280456543e-05, 1.1967495083808899e-05, 1.2446194887161255e-05, 1.292489469051361e-05, 1.3403594493865967e-05, 1.3882294297218323e-05, 1.4360994100570679e-05, 1.4839693903923035e-05, 1.531839370727539e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 5.0, 7.0, 9.0, 16.0, 23.0, 18.0, 48.0, 66.0, 86.0, 178.0, 297.0, 627.0, 1357.0, 3218.0, 8298.0, 22829.0, 64097.0, 182697.0, 382061.0, 245879.0, 86969.0, 30842.0, 11264.0, 4296.0, 1690.0, 792.0, 354.0, 196.0, 132.0, 64.0, 58.0, 18.0, 17.0, 11.0, 14.0, 4.0, 7.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0733642578125, -0.07097053527832031, -0.06857681274414062, -0.06618309020996094, -0.06378936767578125, -0.06139564514160156, -0.059001922607421875, -0.05660820007324219, -0.0542144775390625, -0.05182075500488281, -0.049427032470703125, -0.04703330993652344, -0.04463958740234375, -0.04224586486816406, -0.039852142333984375, -0.03745841979980469, -0.035064697265625, -0.03267097473144531, -0.030277252197265625, -0.027883529663085938, -0.02548980712890625, -0.023096084594726562, -0.020702362060546875, -0.018308639526367188, -0.0159149169921875, -0.013521194458007812, -0.011127471923828125, -0.008733749389648438, -0.00634002685546875, -0.0039463043212890625, -0.001552581787109375, 0.0008411407470703125, 0.00323486328125, 0.0056285858154296875, 0.008022308349609375, 0.010416030883789062, 0.01280975341796875, 0.015203475952148438, 0.017597198486328125, 0.019990921020507812, 0.0223846435546875, 0.024778366088867188, 0.027172088623046875, 0.029565811157226562, 0.03195953369140625, 0.03435325622558594, 0.036746978759765625, 0.03914070129394531, 0.041534423828125, 0.04392814636230469, 0.046321868896484375, 0.04871559143066406, 0.05110931396484375, 0.05350303649902344, 0.055896759033203125, 0.05829048156738281, 0.0606842041015625, 0.06307792663574219, 0.06547164916992188, 0.06786537170410156, 0.07025909423828125, 0.07265281677246094, 0.07504653930664062, 0.07744026184082031, 0.079833984375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 8.0, 11.0, 20.0, 27.0, 22.0, 43.0, 53.0, 59.0, 98.0, 99.0, 89.0, 94.0, 82.0, 74.0, 52.0, 33.0, 30.0, 16.0, 13.0, 15.0, 15.0, 9.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059967041015625, -0.057779788970947266, -0.05559253692626953, -0.0534052848815918, -0.05121803283691406, -0.04903078079223633, -0.046843528747558594, -0.04465627670288086, -0.042469024658203125, -0.04028177261352539, -0.038094520568847656, -0.03590726852416992, -0.03372001647949219, -0.03153276443481445, -0.02934551239013672, -0.027158260345458984, -0.02497100830078125, -0.022783756256103516, -0.02059650421142578, -0.018409252166748047, -0.016222000122070312, -0.014034748077392578, -0.011847496032714844, -0.00966024398803711, -0.007472991943359375, -0.005285739898681641, -0.0030984878540039062, -0.0009112358093261719, 0.0012760162353515625, 0.003463268280029297, 0.005650520324707031, 0.007837772369384766, 0.0100250244140625, 0.012212276458740234, 0.014399528503417969, 0.016586780548095703, 0.018774032592773438, 0.020961284637451172, 0.023148536682128906, 0.02533578872680664, 0.027523040771484375, 0.02971029281616211, 0.031897544860839844, 0.03408479690551758, 0.03627204895019531, 0.03845930099487305, 0.04064655303955078, 0.042833805084228516, 0.04502105712890625, 0.047208309173583984, 0.04939556121826172, 0.05158281326293945, 0.05377006530761719, 0.05595731735229492, 0.058144569396972656, 0.06033182144165039, 0.06251907348632812, 0.06470632553100586, 0.0668935775756836, 0.06908082962036133, 0.07126808166503906, 0.0734553337097168, 0.07564258575439453, 0.07782983779907227, 0.08001708984375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 15.0, 48.0, 86.0, 122.0, 164.0, 190.0, 161.0, 114.0, 55.0, 28.0, 17.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5866121053695679, -0.5525913834571838, -0.5185706615447998, -0.4845499098300934, -0.45052915811538696, -0.41650843620300293, -0.3824877142906189, -0.34846699237823486, -0.31444624066352844, -0.2804255187511444, -0.246404767036438, -0.21238404512405396, -0.17836330831050873, -0.1443425714969635, -0.11032184958457947, -0.07630111277103424, -0.042280375957489014, -0.008259642869234085, 0.025761090219020844, 0.059781819581985474, 0.0938025563955307, 0.12782329320907593, 0.16184401512145996, 0.1958647519350052, 0.22988548874855042, 0.26390621066093445, 0.29792696237564087, 0.3319476842880249, 0.36596840620040894, 0.39998915791511536, 0.4340098798274994, 0.4680306315422058, 0.5020513534545898, 0.5360720753669739, 0.5700927972793579, 0.6041135787963867, 0.6381343007087708, 0.6721550226211548, 0.7061757445335388, 0.7401964664459229, 0.7742172479629517, 0.8082379698753357, 0.8422586917877197, 0.8762794733047485, 0.9103001952171326, 0.9443209171295166, 0.9783416390419006, 1.0123623609542847, 1.0463831424713135, 1.0804039239883423, 1.1144245862960815, 1.1484453678131104, 1.1824660301208496, 1.2164868116378784, 1.2505075931549072, 1.2845282554626465, 1.3185489177703857, 1.3525696992874146, 1.3865903615951538, 1.4206111431121826, 1.4546318054199219, 1.4886525869369507, 1.5226733684539795, 1.5566940307617188, 1.5907148122787476]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 7.0, 5.0, 5.0, 4.0, 9.0, 9.0, 16.0, 14.0, 5.0, 17.0, 18.0, 19.0, 26.0, 31.0, 23.0, 27.0, 30.0, 30.0, 35.0, 43.0, 38.0, 33.0, 38.0, 51.0, 44.0, 32.0, 32.0, 28.0, 30.0, 39.0, 31.0, 27.0, 27.0, 23.0, 24.0, 15.0, 17.0, 20.0, 14.0, 9.0, 15.0, 12.0, 8.0, 4.0, 4.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.3092392086982727, -0.2999470829963684, -0.2906549572944641, -0.2813628017902374, -0.27207067608833313, -0.26277855038642883, -0.25348639488220215, -0.24419426918029785, -0.23490214347839355, -0.22561001777648926, -0.21631787717342377, -0.20702573657035828, -0.19773361086845398, -0.18844148516654968, -0.1791493445634842, -0.1698572039604187, -0.1605650782585144, -0.1512729525566101, -0.14198081195354462, -0.13268867135047913, -0.12339654564857483, -0.11410441249608994, -0.10481227934360504, -0.09552014619112015, -0.08622801303863525, -0.07693587988615036, -0.06764374673366547, -0.05835161358118057, -0.04905948042869568, -0.039767347276210785, -0.03047521412372589, -0.021183080971240997, -0.011890947818756104, -0.0025988146662712097, 0.006693318486213684, 0.015985451638698578, 0.02527758479118347, 0.034569717943668365, 0.04386185109615326, 0.05315398424863815, 0.06244611740112305, 0.07173825055360794, 0.08103038370609283, 0.09032251685857773, 0.09961465001106262, 0.10890678316354752, 0.11819891631603241, 0.1274910569190979, 0.1367831826210022, 0.1460753083229065, 0.15536744892597198, 0.16465958952903748, 0.17395171523094177, 0.18324384093284607, 0.19253598153591156, 0.20182812213897705, 0.21112024784088135, 0.22041237354278564, 0.22970451414585114, 0.23899665474891663, 0.24828878045082092, 0.2575809061527252, 0.2668730616569519, 0.2761651873588562, 0.2854573130607605]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 5.0, 9.0, 3.0, 7.0, 12.0, 16.0, 18.0, 27.0, 23.0, 33.0, 35.0, 68.0, 117.0, 210.0, 396.0, 959.0, 2341.0, 6091.0, 18010.0, 61053.0, 242289.0, 1102757.0, 2023261.0, 555658.0, 127460.0, 34949.0, 11362.0, 3939.0, 1634.0, 642.0, 339.0, 180.0, 105.0, 69.0, 51.0, 33.0, 29.0, 12.0, 19.0, 21.0, 7.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 4.0], "bins": [-0.0887451171875, -0.08615589141845703, -0.08356666564941406, -0.0809774398803711, -0.07838821411132812, -0.07579898834228516, -0.07320976257324219, -0.07062053680419922, -0.06803131103515625, -0.06544208526611328, -0.06285285949707031, -0.060263633728027344, -0.057674407958984375, -0.055085182189941406, -0.05249595642089844, -0.04990673065185547, -0.0473175048828125, -0.04472827911376953, -0.04213905334472656, -0.039549827575683594, -0.036960601806640625, -0.034371376037597656, -0.03178215026855469, -0.02919292449951172, -0.02660369873046875, -0.02401447296142578, -0.021425247192382812, -0.018836021423339844, -0.016246795654296875, -0.013657569885253906, -0.011068344116210938, -0.008479118347167969, -0.005889892578125, -0.0033006668090820312, -0.0007114410400390625, 0.0018777847290039062, 0.004467010498046875, 0.007056236267089844, 0.009645462036132812, 0.012234687805175781, 0.01482391357421875, 0.01741313934326172, 0.020002365112304688, 0.022591590881347656, 0.025180816650390625, 0.027770042419433594, 0.030359268188476562, 0.03294849395751953, 0.0355377197265625, 0.03812694549560547, 0.04071617126464844, 0.043305397033691406, 0.045894622802734375, 0.048483848571777344, 0.05107307434082031, 0.05366230010986328, 0.05625152587890625, 0.05884075164794922, 0.06142997741699219, 0.06401920318603516, 0.06660842895507812, 0.0691976547241211, 0.07178688049316406, 0.07437610626220703, 0.07696533203125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 10.0, 9.0, 10.0, 6.0, 17.0, 23.0, 21.0, 26.0, 21.0, 17.0, 18.0, 26.0, 23.0, 24.0, 16.0, 36.0, 33.0, 41.0, 28.0, 35.0, 42.0, 37.0, 33.0, 37.0, 35.0, 37.0, 33.0, 31.0, 37.0, 34.0, 16.0, 23.0, 27.0, 17.0, 17.0, 12.0, 19.0, 12.0, 8.0, 7.0, 8.0, 10.0, 5.0, 3.0, 2.0, 5.0, 3.0, 3.0, 3.0], "bins": [-0.0382080078125, -0.037138938903808594, -0.03606986999511719, -0.03500080108642578, -0.033931732177734375, -0.03286266326904297, -0.03179359436035156, -0.030724525451660156, -0.02965545654296875, -0.028586387634277344, -0.027517318725585938, -0.02644824981689453, -0.025379180908203125, -0.02431011199951172, -0.023241043090820312, -0.022171974182128906, -0.0211029052734375, -0.020033836364746094, -0.018964767456054688, -0.01789569854736328, -0.016826629638671875, -0.01575756072998047, -0.014688491821289062, -0.013619422912597656, -0.01255035400390625, -0.011481285095214844, -0.010412216186523438, -0.009343147277832031, -0.008274078369140625, -0.007205009460449219, -0.0061359405517578125, -0.005066871643066406, -0.003997802734375, -0.0029287338256835938, -0.0018596649169921875, -0.0007905960083007812, 0.000278472900390625, 0.0013475418090820312, 0.0024166107177734375, 0.0034856796264648438, 0.00455474853515625, 0.005623817443847656, 0.0066928863525390625, 0.007761955261230469, 0.008831024169921875, 0.009900093078613281, 0.010969161987304688, 0.012038230895996094, 0.0131072998046875, 0.014176368713378906, 0.015245437622070312, 0.01631450653076172, 0.017383575439453125, 0.01845264434814453, 0.019521713256835938, 0.020590782165527344, 0.02165985107421875, 0.022728919982910156, 0.023797988891601562, 0.02486705780029297, 0.025936126708984375, 0.02700519561767578, 0.028074264526367188, 0.029143333435058594, 0.03021240234375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 5.0, 17.0, 16.0, 18.0, 44.0, 62.0, 92.0, 144.0, 227.0, 368.0, 627.0, 1049.0, 1999.0, 3686.0, 7532.0, 15956.0, 38471.0, 106340.0, 335478.0, 1073663.0, 1649693.0, 646605.0, 197207.0, 66481.0, 25620.0, 11031.0, 5354.0, 2815.0, 1492.0, 834.0, 492.0, 302.0, 183.0, 116.0, 83.0, 46.0, 33.0, 27.0, 23.0, 14.0, 8.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.10113525390625, -0.09809589385986328, -0.09505653381347656, -0.09201717376708984, -0.08897781372070312, -0.0859384536743164, -0.08289909362792969, -0.07985973358154297, -0.07682037353515625, -0.07378101348876953, -0.07074165344238281, -0.0677022933959961, -0.06466293334960938, -0.061623573303222656, -0.05858421325683594, -0.05554485321044922, -0.0525054931640625, -0.04946613311767578, -0.04642677307128906, -0.043387413024902344, -0.040348052978515625, -0.037308692932128906, -0.03426933288574219, -0.03122997283935547, -0.02819061279296875, -0.02515125274658203, -0.022111892700195312, -0.019072532653808594, -0.016033172607421875, -0.012993812561035156, -0.009954452514648438, -0.006915092468261719, -0.003875732421875, -0.0008363723754882812, 0.0022029876708984375, 0.005242347717285156, 0.008281707763671875, 0.011321067810058594, 0.014360427856445312, 0.01739978790283203, 0.02043914794921875, 0.02347850799560547, 0.026517868041992188, 0.029557228088378906, 0.032596588134765625, 0.035635948181152344, 0.03867530822753906, 0.04171466827392578, 0.0447540283203125, 0.04779338836669922, 0.05083274841308594, 0.053872108459472656, 0.056911468505859375, 0.059950828552246094, 0.06299018859863281, 0.06602954864501953, 0.06906890869140625, 0.07210826873779297, 0.07514762878417969, 0.0781869888305664, 0.08122634887695312, 0.08426570892333984, 0.08730506896972656, 0.09034442901611328, 0.0933837890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 10.0, 16.0, 16.0, 18.0, 27.0, 40.0, 55.0, 81.0, 102.0, 137.0, 199.0, 218.0, 325.0, 440.0, 454.0, 436.0, 343.0, 305.0, 226.0, 164.0, 133.0, 90.0, 58.0, 40.0, 33.0, 23.0, 17.0, 8.0, 10.0, 9.0, 8.0, 5.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.091552734375, -0.08883094787597656, -0.08610916137695312, -0.08338737487792969, -0.08066558837890625, -0.07794380187988281, -0.07522201538085938, -0.07250022888183594, -0.0697784423828125, -0.06705665588378906, -0.06433486938476562, -0.06161308288574219, -0.05889129638671875, -0.05616950988769531, -0.053447723388671875, -0.05072593688964844, -0.048004150390625, -0.04528236389160156, -0.042560577392578125, -0.03983879089355469, -0.03711700439453125, -0.03439521789550781, -0.031673431396484375, -0.028951644897460938, -0.0262298583984375, -0.023508071899414062, -0.020786285400390625, -0.018064498901367188, -0.01534271240234375, -0.012620925903320312, -0.009899139404296875, -0.0071773529052734375, -0.00445556640625, -0.0017337799072265625, 0.000988006591796875, 0.0037097930908203125, 0.00643157958984375, 0.009153366088867188, 0.011875152587890625, 0.014596939086914062, 0.0173187255859375, 0.020040512084960938, 0.022762298583984375, 0.025484085083007812, 0.02820587158203125, 0.030927658081054688, 0.033649444580078125, 0.03637123107910156, 0.039093017578125, 0.04181480407714844, 0.044536590576171875, 0.04725837707519531, 0.04998016357421875, 0.05270195007324219, 0.055423736572265625, 0.05814552307128906, 0.0608673095703125, 0.06358909606933594, 0.06631088256835938, 0.06903266906738281, 0.07175445556640625, 0.07447624206542969, 0.07719802856445312, 0.07991981506347656, 0.0826416015625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 28.0, 28.0, 39.0, 66.0, 79.0, 93.0, 100.0, 110.0, 112.0, 90.0, 70.0, 58.0, 45.0, 33.0, 21.0, 13.0, 6.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.987786054611206, -0.9681124687194824, -0.9484389424324036, -0.9287653565406799, -0.9090918302536011, -0.8894182443618774, -0.8697447180747986, -0.850071132183075, -0.8303976058959961, -0.8107240200042725, -0.7910504937171936, -0.77137690782547, -0.7517033815383911, -0.7320297956466675, -0.7123562693595886, -0.692682683467865, -0.6730091571807861, -0.6533355712890625, -0.6336620450019836, -0.61398845911026, -0.5943149328231812, -0.5746413469314575, -0.5549678206443787, -0.535294234752655, -0.5156206488609314, -0.49594709277153015, -0.4762735366821289, -0.45659998059272766, -0.4369264245033264, -0.41725286841392517, -0.3975793123245239, -0.3779057264328003, -0.3582322299480438, -0.3385586738586426, -0.31888511776924133, -0.2992115616798401, -0.27953800559043884, -0.2598644495010376, -0.24019087851047516, -0.2205173224210739, -0.20084376633167267, -0.18117021024227142, -0.16149665415287018, -0.14182308316230774, -0.12214953452348709, -0.10247597843408585, -0.082802414894104, -0.06312885880470276, -0.043455302715301514, -0.02378174476325512, -0.004108186811208725, 0.015565373003482819, 0.035238929092884064, 0.05491248518228531, 0.07458604872226715, 0.0942596048116684, 0.11393316090106964, 0.1336067169904709, 0.15328027307987213, 0.17295384407043457, 0.19262740015983582, 0.21230095624923706, 0.2319745123386383, 0.25164806842803955, 0.2713216245174408]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 8.0, 6.0, 8.0, 15.0, 9.0, 18.0, 30.0, 25.0, 22.0, 33.0, 34.0, 39.0, 36.0, 38.0, 36.0, 36.0, 45.0, 44.0, 30.0, 34.0, 40.0, 28.0, 38.0, 31.0, 27.0, 24.0, 36.0, 30.0, 23.0, 27.0, 26.0, 13.0, 9.0, 18.0, 19.0, 7.0, 10.0, 8.0, 8.0, 1.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2897762656211853, -0.2804456949234009, -0.27111512422561646, -0.26178452372550964, -0.2524539530277252, -0.2431233823299408, -0.23379281163215637, -0.22446222603321075, -0.21513164043426514, -0.2058010697364807, -0.1964704841375351, -0.18713991343975067, -0.17780932784080505, -0.16847875714302063, -0.1591481864452362, -0.1498176008462906, -0.14048703014850616, -0.13115645945072174, -0.12182587385177612, -0.1124953031539917, -0.10316471755504608, -0.09383414685726166, -0.08450356870889664, -0.07517299056053162, -0.0658424124121666, -0.056511834263801575, -0.047181256115436554, -0.03785068169236183, -0.02852010354399681, -0.01918952539563179, -0.009858950972557068, -0.0005283728241920471, 0.008802205324172974, 0.018132783472537994, 0.027463359758257866, 0.03679393604397774, 0.04612451419234276, 0.05545509234070778, 0.0647856667637825, 0.07411624491214752, 0.08344682306051254, 0.09277740120887756, 0.10210797935724258, 0.1114385575056076, 0.12076912820339203, 0.13009971380233765, 0.13943028450012207, 0.1487608551979065, 0.1580914407968521, 0.16742201149463654, 0.17675259709358215, 0.18608316779136658, 0.1954137533903122, 0.20474432408809662, 0.21407490968704224, 0.22340548038482666, 0.23273605108261108, 0.2420666217803955, 0.25139719247817993, 0.26072779297828674, 0.27005836367607117, 0.2793889343738556, 0.28871950507164, 0.2980501055717468, 0.30738067626953125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 1.0, 2.0, 11.0, 14.0, 22.0, 26.0, 48.0, 77.0, 133.0, 243.0, 360.0, 639.0, 1083.0, 1891.0, 3501.0, 5809.0, 10299.0, 18410.0, 32711.0, 60664.0, 126614.0, 256298.0, 260685.0, 130072.0, 61673.0, 33318.0, 18980.0, 10642.0, 6099.0, 3555.0, 2003.0, 1093.0, 680.0, 372.0, 200.0, 122.0, 75.0, 48.0, 33.0, 11.0, 14.0, 12.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0789794921875, -0.07625770568847656, -0.07353591918945312, -0.07081413269042969, -0.06809234619140625, -0.06537055969238281, -0.06264877319335938, -0.05992698669433594, -0.0572052001953125, -0.05448341369628906, -0.051761627197265625, -0.04903984069824219, -0.04631805419921875, -0.04359626770019531, -0.040874481201171875, -0.03815269470214844, -0.035430908203125, -0.03270912170410156, -0.029987335205078125, -0.027265548706054688, -0.02454376220703125, -0.021821975708007812, -0.019100189208984375, -0.016378402709960938, -0.0136566162109375, -0.010934829711914062, -0.008213043212890625, -0.0054912567138671875, -0.00276947021484375, -4.76837158203125e-05, 0.002674102783203125, 0.0053958892822265625, 0.00811767578125, 0.010839462280273438, 0.013561248779296875, 0.016283035278320312, 0.01900482177734375, 0.021726608276367188, 0.024448394775390625, 0.027170181274414062, 0.0298919677734375, 0.03261375427246094, 0.035335540771484375, 0.03805732727050781, 0.04077911376953125, 0.04350090026855469, 0.046222686767578125, 0.04894447326660156, 0.051666259765625, 0.05438804626464844, 0.057109832763671875, 0.05983161926269531, 0.06255340576171875, 0.06527519226074219, 0.06799697875976562, 0.07071876525878906, 0.0734405517578125, 0.07616233825683594, 0.07888412475585938, 0.08160591125488281, 0.08432769775390625, 0.08704948425292969, 0.08977127075195312, 0.09249305725097656, 0.09521484375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 5.0, 9.0, 6.0, 17.0, 6.0, 8.0, 14.0, 11.0, 19.0, 18.0, 21.0, 22.0, 29.0, 23.0, 26.0, 25.0, 36.0, 31.0, 33.0, 34.0, 33.0, 33.0, 43.0, 36.0, 40.0, 37.0, 35.0, 43.0, 41.0, 30.0, 26.0, 26.0, 22.0, 22.0, 17.0, 18.0, 15.0, 20.0, 13.0, 9.0, 12.0, 4.0, 6.0, 11.0, 3.0, 1.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.03802490234375, -0.036858558654785156, -0.03569221496582031, -0.03452587127685547, -0.033359527587890625, -0.03219318389892578, -0.031026840209960938, -0.029860496520996094, -0.02869415283203125, -0.027527809143066406, -0.026361465454101562, -0.02519512176513672, -0.024028778076171875, -0.02286243438720703, -0.021696090698242188, -0.020529747009277344, -0.0193634033203125, -0.018197059631347656, -0.017030715942382812, -0.01586437225341797, -0.014698028564453125, -0.013531684875488281, -0.012365341186523438, -0.011198997497558594, -0.01003265380859375, -0.008866310119628906, -0.0076999664306640625, -0.006533622741699219, -0.005367279052734375, -0.004200935363769531, -0.0030345916748046875, -0.0018682479858398438, -0.000701904296875, 0.00046443939208984375, 0.0016307830810546875, 0.0027971267700195312, 0.003963470458984375, 0.005129814147949219, 0.0062961578369140625, 0.007462501525878906, 0.00862884521484375, 0.009795188903808594, 0.010961532592773438, 0.012127876281738281, 0.013294219970703125, 0.014460563659667969, 0.015626907348632812, 0.016793251037597656, 0.0179595947265625, 0.019125938415527344, 0.020292282104492188, 0.02145862579345703, 0.022624969482421875, 0.02379131317138672, 0.024957656860351562, 0.026124000549316406, 0.02729034423828125, 0.028456687927246094, 0.029623031616210938, 0.03078937530517578, 0.031955718994140625, 0.03312206268310547, 0.03428840637207031, 0.035454750061035156, 0.03662109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 5.0, 7.0, 5.0, 9.0, 19.0, 11.0, 22.0, 30.0, 46.0, 77.0, 108.0, 184.0, 310.0, 548.0, 1083.0, 2056.0, 4389.0, 10142.0, 25287.0, 72364.0, 297306.0, 459074.0, 113972.0, 36165.0, 13893.0, 5789.0, 2661.0, 1326.0, 651.0, 407.0, 198.0, 144.0, 82.0, 47.0, 30.0, 30.0, 33.0, 7.0, 9.0, 8.0, 5.0, 6.0, 6.0, 1.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.191162109375, -0.18556976318359375, -0.1799774169921875, -0.17438507080078125, -0.168792724609375, -0.16320037841796875, -0.1576080322265625, -0.15201568603515625, -0.14642333984375, -0.14083099365234375, -0.1352386474609375, -0.12964630126953125, -0.124053955078125, -0.11846160888671875, -0.1128692626953125, -0.10727691650390625, -0.1016845703125, -0.09609222412109375, -0.0904998779296875, -0.08490753173828125, -0.079315185546875, -0.07372283935546875, -0.0681304931640625, -0.06253814697265625, -0.05694580078125, -0.05135345458984375, -0.0457611083984375, -0.04016876220703125, -0.034576416015625, -0.02898406982421875, -0.0233917236328125, -0.01779937744140625, -0.01220703125, -0.00661468505859375, -0.0010223388671875, 0.00457000732421875, 0.010162353515625, 0.01575469970703125, 0.0213470458984375, 0.02693939208984375, 0.03253173828125, 0.03812408447265625, 0.0437164306640625, 0.04930877685546875, 0.054901123046875, 0.06049346923828125, 0.0660858154296875, 0.07167816162109375, 0.0772705078125, 0.08286285400390625, 0.0884552001953125, 0.09404754638671875, 0.099639892578125, 0.10523223876953125, 0.1108245849609375, 0.11641693115234375, 0.12200927734375, 0.12760162353515625, 0.1331939697265625, 0.13878631591796875, 0.144378662109375, 0.14997100830078125, 0.1555633544921875, 0.16115570068359375, 0.166748046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 1.0, 5.0, 9.0, 12.0, 14.0, 20.0, 22.0, 25.0, 29.0, 35.0, 44.0, 47.0, 51.0, 41.0, 68.0, 55.0, 52.0, 54.0, 60.0, 46.0, 44.0, 42.0, 38.0, 31.0, 38.0, 26.0, 15.0, 16.0, 9.0, 9.0, 8.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1427001953125, -0.13742446899414062, -0.13214874267578125, -0.12687301635742188, -0.1215972900390625, -0.11632156372070312, -0.11104583740234375, -0.10577011108398438, -0.100494384765625, -0.09521865844726562, -0.08994293212890625, -0.08466720581054688, -0.0793914794921875, -0.07411575317382812, -0.06884002685546875, -0.06356430053710938, -0.05828857421875, -0.053012847900390625, -0.04773712158203125, -0.042461395263671875, -0.0371856689453125, -0.031909942626953125, -0.02663421630859375, -0.021358489990234375, -0.016082763671875, -0.010807037353515625, -0.00553131103515625, -0.000255584716796875, 0.0050201416015625, 0.010295867919921875, 0.01557159423828125, 0.020847320556640625, 0.026123046875, 0.031398773193359375, 0.03667449951171875, 0.041950225830078125, 0.0472259521484375, 0.052501678466796875, 0.05777740478515625, 0.06305313110351562, 0.068328857421875, 0.07360458374023438, 0.07888031005859375, 0.08415603637695312, 0.0894317626953125, 0.09470748901367188, 0.09998321533203125, 0.10525894165039062, 0.11053466796875, 0.11581039428710938, 0.12108612060546875, 0.12636184692382812, 0.1316375732421875, 0.13691329956054688, 0.14218902587890625, 0.14746475219726562, 0.152740478515625, 0.15801620483398438, 0.16329193115234375, 0.16856765747070312, 0.1738433837890625, 0.17911911010742188, 0.18439483642578125, 0.18967056274414062, 0.1949462890625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 12.0, 10.0, 25.0, 36.0, 45.0, 51.0, 95.0, 130.0, 149.0, 245.0, 388.0, 571.0, 888.0, 1137.0, 1822.0, 3033.0, 4674.0, 7459.0, 12736.0, 23404.0, 49899.0, 123629.0, 319490.0, 292001.0, 108253.0, 44857.0, 21913.0, 11864.0, 7073.0, 4432.0, 2830.0, 1751.0, 1215.0, 759.0, 531.0, 380.0, 233.0, 155.0, 122.0, 73.0, 55.0, 45.0, 31.0, 19.0, 11.0, 3.0, 8.0, 2.0, 9.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0650634765625, -0.06289005279541016, -0.06071662902832031, -0.05854320526123047, -0.056369781494140625, -0.05419635772705078, -0.05202293395996094, -0.049849510192871094, -0.04767608642578125, -0.045502662658691406, -0.04332923889160156, -0.04115581512451172, -0.038982391357421875, -0.03680896759033203, -0.03463554382324219, -0.032462120056152344, -0.0302886962890625, -0.028115272521972656, -0.025941848754882812, -0.02376842498779297, -0.021595001220703125, -0.01942157745361328, -0.017248153686523438, -0.015074729919433594, -0.01290130615234375, -0.010727882385253906, -0.008554458618164062, -0.006381034851074219, -0.004207611083984375, -0.0020341873168945312, 0.0001392364501953125, 0.0023126602172851562, 0.004486083984375, 0.006659507751464844, 0.008832931518554688, 0.011006355285644531, 0.013179779052734375, 0.015353202819824219, 0.017526626586914062, 0.019700050354003906, 0.02187347412109375, 0.024046897888183594, 0.026220321655273438, 0.02839374542236328, 0.030567169189453125, 0.03274059295654297, 0.03491401672363281, 0.037087440490722656, 0.0392608642578125, 0.041434288024902344, 0.04360771179199219, 0.04578113555908203, 0.047954559326171875, 0.05012798309326172, 0.05230140686035156, 0.054474830627441406, 0.05664825439453125, 0.058821678161621094, 0.06099510192871094, 0.06316852569580078, 0.06534194946289062, 0.06751537322998047, 0.06968879699707031, 0.07186222076416016, 0.07403564453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 2.0, 6.0, 4.0, 6.0, 11.0, 19.0, 21.0, 29.0, 42.0, 63.0, 95.0, 113.0, 121.0, 114.0, 99.0, 67.0, 48.0, 34.0, 33.0, 15.0, 6.0, 14.0, 10.0, 8.0, 4.0, 3.0, 2.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.695487976074219e-05, -3.592390567064285e-05, -3.489293158054352e-05, -3.386195749044418e-05, -3.283098340034485e-05, -3.1800009310245514e-05, -3.076903522014618e-05, -2.9738061130046844e-05, -2.870708703994751e-05, -2.7676112949848175e-05, -2.664513885974884e-05, -2.5614164769649506e-05, -2.458319067955017e-05, -2.3552216589450836e-05, -2.25212424993515e-05, -2.1490268409252167e-05, -2.0459294319152832e-05, -1.9428320229053497e-05, -1.8397346138954163e-05, -1.7366372048854828e-05, -1.6335397958755493e-05, -1.530442386865616e-05, -1.4273449778556824e-05, -1.3242475688457489e-05, -1.2211501598358154e-05, -1.118052750825882e-05, -1.0149553418159485e-05, -9.11857932806015e-06, -8.087605237960815e-06, -7.056631147861481e-06, -6.025657057762146e-06, -4.994682967662811e-06, -3.9637088775634766e-06, -2.932734787464142e-06, -1.9017606973648071e-06, -8.707866072654724e-07, 1.601874828338623e-07, 1.191161572933197e-06, 2.2221356630325317e-06, 3.2531097531318665e-06, 4.284083843231201e-06, 5.315057933330536e-06, 6.346032023429871e-06, 7.377006113529205e-06, 8.40798020362854e-06, 9.438954293727875e-06, 1.046992838382721e-05, 1.1500902473926544e-05, 1.2531876564025879e-05, 1.3562850654125214e-05, 1.4593824744224548e-05, 1.5624798834323883e-05, 1.6655772924423218e-05, 1.7686747014522552e-05, 1.8717721104621887e-05, 1.9748695194721222e-05, 2.0779669284820557e-05, 2.181064337491989e-05, 2.2841617465019226e-05, 2.387259155511856e-05, 2.4903565645217896e-05, 2.593453973531723e-05, 2.6965513825416565e-05, 2.79964879155159e-05, 2.9027462005615234e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 3.0, 1.0, 4.0, 11.0, 10.0, 24.0, 32.0, 32.0, 50.0, 78.0, 143.0, 291.0, 436.0, 755.0, 1377.0, 2396.0, 4495.0, 8617.0, 16971.0, 37266.0, 97999.0, 307272.0, 364069.0, 120938.0, 44299.0, 19881.0, 9618.0, 5152.0, 2726.0, 1559.0, 852.0, 484.0, 261.0, 171.0, 108.0, 59.0, 43.0, 30.0, 5.0, 11.0, 5.0, 9.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.08197021484375, -0.07949352264404297, -0.07701683044433594, -0.0745401382446289, -0.07206344604492188, -0.06958675384521484, -0.06711006164550781, -0.06463336944580078, -0.06215667724609375, -0.05967998504638672, -0.05720329284667969, -0.054726600646972656, -0.052249908447265625, -0.049773216247558594, -0.04729652404785156, -0.04481983184814453, -0.0423431396484375, -0.03986644744873047, -0.03738975524902344, -0.034913063049316406, -0.032436370849609375, -0.029959678649902344, -0.027482986450195312, -0.02500629425048828, -0.02252960205078125, -0.02005290985107422, -0.017576217651367188, -0.015099525451660156, -0.012622833251953125, -0.010146141052246094, -0.0076694488525390625, -0.005192756652832031, -0.002716064453125, -0.00023937225341796875, 0.0022373199462890625, 0.004714012145996094, 0.007190704345703125, 0.009667396545410156, 0.012144088745117188, 0.014620780944824219, 0.01709747314453125, 0.01957416534423828, 0.022050857543945312, 0.024527549743652344, 0.027004241943359375, 0.029480934143066406, 0.03195762634277344, 0.03443431854248047, 0.0369110107421875, 0.03938770294189453, 0.04186439514160156, 0.044341087341308594, 0.046817779541015625, 0.049294471740722656, 0.05177116394042969, 0.05424785614013672, 0.05672454833984375, 0.05920124053955078, 0.06167793273925781, 0.06415462493896484, 0.06663131713867188, 0.0691080093383789, 0.07158470153808594, 0.07406139373779297, 0.0765380859375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 4.0, 1.0, 3.0, 4.0, 7.0, 8.0, 11.0, 9.0, 22.0, 24.0, 33.0, 32.0, 49.0, 83.0, 113.0, 103.0, 113.0, 92.0, 61.0, 54.0, 37.0, 28.0, 15.0, 25.0, 17.0, 6.0, 2.0, 4.0, 8.0, 1.0, 5.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060302734375, -0.05787849426269531, -0.055454254150390625, -0.05303001403808594, -0.05060577392578125, -0.04818153381347656, -0.045757293701171875, -0.04333305358886719, -0.0409088134765625, -0.03848457336425781, -0.036060333251953125, -0.03363609313964844, -0.03121185302734375, -0.028787612915039062, -0.026363372802734375, -0.023939132690429688, -0.021514892578125, -0.019090652465820312, -0.016666412353515625, -0.014242172241210938, -0.01181793212890625, -0.009393692016601562, -0.006969451904296875, -0.0045452117919921875, -0.0021209716796875, 0.0003032684326171875, 0.002727508544921875, 0.0051517486572265625, 0.00757598876953125, 0.010000228881835938, 0.012424468994140625, 0.014848709106445312, 0.01727294921875, 0.019697189331054688, 0.022121429443359375, 0.024545669555664062, 0.02696990966796875, 0.029394149780273438, 0.031818389892578125, 0.03424263000488281, 0.0366668701171875, 0.03909111022949219, 0.041515350341796875, 0.04393959045410156, 0.04636383056640625, 0.04878807067871094, 0.051212310791015625, 0.05363655090332031, 0.056060791015625, 0.05848503112792969, 0.060909271240234375, 0.06333351135253906, 0.06575775146484375, 0.06818199157714844, 0.07060623168945312, 0.07303047180175781, 0.0754547119140625, 0.07787895202636719, 0.08030319213867188, 0.08272743225097656, 0.08515167236328125, 0.08757591247558594, 0.09000015258789062, 0.09242439270019531, 0.0948486328125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 9.0, 31.0, 36.0, 47.0, 83.0, 84.0, 104.0, 108.0, 101.0, 81.0, 95.0, 70.0, 55.0, 35.0, 27.0, 12.0, 10.0, 3.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8598827123641968, -0.8337026834487915, -0.8075226545333862, -0.781342625617981, -0.7551625967025757, -0.7289825677871704, -0.7028025388717651, -0.6766225695610046, -0.6504425406455994, -0.6242625117301941, -0.5980824828147888, -0.5719024538993835, -0.5457224249839783, -0.5195424556732178, -0.4933623969554901, -0.4671823978424072, -0.44100233912467957, -0.4148223102092743, -0.388642281293869, -0.36246228218078613, -0.33628225326538086, -0.3101022243499756, -0.2839221954345703, -0.25774216651916504, -0.23156215250492096, -0.20538212358951569, -0.1792021095752716, -0.15302208065986633, -0.12684205174446106, -0.10066203773021698, -0.0744820088148117, -0.04830199480056763, -0.022121965885162354, 0.004058057442307472, 0.030238080769777298, 0.05641810595989227, 0.08259812742471695, 0.10877814888954163, 0.1349581778049469, 0.16113819181919098, 0.18731822073459625, 0.21349824965000153, 0.2396782636642456, 0.2658582925796509, 0.29203832149505615, 0.3182183504104614, 0.3443983793258667, 0.3705783784389496, 0.39675840735435486, 0.42293843626976013, 0.4491184651851654, 0.4752984642982483, 0.5014784932136536, 0.5276585221290588, 0.5538385510444641, 0.5800185799598694, 0.6061986088752747, 0.6323786377906799, 0.6585586667060852, 0.6847386956214905, 0.7109187245368958, 0.7370986938476562, 0.7632787227630615, 0.7894587516784668, 0.8156387805938721]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 7.0, 9.0, 11.0, 9.0, 11.0, 9.0, 25.0, 14.0, 18.0, 25.0, 31.0, 31.0, 46.0, 39.0, 37.0, 51.0, 36.0, 49.0, 51.0, 58.0, 48.0, 51.0, 34.0, 33.0, 31.0, 22.0, 29.0, 34.0, 24.0, 16.0, 15.0, 15.0, 14.0, 16.0, 10.0, 8.0, 6.0, 5.0, 10.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4427749514579773, -0.42767900228500366, -0.41258305311203003, -0.3974871039390564, -0.38239115476608276, -0.36729520559310913, -0.3521992564201355, -0.33710330724716187, -0.32200735807418823, -0.3069114089012146, -0.29181545972824097, -0.27671951055526733, -0.2616235613822937, -0.24652761220932007, -0.23143166303634644, -0.2163357138633728, -0.20123976469039917, -0.18614381551742554, -0.1710478663444519, -0.15595191717147827, -0.14085596799850464, -0.125760018825531, -0.11066406965255737, -0.09556812047958374, -0.08047217130661011, -0.06537622213363647, -0.05028027296066284, -0.03518432378768921, -0.020088374614715576, -0.004992425441741943, 0.01010352373123169, 0.025199472904205322, 0.040295422077178955, 0.05539137125015259, 0.07048732042312622, 0.08558326959609985, 0.10067921876907349, 0.11577516794204712, 0.13087111711502075, 0.14596706628799438, 0.16106301546096802, 0.17615896463394165, 0.19125491380691528, 0.20635086297988892, 0.22144681215286255, 0.23654276132583618, 0.2516387104988098, 0.26673465967178345, 0.2818306088447571, 0.2969265580177307, 0.31202250719070435, 0.327118456363678, 0.3422144055366516, 0.35731035470962524, 0.3724063038825989, 0.3875022530555725, 0.40259820222854614, 0.4176941514015198, 0.4327901005744934, 0.44788604974746704, 0.4629819989204407, 0.4780779480934143, 0.49317389726638794, 0.5082698464393616, 0.5233657956123352]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 4.0, 3.0, 8.0, 12.0, 18.0, 16.0, 33.0, 40.0, 36.0, 95.0, 147.0, 211.0, 387.0, 834.0, 1630.0, 3543.0, 7968.0, 19611.0, 54217.0, 166838.0, 585706.0, 2099991.0, 893605.0, 238332.0, 75262.0, 26640.0, 10369.0, 4436.0, 2047.0, 970.0, 530.0, 271.0, 175.0, 84.0, 44.0, 47.0, 32.0, 24.0, 23.0, 14.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08782958984375, -0.08505439758300781, -0.08227920532226562, -0.07950401306152344, -0.07672882080078125, -0.07395362854003906, -0.07117843627929688, -0.06840324401855469, -0.0656280517578125, -0.06285285949707031, -0.060077667236328125, -0.05730247497558594, -0.05452728271484375, -0.05175209045410156, -0.048976898193359375, -0.04620170593261719, -0.043426513671875, -0.04065132141113281, -0.037876129150390625, -0.03510093688964844, -0.03232574462890625, -0.029550552368164062, -0.026775360107421875, -0.024000167846679688, -0.0212249755859375, -0.018449783325195312, -0.015674591064453125, -0.012899398803710938, -0.01012420654296875, -0.0073490142822265625, -0.004573822021484375, -0.0017986297607421875, 0.0009765625, 0.0037517547607421875, 0.006526947021484375, 0.009302139282226562, 0.01207733154296875, 0.014852523803710938, 0.017627716064453125, 0.020402908325195312, 0.0231781005859375, 0.025953292846679688, 0.028728485107421875, 0.03150367736816406, 0.03427886962890625, 0.03705406188964844, 0.039829254150390625, 0.04260444641113281, 0.045379638671875, 0.04815483093261719, 0.050930023193359375, 0.05370521545410156, 0.05648040771484375, 0.05925559997558594, 0.062030792236328125, 0.06480598449707031, 0.0675811767578125, 0.07035636901855469, 0.07313156127929688, 0.07590675354003906, 0.07868194580078125, 0.08145713806152344, 0.08423233032226562, 0.08700752258300781, 0.08978271484375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 1.0, 9.0, 6.0, 10.0, 5.0, 11.0, 14.0, 12.0, 11.0, 15.0, 23.0, 37.0, 33.0, 32.0, 33.0, 29.0, 25.0, 31.0, 41.0, 37.0, 39.0, 40.0, 40.0, 41.0, 43.0, 44.0, 36.0, 37.0, 26.0, 32.0, 25.0, 17.0, 13.0, 18.0, 29.0, 8.0, 14.0, 16.0, 13.0, 13.0, 5.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.04180908203125, -0.040454864501953125, -0.03910064697265625, -0.037746429443359375, -0.0363922119140625, -0.035037994384765625, -0.03368377685546875, -0.032329559326171875, -0.030975341796875, -0.029621124267578125, -0.02826690673828125, -0.026912689208984375, -0.0255584716796875, -0.024204254150390625, -0.02285003662109375, -0.021495819091796875, -0.0201416015625, -0.018787384033203125, -0.01743316650390625, -0.016078948974609375, -0.0147247314453125, -0.013370513916015625, -0.01201629638671875, -0.010662078857421875, -0.009307861328125, -0.007953643798828125, -0.00659942626953125, -0.005245208740234375, -0.0038909912109375, -0.002536773681640625, -0.00118255615234375, 0.000171661376953125, 0.00152587890625, 0.002880096435546875, 0.00423431396484375, 0.005588531494140625, 0.0069427490234375, 0.008296966552734375, 0.00965118408203125, 0.011005401611328125, 0.012359619140625, 0.013713836669921875, 0.01506805419921875, 0.016422271728515625, 0.0177764892578125, 0.019130706787109375, 0.02048492431640625, 0.021839141845703125, 0.023193359375, 0.024547576904296875, 0.02590179443359375, 0.027256011962890625, 0.0286102294921875, 0.029964447021484375, 0.03131866455078125, 0.032672882080078125, 0.034027099609375, 0.035381317138671875, 0.03673553466796875, 0.038089752197265625, 0.0394439697265625, 0.040798187255859375, 0.04215240478515625, 0.043506622314453125, 0.04486083984375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 10.0, 11.0, 15.0, 23.0, 37.0, 51.0, 76.0, 122.0, 185.0, 266.0, 407.0, 734.0, 1049.0, 1865.0, 3435.0, 6957.0, 14600.0, 35683.0, 97855.0, 304375.0, 1044738.0, 1797520.0, 597075.0, 180202.0, 61229.0, 23697.0, 10363.0, 5070.0, 2749.0, 1422.0, 902.0, 555.0, 360.0, 238.0, 146.0, 82.0, 58.0, 33.0, 24.0, 25.0, 7.0, 10.0, 8.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.14794921875, -0.1436328887939453, -0.13931655883789062, -0.13500022888183594, -0.13068389892578125, -0.12636756896972656, -0.12205123901367188, -0.11773490905761719, -0.1134185791015625, -0.10910224914550781, -0.10478591918945312, -0.10046958923339844, -0.09615325927734375, -0.09183692932128906, -0.08752059936523438, -0.08320426940917969, -0.078887939453125, -0.07457160949707031, -0.07025527954101562, -0.06593894958496094, -0.06162261962890625, -0.05730628967285156, -0.052989959716796875, -0.04867362976074219, -0.0443572998046875, -0.04004096984863281, -0.035724639892578125, -0.03140830993652344, -0.02709197998046875, -0.022775650024414062, -0.018459320068359375, -0.014142990112304688, -0.00982666015625, -0.0055103302001953125, -0.001194000244140625, 0.0031223297119140625, 0.00743865966796875, 0.011754989624023438, 0.016071319580078125, 0.020387649536132812, 0.0247039794921875, 0.029020309448242188, 0.033336639404296875, 0.03765296936035156, 0.04196929931640625, 0.04628562927246094, 0.050601959228515625, 0.05491828918457031, 0.059234619140625, 0.06355094909667969, 0.06786727905273438, 0.07218360900878906, 0.07649993896484375, 0.08081626892089844, 0.08513259887695312, 0.08944892883300781, 0.0937652587890625, 0.09808158874511719, 0.10239791870117188, 0.10671424865722656, 0.11103057861328125, 0.11534690856933594, 0.11966323852539062, 0.12397956848144531, 0.1282958984375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 5.0, 10.0, 17.0, 28.0, 37.0, 63.0, 109.0, 143.0, 214.0, 328.0, 488.0, 661.0, 582.0, 425.0, 292.0, 230.0, 132.0, 92.0, 68.0, 46.0, 26.0, 20.0, 23.0, 9.0, 2.0, 6.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1395263671875, -0.1352863311767578, -0.13104629516601562, -0.12680625915527344, -0.12256622314453125, -0.11832618713378906, -0.11408615112304688, -0.10984611511230469, -0.1056060791015625, -0.10136604309082031, -0.09712600708007812, -0.09288597106933594, -0.08864593505859375, -0.08440589904785156, -0.08016586303710938, -0.07592582702636719, -0.071685791015625, -0.06744575500488281, -0.06320571899414062, -0.05896568298339844, -0.05472564697265625, -0.05048561096191406, -0.046245574951171875, -0.04200553894042969, -0.0377655029296875, -0.03352546691894531, -0.029285430908203125, -0.025045394897460938, -0.02080535888671875, -0.016565322875976562, -0.012325286865234375, -0.008085250854492188, -0.00384521484375, 0.0003948211669921875, 0.004634857177734375, 0.008874893188476562, 0.01311492919921875, 0.017354965209960938, 0.021595001220703125, 0.025835037231445312, 0.0300750732421875, 0.03431510925292969, 0.038555145263671875, 0.04279518127441406, 0.04703521728515625, 0.05127525329589844, 0.055515289306640625, 0.05975532531738281, 0.063995361328125, 0.06823539733886719, 0.07247543334960938, 0.07671546936035156, 0.08095550537109375, 0.08519554138183594, 0.08943557739257812, 0.09367561340332031, 0.0979156494140625, 0.10215568542480469, 0.10639572143554688, 0.11063575744628906, 0.11487579345703125, 0.11911582946777344, 0.12335586547851562, 0.1275959014892578, 0.1318359375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 23.0, 22.0, 25.0, 41.0, 53.0, 75.0, 103.0, 104.0, 95.0, 95.0, 103.0, 86.0, 49.0, 42.0, 24.0, 25.0, 15.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.9626626968383789, -0.9405006766319275, -0.9183386564254761, -0.8961766958236694, -0.874014675617218, -0.8518526554107666, -0.8296906352043152, -0.8075286149978638, -0.7853665947914124, -0.7632045745849609, -0.7410425543785095, -0.7188805341720581, -0.6967185735702515, -0.6745565533638, -0.6523945331573486, -0.6302325129508972, -0.6080704927444458, -0.5859084725379944, -0.563746452331543, -0.5415844917297363, -0.5194224715232849, -0.4972604513168335, -0.4750984311103821, -0.45293641090393066, -0.430774450302124, -0.4086124300956726, -0.3864504396915436, -0.36428841948509216, -0.34212639927864075, -0.3199644088745117, -0.2978023886680603, -0.2756403684616089, -0.25347837805747986, -0.23131637275218964, -0.20915435254573822, -0.186992347240448, -0.16483032703399658, -0.14266832172870636, -0.12050631642341614, -0.09834429621696472, -0.0761822909116745, -0.05402027815580368, -0.03185826912522316, -0.00969626009464264, 0.01246575266122818, 0.034627765417099, 0.05678977072238922, 0.07895179092884064, 0.10111379623413086, 0.12327580899000168, 0.1454378217458725, 0.16759982705116272, 0.18976184725761414, 0.21192385256290436, 0.23408585786819458, 0.256247878074646, 0.2784098982810974, 0.30057191848754883, 0.32273390889167786, 0.3448959290981293, 0.3670579493045807, 0.3892199397087097, 0.41138195991516113, 0.43354398012161255, 0.4557059705257416]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 7.0, 10.0, 8.0, 9.0, 11.0, 14.0, 13.0, 23.0, 25.0, 13.0, 31.0, 32.0, 24.0, 35.0, 33.0, 29.0, 40.0, 51.0, 29.0, 49.0, 40.0, 56.0, 36.0, 33.0, 53.0, 37.0, 27.0, 33.0, 26.0, 25.0, 17.0, 21.0, 25.0, 17.0, 17.0, 13.0, 7.0, 7.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38853776454925537, -0.3764485716819763, -0.36435937881469727, -0.3522701561450958, -0.3401809632778168, -0.3280917704105377, -0.31600257754325867, -0.3039133548736572, -0.2918241620063782, -0.2797349691390991, -0.26764577627182007, -0.25555655360221863, -0.24346736073493958, -0.23137816786766052, -0.21928897500038147, -0.20719976723194122, -0.19511057436466217, -0.18302138149738312, -0.17093217372894287, -0.15884298086166382, -0.14675377309322357, -0.13466458022594452, -0.12257537990808487, -0.11048617959022522, -0.09839697927236557, -0.08630777895450592, -0.07421857863664627, -0.06212938204407692, -0.05004018172621727, -0.03795098140835762, -0.02586178481578827, -0.01377258449792862, -0.0016833841800689697, 0.010405815206468105, 0.02249501459300518, 0.03458421304821968, 0.04667341336607933, 0.05876261368393898, 0.07085181027650833, 0.08294101059436798, 0.09503021091222763, 0.10711941123008728, 0.11920861154794693, 0.13129781186580658, 0.14338700473308563, 0.15547621250152588, 0.16756540536880493, 0.17965459823608398, 0.19174380600452423, 0.20383299887180328, 0.21592220664024353, 0.22801139950752258, 0.24010060727596283, 0.2521898150444031, 0.26427900791168213, 0.2763682007789612, 0.28845739364624023, 0.3005465865135193, 0.31263577938079834, 0.3247250020503998, 0.33681419491767883, 0.3489033877849579, 0.36099258065223694, 0.3730818033218384, 0.38517099618911743]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 10.0, 14.0, 32.0, 27.0, 47.0, 75.0, 121.0, 162.0, 267.0, 365.0, 673.0, 920.0, 1428.0, 2164.0, 3259.0, 5053.0, 7705.0, 11786.0, 18867.0, 30571.0, 53824.0, 110640.0, 247791.0, 272526.0, 129274.0, 60261.0, 33535.0, 20314.0, 12883.0, 8240.0, 5335.0, 3633.0, 2281.0, 1506.0, 1026.0, 644.0, 437.0, 300.0, 190.0, 114.0, 103.0, 58.0, 30.0, 19.0, 17.0, 13.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.087158203125, -0.08452415466308594, -0.08189010620117188, -0.07925605773925781, -0.07662200927734375, -0.07398796081542969, -0.07135391235351562, -0.06871986389160156, -0.0660858154296875, -0.06345176696777344, -0.060817718505859375, -0.05818367004394531, -0.05554962158203125, -0.05291557312011719, -0.050281524658203125, -0.04764747619628906, -0.045013427734375, -0.04237937927246094, -0.039745330810546875, -0.03711128234863281, -0.03447723388671875, -0.03184318542480469, -0.029209136962890625, -0.026575088500976562, -0.0239410400390625, -0.021306991577148438, -0.018672943115234375, -0.016038894653320312, -0.01340484619140625, -0.010770797729492188, -0.008136749267578125, -0.0055027008056640625, -0.00286865234375, -0.0002346038818359375, 0.002399444580078125, 0.0050334930419921875, 0.00766754150390625, 0.010301589965820312, 0.012935638427734375, 0.015569686889648438, 0.0182037353515625, 0.020837783813476562, 0.023471832275390625, 0.026105880737304688, 0.02873992919921875, 0.03137397766113281, 0.034008026123046875, 0.03664207458496094, 0.039276123046875, 0.04191017150878906, 0.044544219970703125, 0.04717826843261719, 0.04981231689453125, 0.05244636535644531, 0.055080413818359375, 0.05771446228027344, 0.0603485107421875, 0.06298255920410156, 0.06561660766601562, 0.06825065612792969, 0.07088470458984375, 0.07351875305175781, 0.07615280151367188, 0.07878684997558594, 0.0814208984375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 9.0, 13.0, 8.0, 13.0, 9.0, 16.0, 14.0, 18.0, 20.0, 23.0, 19.0, 15.0, 32.0, 24.0, 30.0, 35.0, 31.0, 31.0, 30.0, 39.0, 36.0, 32.0, 43.0, 39.0, 30.0, 30.0, 37.0, 30.0, 28.0, 37.0, 35.0, 20.0, 18.0, 18.0, 25.0, 18.0, 7.0, 13.0, 12.0, 9.0, 9.0, 9.0, 4.0, 7.0, 5.0, 5.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.045318603515625, -0.04390239715576172, -0.04248619079589844, -0.041069984436035156, -0.039653778076171875, -0.038237571716308594, -0.03682136535644531, -0.03540515899658203, -0.03398895263671875, -0.03257274627685547, -0.031156539916992188, -0.029740333557128906, -0.028324127197265625, -0.026907920837402344, -0.025491714477539062, -0.02407550811767578, -0.0226593017578125, -0.02124309539794922, -0.019826889038085938, -0.018410682678222656, -0.016994476318359375, -0.015578269958496094, -0.014162063598632812, -0.012745857238769531, -0.01132965087890625, -0.009913444519042969, -0.008497238159179688, -0.007081031799316406, -0.005664825439453125, -0.004248619079589844, -0.0028324127197265625, -0.0014162063598632812, 0.0, 0.0014162063598632812, 0.0028324127197265625, 0.004248619079589844, 0.005664825439453125, 0.007081031799316406, 0.008497238159179688, 0.009913444519042969, 0.01132965087890625, 0.012745857238769531, 0.014162063598632812, 0.015578269958496094, 0.016994476318359375, 0.018410682678222656, 0.019826889038085938, 0.02124309539794922, 0.0226593017578125, 0.02407550811767578, 0.025491714477539062, 0.026907920837402344, 0.028324127197265625, 0.029740333557128906, 0.031156539916992188, 0.03257274627685547, 0.03398895263671875, 0.03540515899658203, 0.03682136535644531, 0.038237571716308594, 0.039653778076171875, 0.041069984436035156, 0.04248619079589844, 0.04390239715576172, 0.045318603515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 12.0, 14.0, 17.0, 10.0, 26.0, 43.0, 57.0, 75.0, 134.0, 180.0, 307.0, 573.0, 1218.0, 2877.0, 7771.0, 21162.0, 64185.0, 377792.0, 460510.0, 73009.0, 23738.0, 8600.0, 3268.0, 1317.0, 653.0, 350.0, 182.0, 130.0, 93.0, 73.0, 51.0, 25.0, 24.0, 17.0, 15.0, 8.0, 7.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2099609375, -0.20247650146484375, -0.1949920654296875, -0.18750762939453125, -0.180023193359375, -0.17253875732421875, -0.1650543212890625, -0.15756988525390625, -0.15008544921875, -0.14260101318359375, -0.1351165771484375, -0.12763214111328125, -0.120147705078125, -0.11266326904296875, -0.1051788330078125, -0.09769439697265625, -0.0902099609375, -0.08272552490234375, -0.0752410888671875, -0.06775665283203125, -0.060272216796875, -0.05278778076171875, -0.0453033447265625, -0.03781890869140625, -0.03033447265625, -0.02285003662109375, -0.0153656005859375, -0.00788116455078125, -0.000396728515625, 0.00708770751953125, 0.0145721435546875, 0.02205657958984375, 0.029541015625, 0.03702545166015625, 0.0445098876953125, 0.05199432373046875, 0.059478759765625, 0.06696319580078125, 0.0744476318359375, 0.08193206787109375, 0.08941650390625, 0.09690093994140625, 0.1043853759765625, 0.11186981201171875, 0.119354248046875, 0.12683868408203125, 0.1343231201171875, 0.14180755615234375, 0.1492919921875, 0.15677642822265625, 0.1642608642578125, 0.17174530029296875, 0.179229736328125, 0.18671417236328125, 0.1941986083984375, 0.20168304443359375, 0.20916748046875, 0.21665191650390625, 0.2241363525390625, 0.23162078857421875, 0.239105224609375, 0.24658966064453125, 0.2540740966796875, 0.26155853271484375, 0.26904296875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 8.0, 5.0, 12.0, 12.0, 9.0, 19.0, 20.0, 25.0, 30.0, 43.0, 42.0, 48.0, 41.0, 64.0, 57.0, 63.0, 39.0, 60.0, 49.0, 72.0, 41.0, 45.0, 39.0, 31.0, 24.0, 13.0, 19.0, 11.0, 9.0, 11.0, 5.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.205322265625, -0.19861412048339844, -0.19190597534179688, -0.1851978302001953, -0.17848968505859375, -0.1717815399169922, -0.16507339477539062, -0.15836524963378906, -0.1516571044921875, -0.14494895935058594, -0.13824081420898438, -0.1315326690673828, -0.12482452392578125, -0.11811637878417969, -0.11140823364257812, -0.10470008850097656, -0.097991943359375, -0.09128379821777344, -0.08457565307617188, -0.07786750793457031, -0.07115936279296875, -0.06445121765136719, -0.057743072509765625, -0.05103492736816406, -0.0443267822265625, -0.03761863708496094, -0.030910491943359375, -0.024202346801757812, -0.01749420166015625, -0.010786056518554688, -0.004077911376953125, 0.0026302337646484375, 0.00933837890625, 0.016046524047851562, 0.022754669189453125, 0.029462814331054688, 0.03617095947265625, 0.04287910461425781, 0.049587249755859375, 0.05629539489746094, 0.0630035400390625, 0.06971168518066406, 0.07641983032226562, 0.08312797546386719, 0.08983612060546875, 0.09654426574707031, 0.10325241088867188, 0.10996055603027344, 0.116668701171875, 0.12337684631347656, 0.13008499145507812, 0.1367931365966797, 0.14350128173828125, 0.1502094268798828, 0.15691757202148438, 0.16362571716308594, 0.1703338623046875, 0.17704200744628906, 0.18375015258789062, 0.1904582977294922, 0.19716644287109375, 0.2038745880126953, 0.21058273315429688, 0.21729087829589844, 0.2239990234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 3.0, 10.0, 7.0, 24.0, 35.0, 36.0, 64.0, 81.0, 142.0, 211.0, 289.0, 476.0, 698.0, 1145.0, 1774.0, 3075.0, 4756.0, 7769.0, 12361.0, 19837.0, 33302.0, 74312.0, 261770.0, 395119.0, 122392.0, 44102.0, 24491.0, 15125.0, 9567.0, 5855.0, 3614.0, 2226.0, 1357.0, 852.0, 592.0, 351.0, 223.0, 156.0, 114.0, 75.0, 49.0, 35.0, 23.0, 21.0, 10.0, 13.0, 7.0, 3.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0584716796875, -0.05632305145263672, -0.05417442321777344, -0.052025794982910156, -0.049877166748046875, -0.047728538513183594, -0.04557991027832031, -0.04343128204345703, -0.04128265380859375, -0.03913402557373047, -0.03698539733886719, -0.034836769104003906, -0.032688140869140625, -0.030539512634277344, -0.028390884399414062, -0.02624225616455078, -0.0240936279296875, -0.02194499969482422, -0.019796371459960938, -0.017647743225097656, -0.015499114990234375, -0.013350486755371094, -0.011201858520507812, -0.009053230285644531, -0.00690460205078125, -0.004755973815917969, -0.0026073455810546875, -0.00045871734619140625, 0.001689910888671875, 0.0038385391235351562, 0.0059871673583984375, 0.008135795593261719, 0.010284423828125, 0.012433052062988281, 0.014581680297851562, 0.016730308532714844, 0.018878936767578125, 0.021027565002441406, 0.023176193237304688, 0.02532482147216797, 0.02747344970703125, 0.02962207794189453, 0.03177070617675781, 0.033919334411621094, 0.036067962646484375, 0.038216590881347656, 0.04036521911621094, 0.04251384735107422, 0.0446624755859375, 0.04681110382080078, 0.04895973205566406, 0.051108360290527344, 0.053256988525390625, 0.055405616760253906, 0.05755424499511719, 0.05970287322998047, 0.06185150146484375, 0.06400012969970703, 0.06614875793457031, 0.0682973861694336, 0.07044601440429688, 0.07259464263916016, 0.07474327087402344, 0.07689189910888672, 0.07904052734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 5.0, 3.0, 5.0, 11.0, 8.0, 8.0, 16.0, 20.0, 21.0, 34.0, 36.0, 58.0, 86.0, 100.0, 108.0, 113.0, 85.0, 76.0, 43.0, 32.0, 37.0, 21.0, 12.0, 11.0, 9.0, 7.0, 6.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.682209014892578e-05, -2.5998800992965698e-05, -2.5175511837005615e-05, -2.4352222681045532e-05, -2.352893352508545e-05, -2.2705644369125366e-05, -2.1882355213165283e-05, -2.10590660572052e-05, -2.0235776901245117e-05, -1.9412487745285034e-05, -1.858919858932495e-05, -1.7765909433364868e-05, -1.6942620277404785e-05, -1.6119331121444702e-05, -1.529604196548462e-05, -1.4472752809524536e-05, -1.3649463653564453e-05, -1.282617449760437e-05, -1.2002885341644287e-05, -1.1179596185684204e-05, -1.0356307029724121e-05, -9.533017873764038e-06, -8.709728717803955e-06, -7.886439561843872e-06, -7.063150405883789e-06, -6.239861249923706e-06, -5.416572093963623e-06, -4.59328293800354e-06, -3.769993782043457e-06, -2.946704626083374e-06, -2.123415470123291e-06, -1.300126314163208e-06, -4.76837158203125e-07, 3.46451997756958e-07, 1.169741153717041e-06, 1.993030309677124e-06, 2.816319465637207e-06, 3.63960862159729e-06, 4.462897777557373e-06, 5.286186933517456e-06, 6.109476089477539e-06, 6.932765245437622e-06, 7.756054401397705e-06, 8.579343557357788e-06, 9.402632713317871e-06, 1.0225921869277954e-05, 1.1049211025238037e-05, 1.187250018119812e-05, 1.2695789337158203e-05, 1.3519078493118286e-05, 1.4342367649078369e-05, 1.5165656805038452e-05, 1.5988945960998535e-05, 1.6812235116958618e-05, 1.76355242729187e-05, 1.8458813428878784e-05, 1.9282102584838867e-05, 2.010539174079895e-05, 2.0928680896759033e-05, 2.1751970052719116e-05, 2.25752592086792e-05, 2.3398548364639282e-05, 2.4221837520599365e-05, 2.5045126676559448e-05, 2.586841583251953e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 7.0, 16.0, 14.0, 31.0, 43.0, 61.0, 108.0, 202.0, 393.0, 845.0, 1692.0, 3623.0, 7988.0, 17789.0, 39648.0, 124409.0, 540585.0, 215740.0, 53739.0, 22516.0, 10217.0, 4653.0, 2135.0, 1021.0, 466.0, 256.0, 131.0, 67.0, 48.0, 28.0, 21.0, 13.0, 7.0, 3.0, 8.0, 0.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.09716796875, -0.09409904479980469, -0.09103012084960938, -0.08796119689941406, -0.08489227294921875, -0.08182334899902344, -0.07875442504882812, -0.07568550109863281, -0.0726165771484375, -0.06954765319824219, -0.06647872924804688, -0.06340980529785156, -0.06034088134765625, -0.05727195739746094, -0.054203033447265625, -0.05113410949707031, -0.048065185546875, -0.04499626159667969, -0.041927337646484375, -0.03885841369628906, -0.03578948974609375, -0.03272056579589844, -0.029651641845703125, -0.026582717895507812, -0.0235137939453125, -0.020444869995117188, -0.017375946044921875, -0.014307022094726562, -0.01123809814453125, -0.008169174194335938, -0.005100250244140625, -0.0020313262939453125, 0.00103759765625, 0.0041065216064453125, 0.007175445556640625, 0.010244369506835938, 0.01331329345703125, 0.016382217407226562, 0.019451141357421875, 0.022520065307617188, 0.0255889892578125, 0.028657913208007812, 0.031726837158203125, 0.03479576110839844, 0.03786468505859375, 0.04093360900878906, 0.044002532958984375, 0.04707145690917969, 0.050140380859375, 0.05320930480957031, 0.056278228759765625, 0.05934715270996094, 0.06241607666015625, 0.06548500061035156, 0.06855392456054688, 0.07162284851074219, 0.0746917724609375, 0.07776069641113281, 0.08082962036132812, 0.08389854431152344, 0.08696746826171875, 0.09003639221191406, 0.09310531616210938, 0.09617424011230469, 0.0992431640625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 11.0, 7.0, 5.0, 11.0, 6.0, 15.0, 14.0, 15.0, 24.0, 25.0, 46.0, 70.0, 93.0, 139.0, 116.0, 99.0, 73.0, 44.0, 28.0, 26.0, 26.0, 16.0, 16.0, 9.0, 11.0, 9.0, 3.0, 5.0, 4.0, 5.0, 6.0, 4.0, 4.0, 4.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07330322265625, -0.07108306884765625, -0.0688629150390625, -0.06664276123046875, -0.064422607421875, -0.06220245361328125, -0.0599822998046875, -0.05776214599609375, -0.0555419921875, -0.05332183837890625, -0.0511016845703125, -0.04888153076171875, -0.046661376953125, -0.04444122314453125, -0.0422210693359375, -0.04000091552734375, -0.03778076171875, -0.03556060791015625, -0.0333404541015625, -0.03112030029296875, -0.028900146484375, -0.02667999267578125, -0.0244598388671875, -0.02223968505859375, -0.02001953125, -0.01779937744140625, -0.0155792236328125, -0.01335906982421875, -0.011138916015625, -0.00891876220703125, -0.0066986083984375, -0.00447845458984375, -0.00225830078125, -3.814697265625e-05, 0.0021820068359375, 0.00440216064453125, 0.006622314453125, 0.00884246826171875, 0.0110626220703125, 0.01328277587890625, 0.0155029296875, 0.01772308349609375, 0.0199432373046875, 0.02216339111328125, 0.024383544921875, 0.02660369873046875, 0.0288238525390625, 0.03104400634765625, 0.03326416015625, 0.03548431396484375, 0.0377044677734375, 0.03992462158203125, 0.042144775390625, 0.04436492919921875, 0.0465850830078125, 0.04880523681640625, 0.051025390625, 0.05324554443359375, 0.0554656982421875, 0.05768585205078125, 0.059906005859375, 0.06212615966796875, 0.0643463134765625, 0.06656646728515625, 0.06878662109375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 5.0, 3.0, 12.0, 23.0, 22.0, 31.0, 32.0, 43.0, 56.0, 53.0, 62.0, 60.0, 72.0, 63.0, 63.0, 59.0, 68.0, 43.0, 37.0, 45.0, 20.0, 25.0, 26.0, 16.0, 12.0, 14.0, 4.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.5607216358184814, -0.5438344478607178, -0.5269472599029541, -0.5100600719451904, -0.49317285418510437, -0.4762856364250183, -0.45939844846725464, -0.44251126050949097, -0.4256240725517273, -0.4087368845939636, -0.39184966683387756, -0.3749624788761139, -0.3580752909183502, -0.34118807315826416, -0.3243008852005005, -0.3074136972427368, -0.29052647948265076, -0.2736392915248871, -0.256752073764801, -0.23986488580703735, -0.22297769784927368, -0.20609049499034882, -0.18920329213142395, -0.17231610417366028, -0.1554289013147354, -0.13854169845581055, -0.12165451049804688, -0.10476730763912201, -0.08788011223077774, -0.07099291682243347, -0.054105713963508606, -0.03721851855516434, -0.02033132314682007, -0.0034441258758306503, 0.013443071395158768, 0.030330270528793335, 0.047217465937137604, 0.06410466134548187, 0.08099186420440674, 0.09787905961275101, 0.11476625502109528, 0.13165345788002014, 0.1485406458377838, 0.16542784869670868, 0.18231505155563354, 0.19920223951339722, 0.21608944237232208, 0.23297664523124695, 0.24986383318901062, 0.2667510211467743, 0.28363823890686035, 0.300525426864624, 0.3174126148223877, 0.33429980278015137, 0.3511870205402374, 0.3680742084980011, 0.38496142625808716, 0.40184861421585083, 0.4187358319759369, 0.43562301993370056, 0.45251020789146423, 0.4693974256515503, 0.48628461360931396, 0.5031718015670776, 0.5200589895248413]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 9.0, 10.0, 9.0, 8.0, 10.0, 6.0, 14.0, 16.0, 21.0, 20.0, 21.0, 37.0, 37.0, 27.0, 43.0, 40.0, 28.0, 42.0, 51.0, 42.0, 48.0, 29.0, 31.0, 48.0, 30.0, 40.0, 31.0, 33.0, 26.0, 29.0, 28.0, 14.0, 17.0, 12.0, 16.0, 6.0, 15.0, 4.0, 10.0, 7.0, 9.0, 6.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47663402557373047, -0.4601837396621704, -0.44373345375061035, -0.4272831678390503, -0.41083288192749023, -0.3943825960159302, -0.3779323101043701, -0.36148202419281006, -0.34503173828125, -0.32858145236968994, -0.3121311664581299, -0.2956808805465698, -0.27923059463500977, -0.2627803087234497, -0.24633000791072845, -0.2298797219991684, -0.21342942118644714, -0.19697913527488708, -0.18052884936332703, -0.16407856345176697, -0.1476282775402069, -0.13117799162864685, -0.1147276908159256, -0.09827740490436554, -0.08182711899280548, -0.06537683308124542, -0.048926543444395065, -0.03247625380754471, -0.01602596789598465, 0.00042431801557540894, 0.016874611377716064, 0.03332489728927612, 0.04977518320083618, 0.06622546911239624, 0.0826757550239563, 0.09912604838609695, 0.11557633429765701, 0.13202661275863647, 0.14847691357135773, 0.16492719948291779, 0.18137748539447784, 0.1978277713060379, 0.21427805721759796, 0.2307283580303192, 0.24717864394187927, 0.26362892985343933, 0.2800792157649994, 0.29652950167655945, 0.3129797875881195, 0.32943007349967957, 0.3458803594112396, 0.3623306453227997, 0.37878093123435974, 0.3952312171459198, 0.41168153285980225, 0.4281318187713623, 0.44458210468292236, 0.4610323905944824, 0.4774826765060425, 0.49393296241760254, 0.5103832483291626, 0.5268335342407227, 0.5432838201522827, 0.5597341060638428, 0.5761843919754028]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 12.0, 15.0, 22.0, 30.0, 28.0, 70.0, 81.0, 122.0, 212.0, 334.0, 617.0, 1127.0, 2143.0, 4339.0, 9568.0, 21350.0, 53323.0, 146734.0, 470893.0, 2121021.0, 962886.0, 252052.0, 86499.0, 33570.0, 14094.0, 6444.0, 3070.0, 1538.0, 827.0, 459.0, 298.0, 163.0, 111.0, 65.0, 38.0, 33.0, 24.0, 17.0, 14.0, 8.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.11907958984375, -0.11583900451660156, -0.11259841918945312, -0.10935783386230469, -0.10611724853515625, -0.10287666320800781, -0.09963607788085938, -0.09639549255371094, -0.0931549072265625, -0.08991432189941406, -0.08667373657226562, -0.08343315124511719, -0.08019256591796875, -0.07695198059082031, -0.07371139526367188, -0.07047080993652344, -0.067230224609375, -0.06398963928222656, -0.060749053955078125, -0.05750846862792969, -0.05426788330078125, -0.05102729797363281, -0.047786712646484375, -0.04454612731933594, -0.0413055419921875, -0.03806495666503906, -0.034824371337890625, -0.03158378601074219, -0.02834320068359375, -0.025102615356445312, -0.021862030029296875, -0.018621444702148438, -0.015380859375, -0.012140274047851562, -0.008899688720703125, -0.0056591033935546875, -0.00241851806640625, 0.0008220672607421875, 0.004062652587890625, 0.0073032379150390625, 0.0105438232421875, 0.013784408569335938, 0.017024993896484375, 0.020265579223632812, 0.02350616455078125, 0.026746749877929688, 0.029987335205078125, 0.03322792053222656, 0.036468505859375, 0.03970909118652344, 0.042949676513671875, 0.04619026184082031, 0.04943084716796875, 0.05267143249511719, 0.055912017822265625, 0.05915260314941406, 0.0623931884765625, 0.06563377380371094, 0.06887435913085938, 0.07211494445800781, 0.07535552978515625, 0.07859611511230469, 0.08183670043945312, 0.08507728576660156, 0.08831787109375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 11.0, 11.0, 14.0, 19.0, 22.0, 15.0, 16.0, 28.0, 28.0, 37.0, 47.0, 32.0, 44.0, 53.0, 40.0, 36.0, 58.0, 55.0, 50.0, 52.0, 41.0, 45.0, 32.0, 29.0, 35.0, 27.0, 33.0, 15.0, 7.0, 16.0, 12.0, 12.0, 16.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07989501953125, -0.07769060134887695, -0.0754861831665039, -0.07328176498413086, -0.07107734680175781, -0.06887292861938477, -0.06666851043701172, -0.06446409225463867, -0.062259674072265625, -0.06005525588989258, -0.05785083770751953, -0.055646419525146484, -0.05344200134277344, -0.05123758316040039, -0.049033164978027344, -0.0468287467956543, -0.04462432861328125, -0.0424199104309082, -0.040215492248535156, -0.03801107406616211, -0.03580665588378906, -0.033602237701416016, -0.03139781951904297, -0.029193401336669922, -0.026988983154296875, -0.024784564971923828, -0.02258014678955078, -0.020375728607177734, -0.018171310424804688, -0.01596689224243164, -0.013762474060058594, -0.011558055877685547, -0.0093536376953125, -0.007149219512939453, -0.004944801330566406, -0.0027403831481933594, -0.0005359649658203125, 0.0016684532165527344, 0.0038728713989257812, 0.006077289581298828, 0.008281707763671875, 0.010486125946044922, 0.012690544128417969, 0.014894962310791016, 0.017099380493164062, 0.01930379867553711, 0.021508216857910156, 0.023712635040283203, 0.02591705322265625, 0.028121471405029297, 0.030325889587402344, 0.03253030776977539, 0.03473472595214844, 0.036939144134521484, 0.03914356231689453, 0.04134798049926758, 0.043552398681640625, 0.04575681686401367, 0.04796123504638672, 0.050165653228759766, 0.05237007141113281, 0.05457448959350586, 0.056778907775878906, 0.05898332595825195, 0.061187744140625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 8.0, 17.0, 18.0, 24.0, 35.0, 61.0, 87.0, 114.0, 238.0, 274.0, 407.0, 678.0, 1055.0, 1642.0, 2639.0, 4747.0, 8437.0, 16516.0, 36485.0, 90269.0, 250754.0, 817937.0, 1954323.0, 657527.0, 208659.0, 76431.0, 31524.0, 14746.0, 7496.0, 4201.0, 2579.0, 1541.0, 938.0, 647.0, 419.0, 277.0, 197.0, 118.0, 62.0, 59.0, 33.0, 20.0, 16.0, 12.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1624755859375, -0.15746307373046875, -0.1524505615234375, -0.14743804931640625, -0.142425537109375, -0.13741302490234375, -0.1324005126953125, -0.12738800048828125, -0.12237548828125, -0.11736297607421875, -0.1123504638671875, -0.10733795166015625, -0.102325439453125, -0.09731292724609375, -0.0923004150390625, -0.08728790283203125, -0.082275390625, -0.07726287841796875, -0.0722503662109375, -0.06723785400390625, -0.062225341796875, -0.05721282958984375, -0.0522003173828125, -0.04718780517578125, -0.04217529296875, -0.03716278076171875, -0.0321502685546875, -0.02713775634765625, -0.022125244140625, -0.01711273193359375, -0.0121002197265625, -0.00708770751953125, -0.0020751953125, 0.00293731689453125, 0.0079498291015625, 0.01296234130859375, 0.017974853515625, 0.02298736572265625, 0.0279998779296875, 0.03301239013671875, 0.03802490234375, 0.04303741455078125, 0.0480499267578125, 0.05306243896484375, 0.058074951171875, 0.06308746337890625, 0.0680999755859375, 0.07311248779296875, 0.078125, 0.08313751220703125, 0.0881500244140625, 0.09316253662109375, 0.098175048828125, 0.10318756103515625, 0.1082000732421875, 0.11321258544921875, 0.11822509765625, 0.12323760986328125, 0.1282501220703125, 0.13326263427734375, 0.138275146484375, 0.14328765869140625, 0.1483001708984375, 0.15331268310546875, 0.1583251953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 12.0, 12.0, 16.0, 22.0, 23.0, 47.0, 44.0, 65.0, 95.0, 139.0, 182.0, 240.0, 320.0, 523.0, 644.0, 465.0, 318.0, 254.0, 183.0, 110.0, 87.0, 55.0, 55.0, 37.0, 31.0, 23.0, 10.0, 9.0, 11.0, 9.0, 5.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.130126953125, -0.1259899139404297, -0.12185287475585938, -0.11771583557128906, -0.11357879638671875, -0.10944175720214844, -0.10530471801757812, -0.10116767883300781, -0.0970306396484375, -0.09289360046386719, -0.08875656127929688, -0.08461952209472656, -0.08048248291015625, -0.07634544372558594, -0.07220840454101562, -0.06807136535644531, -0.063934326171875, -0.05979728698730469, -0.055660247802734375, -0.05152320861816406, -0.04738616943359375, -0.04324913024902344, -0.039112091064453125, -0.03497505187988281, -0.0308380126953125, -0.026700973510742188, -0.022563934326171875, -0.018426895141601562, -0.01428985595703125, -0.010152816772460938, -0.006015777587890625, -0.0018787384033203125, 0.00225830078125, 0.0063953399658203125, 0.010532379150390625, 0.014669418334960938, 0.01880645751953125, 0.022943496704101562, 0.027080535888671875, 0.031217575073242188, 0.0353546142578125, 0.03949165344238281, 0.043628692626953125, 0.04776573181152344, 0.05190277099609375, 0.05603981018066406, 0.060176849365234375, 0.06431388854980469, 0.068450927734375, 0.07258796691894531, 0.07672500610351562, 0.08086204528808594, 0.08499908447265625, 0.08913612365722656, 0.09327316284179688, 0.09741020202636719, 0.1015472412109375, 0.10568428039550781, 0.10982131958007812, 0.11395835876464844, 0.11809539794921875, 0.12223243713378906, 0.12636947631835938, 0.1305065155029297, 0.1346435546875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 17.0, 15.0, 17.0, 32.0, 43.0, 38.0, 63.0, 61.0, 87.0, 84.0, 80.0, 83.0, 81.0, 63.0, 48.0, 48.0, 41.0, 20.0, 16.0, 17.0, 15.0, 10.0, 5.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6588698625564575, -0.6383638381958008, -0.617857813835144, -0.5973517894744873, -0.5768458247184753, -0.5563398003578186, -0.5358337759971619, -0.5153277516365051, -0.4948217272758484, -0.47431570291519165, -0.4538097083568573, -0.43330368399620056, -0.4127976596355438, -0.3922916650772095, -0.37178564071655273, -0.351279616355896, -0.33077362179756165, -0.3102675974369049, -0.28976160287857056, -0.2692555785179138, -0.24874955415725708, -0.22824354469776154, -0.207737535238266, -0.18723151087760925, -0.1667255014181137, -0.14621949195861816, -0.12571346759796143, -0.10520745813846588, -0.08470144122838974, -0.0641954243183136, -0.043689414858818054, -0.023183390498161316, -0.0026773810386657715, 0.01782863400876522, 0.03833464905619621, 0.058840662240982056, 0.0793466791510582, 0.09985269606113434, 0.12035870552062988, 0.14086472988128662, 0.16137073934078217, 0.1818767488002777, 0.20238277316093445, 0.22288878262043, 0.24339479207992554, 0.2639008164405823, 0.284406840801239, 0.30491286516189575, 0.3254188597202301, 0.34592488408088684, 0.3664308786392212, 0.38693690299987793, 0.40744292736053467, 0.4279489517211914, 0.44845494627952576, 0.4689609706401825, 0.48946696519851685, 0.5099729895591736, 0.5304790139198303, 0.5509849786758423, 0.571491003036499, 0.5919970273971558, 0.6125030517578125, 0.6330090761184692, 0.653515100479126]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 7.0, 4.0, 7.0, 9.0, 8.0, 18.0, 12.0, 17.0, 18.0, 23.0, 19.0, 30.0, 24.0, 25.0, 29.0, 38.0, 33.0, 48.0, 44.0, 32.0, 40.0, 36.0, 45.0, 42.0, 39.0, 29.0, 42.0, 26.0, 20.0, 29.0, 35.0, 26.0, 20.0, 21.0, 17.0, 18.0, 10.0, 8.0, 11.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.39880841970443726, -0.3866569697856903, -0.37450549006462097, -0.362354040145874, -0.3502025604248047, -0.33805111050605774, -0.3258996605873108, -0.31374818086624146, -0.3015967309474945, -0.28944528102874756, -0.2772938013076782, -0.2651423513889313, -0.25299087166786194, -0.240839421749115, -0.22868795692920685, -0.2165364921092987, -0.20438502728939056, -0.19223356246948242, -0.18008209764957428, -0.16793063282966614, -0.1557791829109192, -0.14362771809101105, -0.1314762532711029, -0.11932479590177536, -0.10717333108186722, -0.09502186626195908, -0.08287040889263153, -0.07071894407272339, -0.058567482978105545, -0.0464160218834877, -0.03426455706357956, -0.022113099694252014, -0.009961634874343872, 0.002189827151596546, 0.014341289177536964, 0.026492752134799957, 0.0386442132294178, 0.050795674324035645, 0.06294713914394379, 0.07509859651327133, 0.08725006133317947, 0.09940152615308762, 0.11155298352241516, 0.1237044483423233, 0.13585591316223145, 0.1480073630809784, 0.16015884280204773, 0.17231029272079468, 0.18446175754070282, 0.19661322236061096, 0.2087646871805191, 0.22091615200042725, 0.2330676019191742, 0.24521906673908234, 0.2573705315589905, 0.2695219814777374, 0.28167346119880676, 0.2938249111175537, 0.30597639083862305, 0.31812784075737, 0.33027932047843933, 0.3424307703971863, 0.3545822501182556, 0.36673370003700256, 0.3788851499557495]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 7.0, 14.0, 21.0, 33.0, 59.0, 94.0, 210.0, 315.0, 565.0, 1090.0, 1928.0, 3222.0, 5885.0, 10782.0, 19714.0, 36983.0, 69801.0, 149005.0, 307361.0, 229577.0, 101093.0, 50649.0, 27160.0, 14859.0, 8039.0, 4385.0, 2428.0, 1435.0, 775.0, 459.0, 253.0, 145.0, 89.0, 42.0, 35.0, 19.0, 8.0, 6.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08245849609375, -0.07925701141357422, -0.07605552673339844, -0.07285404205322266, -0.06965255737304688, -0.0664510726928711, -0.06324958801269531, -0.06004810333251953, -0.05684661865234375, -0.05364513397216797, -0.05044364929199219, -0.047242164611816406, -0.044040679931640625, -0.040839195251464844, -0.03763771057128906, -0.03443622589111328, -0.0312347412109375, -0.02803325653076172, -0.024831771850585938, -0.021630287170410156, -0.018428802490234375, -0.015227317810058594, -0.012025833129882812, -0.008824348449707031, -0.00562286376953125, -0.0024213790893554688, 0.0007801055908203125, 0.003981590270996094, 0.007183074951171875, 0.010384559631347656, 0.013586044311523438, 0.01678752899169922, 0.019989013671875, 0.02319049835205078, 0.026391983032226562, 0.029593467712402344, 0.032794952392578125, 0.035996437072753906, 0.03919792175292969, 0.04239940643310547, 0.04560089111328125, 0.04880237579345703, 0.05200386047363281, 0.055205345153808594, 0.058406829833984375, 0.061608314514160156, 0.06480979919433594, 0.06801128387451172, 0.0712127685546875, 0.07441425323486328, 0.07761573791503906, 0.08081722259521484, 0.08401870727539062, 0.0872201919555664, 0.09042167663574219, 0.09362316131591797, 0.09682464599609375, 0.10002613067626953, 0.10322761535644531, 0.1064291000366211, 0.10963058471679688, 0.11283206939697266, 0.11603355407714844, 0.11923503875732422, 0.1224365234375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 6.0, 5.0, 10.0, 9.0, 6.0, 12.0, 11.0, 16.0, 15.0, 17.0, 14.0, 19.0, 26.0, 27.0, 25.0, 30.0, 23.0, 25.0, 31.0, 43.0, 28.0, 28.0, 41.0, 44.0, 44.0, 27.0, 42.0, 39.0, 35.0, 40.0, 29.0, 36.0, 18.0, 18.0, 24.0, 13.0, 19.0, 16.0, 11.0, 17.0, 12.0, 10.0, 8.0, 7.0, 10.0, 4.0, 3.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.055328369140625, -0.05361032485961914, -0.05189228057861328, -0.05017423629760742, -0.04845619201660156, -0.0467381477355957, -0.045020103454589844, -0.043302059173583984, -0.041584014892578125, -0.039865970611572266, -0.038147926330566406, -0.03642988204956055, -0.03471183776855469, -0.03299379348754883, -0.03127574920654297, -0.02955770492553711, -0.02783966064453125, -0.02612161636352539, -0.02440357208251953, -0.022685527801513672, -0.020967483520507812, -0.019249439239501953, -0.017531394958496094, -0.015813350677490234, -0.014095306396484375, -0.012377262115478516, -0.010659217834472656, -0.008941173553466797, -0.0072231292724609375, -0.005505084991455078, -0.0037870407104492188, -0.0020689964294433594, -0.0003509521484375, 0.0013670921325683594, 0.0030851364135742188, 0.004803180694580078, 0.0065212249755859375, 0.008239269256591797, 0.009957313537597656, 0.011675357818603516, 0.013393402099609375, 0.015111446380615234, 0.016829490661621094, 0.018547534942626953, 0.020265579223632812, 0.021983623504638672, 0.02370166778564453, 0.02541971206665039, 0.02713775634765625, 0.02885580062866211, 0.03057384490966797, 0.03229188919067383, 0.03400993347167969, 0.03572797775268555, 0.037446022033691406, 0.039164066314697266, 0.040882110595703125, 0.042600154876708984, 0.044318199157714844, 0.0460362434387207, 0.04775428771972656, 0.04947233200073242, 0.05119037628173828, 0.05290842056274414, 0.05462646484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 7.0, 7.0, 13.0, 17.0, 23.0, 30.0, 45.0, 75.0, 135.0, 211.0, 588.0, 1556.0, 5189.0, 18226.0, 81648.0, 549408.0, 321091.0, 52112.0, 12467.0, 3586.0, 1171.0, 441.0, 199.0, 92.0, 68.0, 40.0, 26.0, 24.0, 16.0, 14.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.313720703125, -0.3044548034667969, -0.29518890380859375, -0.2859230041503906, -0.2766571044921875, -0.2673912048339844, -0.25812530517578125, -0.24885940551757812, -0.239593505859375, -0.23032760620117188, -0.22106170654296875, -0.21179580688476562, -0.2025299072265625, -0.19326400756835938, -0.18399810791015625, -0.17473220825195312, -0.16546630859375, -0.15620040893554688, -0.14693450927734375, -0.13766860961914062, -0.1284027099609375, -0.11913681030273438, -0.10987091064453125, -0.10060501098632812, -0.091339111328125, -0.08207321166992188, -0.07280731201171875, -0.06354141235351562, -0.0542755126953125, -0.045009613037109375, -0.03574371337890625, -0.026477813720703125, -0.0172119140625, -0.007946014404296875, 0.00131988525390625, 0.010585784912109375, 0.0198516845703125, 0.029117584228515625, 0.03838348388671875, 0.047649383544921875, 0.056915283203125, 0.06618118286132812, 0.07544708251953125, 0.08471298217773438, 0.0939788818359375, 0.10324478149414062, 0.11251068115234375, 0.12177658081054688, 0.13104248046875, 0.14030838012695312, 0.14957427978515625, 0.15884017944335938, 0.1681060791015625, 0.17737197875976562, 0.18663787841796875, 0.19590377807617188, 0.205169677734375, 0.21443557739257812, 0.22370147705078125, 0.23296737670898438, 0.2422332763671875, 0.2514991760253906, 0.26076507568359375, 0.2700309753417969, 0.279296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 9.0, 10.0, 10.0, 16.0, 19.0, 18.0, 19.0, 31.0, 24.0, 30.0, 36.0, 31.0, 45.0, 62.0, 59.0, 47.0, 53.0, 51.0, 46.0, 60.0, 33.0, 52.0, 36.0, 33.0, 31.0, 22.0, 22.0, 19.0, 17.0, 15.0, 9.0, 8.0, 11.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2147216796875, -0.2076416015625, -0.2005615234375, -0.1934814453125, -0.1864013671875, -0.1793212890625, -0.1722412109375, -0.1651611328125, -0.1580810546875, -0.1510009765625, -0.1439208984375, -0.1368408203125, -0.1297607421875, -0.1226806640625, -0.1156005859375, -0.1085205078125, -0.1014404296875, -0.0943603515625, -0.0872802734375, -0.0802001953125, -0.0731201171875, -0.0660400390625, -0.0589599609375, -0.0518798828125, -0.0447998046875, -0.0377197265625, -0.0306396484375, -0.0235595703125, -0.0164794921875, -0.0093994140625, -0.0023193359375, 0.0047607421875, 0.0118408203125, 0.0189208984375, 0.0260009765625, 0.0330810546875, 0.0401611328125, 0.0472412109375, 0.0543212890625, 0.0614013671875, 0.0684814453125, 0.0755615234375, 0.0826416015625, 0.0897216796875, 0.0968017578125, 0.1038818359375, 0.1109619140625, 0.1180419921875, 0.1251220703125, 0.1322021484375, 0.1392822265625, 0.1463623046875, 0.1534423828125, 0.1605224609375, 0.1676025390625, 0.1746826171875, 0.1817626953125, 0.1888427734375, 0.1959228515625, 0.2030029296875, 0.2100830078125, 0.2171630859375, 0.2242431640625, 0.2313232421875, 0.2384033203125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 4.0, 7.0, 20.0, 23.0, 42.0, 62.0, 103.0, 113.0, 201.0, 284.0, 483.0, 720.0, 1199.0, 2040.0, 3948.0, 7781.0, 15949.0, 33245.0, 67745.0, 166138.0, 457956.0, 160011.0, 65724.0, 32340.0, 15677.0, 7613.0, 3848.0, 2091.0, 1145.0, 695.0, 501.0, 270.0, 178.0, 137.0, 85.0, 66.0, 41.0, 26.0, 13.0, 13.0, 10.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09307861328125, -0.09012222290039062, -0.08716583251953125, -0.08420944213867188, -0.0812530517578125, -0.07829666137695312, -0.07534027099609375, -0.07238388061523438, -0.069427490234375, -0.06647109985351562, -0.06351470947265625, -0.060558319091796875, -0.0576019287109375, -0.054645538330078125, -0.05168914794921875, -0.048732757568359375, -0.0457763671875, -0.042819976806640625, -0.03986358642578125, -0.036907196044921875, -0.0339508056640625, -0.030994415283203125, -0.02803802490234375, -0.025081634521484375, -0.022125244140625, -0.019168853759765625, -0.01621246337890625, -0.013256072998046875, -0.0102996826171875, -0.007343292236328125, -0.00438690185546875, -0.001430511474609375, 0.00152587890625, 0.004482269287109375, 0.00743865966796875, 0.010395050048828125, 0.0133514404296875, 0.016307830810546875, 0.01926422119140625, 0.022220611572265625, 0.025177001953125, 0.028133392333984375, 0.03108978271484375, 0.034046173095703125, 0.0370025634765625, 0.039958953857421875, 0.04291534423828125, 0.045871734619140625, 0.048828125, 0.051784515380859375, 0.05474090576171875, 0.057697296142578125, 0.0606536865234375, 0.06361007690429688, 0.06656646728515625, 0.06952285766601562, 0.072479248046875, 0.07543563842773438, 0.07839202880859375, 0.08134841918945312, 0.0843048095703125, 0.08726119995117188, 0.09021759033203125, 0.09317398071289062, 0.09613037109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 9.0, 4.0, 4.0, 10.0, 12.0, 23.0, 20.0, 40.0, 66.0, 85.0, 112.0, 144.0, 141.0, 89.0, 80.0, 44.0, 28.0, 18.0, 23.0, 13.0, 9.0, 9.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.552436828613281e-05, -3.436673432588577e-05, -3.320910036563873e-05, -3.205146640539169e-05, -3.089383244514465e-05, -2.9736198484897614e-05, -2.8578564524650574e-05, -2.7420930564403534e-05, -2.6263296604156494e-05, -2.5105662643909454e-05, -2.3948028683662415e-05, -2.2790394723415375e-05, -2.1632760763168335e-05, -2.0475126802921295e-05, -1.9317492842674255e-05, -1.8159858882427216e-05, -1.7002224922180176e-05, -1.5844590961933136e-05, -1.4686957001686096e-05, -1.3529323041439056e-05, -1.2371689081192017e-05, -1.1214055120944977e-05, -1.0056421160697937e-05, -8.898787200450897e-06, -7.741153240203857e-06, -6.583519279956818e-06, -5.425885319709778e-06, -4.268251359462738e-06, -3.1106173992156982e-06, -1.9529834389686584e-06, -7.953494787216187e-07, 3.6228448152542114e-07, 1.519918441772461e-06, 2.6775524020195007e-06, 3.8351863622665405e-06, 4.99282032251358e-06, 6.15045428276062e-06, 7.30808824300766e-06, 8.4657222032547e-06, 9.62335616350174e-06, 1.078099012374878e-05, 1.1938624083995819e-05, 1.3096258044242859e-05, 1.4253892004489899e-05, 1.541152596473694e-05, 1.6569159924983978e-05, 1.7726793885231018e-05, 1.8884427845478058e-05, 2.0042061805725098e-05, 2.1199695765972137e-05, 2.2357329726219177e-05, 2.3514963686466217e-05, 2.4672597646713257e-05, 2.5830231606960297e-05, 2.6987865567207336e-05, 2.8145499527454376e-05, 2.9303133487701416e-05, 3.0460767447948456e-05, 3.1618401408195496e-05, 3.2776035368442535e-05, 3.3933669328689575e-05, 3.5091303288936615e-05, 3.6248937249183655e-05, 3.7406571209430695e-05, 3.8564205169677734e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 5.0, 9.0, 6.0, 12.0, 28.0, 21.0, 28.0, 41.0, 61.0, 76.0, 125.0, 205.0, 382.0, 821.0, 1767.0, 4251.0, 10829.0, 28575.0, 74585.0, 246283.0, 485147.0, 121210.0, 45258.0, 17098.0, 6584.0, 2648.0, 1107.0, 566.0, 293.0, 178.0, 105.0, 74.0, 53.0, 28.0, 29.0, 18.0, 16.0, 12.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1348876953125, -0.1311655044555664, -0.1274433135986328, -0.12372112274169922, -0.11999893188476562, -0.11627674102783203, -0.11255455017089844, -0.10883235931396484, -0.10511016845703125, -0.10138797760009766, -0.09766578674316406, -0.09394359588623047, -0.09022140502929688, -0.08649921417236328, -0.08277702331542969, -0.0790548324584961, -0.0753326416015625, -0.0716104507446289, -0.06788825988769531, -0.06416606903076172, -0.060443878173828125, -0.05672168731689453, -0.05299949645996094, -0.049277305603027344, -0.04555511474609375, -0.041832923889160156, -0.03811073303222656, -0.03438854217529297, -0.030666351318359375, -0.02694416046142578, -0.023221969604492188, -0.019499778747558594, -0.015777587890625, -0.012055397033691406, -0.008333206176757812, -0.004611015319824219, -0.000888824462890625, 0.0028333663940429688, 0.0065555572509765625, 0.010277748107910156, 0.01399993896484375, 0.017722129821777344, 0.021444320678710938, 0.02516651153564453, 0.028888702392578125, 0.03261089324951172, 0.03633308410644531, 0.040055274963378906, 0.0437774658203125, 0.047499656677246094, 0.05122184753417969, 0.05494403839111328, 0.058666229248046875, 0.06238842010498047, 0.06611061096191406, 0.06983280181884766, 0.07355499267578125, 0.07727718353271484, 0.08099937438964844, 0.08472156524658203, 0.08844375610351562, 0.09216594696044922, 0.09588813781738281, 0.0996103286743164, 0.10333251953125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 8.0, 6.0, 7.0, 9.0, 12.0, 16.0, 22.0, 24.0, 32.0, 48.0, 58.0, 78.0, 150.0, 158.0, 103.0, 73.0, 50.0, 35.0, 25.0, 16.0, 14.0, 14.0, 12.0, 4.0, 6.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1090087890625, -0.1055135726928711, -0.10201835632324219, -0.09852313995361328, -0.09502792358398438, -0.09153270721435547, -0.08803749084472656, -0.08454227447509766, -0.08104705810546875, -0.07755184173583984, -0.07405662536621094, -0.07056140899658203, -0.06706619262695312, -0.06357097625732422, -0.06007575988769531, -0.056580543518066406, -0.0530853271484375, -0.049590110778808594, -0.04609489440917969, -0.04259967803955078, -0.039104461669921875, -0.03560924530029297, -0.03211402893066406, -0.028618812561035156, -0.02512359619140625, -0.021628379821777344, -0.018133163452148438, -0.014637947082519531, -0.011142730712890625, -0.007647514343261719, -0.0041522979736328125, -0.0006570816040039062, 0.002838134765625, 0.006333351135253906, 0.009828567504882812, 0.013323783874511719, 0.016819000244140625, 0.02031421661376953, 0.023809432983398438, 0.027304649353027344, 0.03079986572265625, 0.034295082092285156, 0.03779029846191406, 0.04128551483154297, 0.044780731201171875, 0.04827594757080078, 0.05177116394042969, 0.055266380310058594, 0.0587615966796875, 0.062256813049316406, 0.06575202941894531, 0.06924724578857422, 0.07274246215820312, 0.07623767852783203, 0.07973289489746094, 0.08322811126708984, 0.08672332763671875, 0.09021854400634766, 0.09371376037597656, 0.09720897674560547, 0.10070419311523438, 0.10419940948486328, 0.10769462585449219, 0.1111898422241211, 0.11468505859375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 6.0, 7.0, 16.0, 12.0, 20.0, 26.0, 40.0, 50.0, 77.0, 74.0, 89.0, 81.0, 100.0, 81.0, 73.0, 76.0, 54.0, 46.0, 22.0, 21.0, 16.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8445805311203003, -0.8191482424736023, -0.7937159538269043, -0.7682836651802063, -0.7428513765335083, -0.7174190878868103, -0.6919867992401123, -0.6665545105934143, -0.6411222219467163, -0.6156899333000183, -0.5902576446533203, -0.5648253560066223, -0.5393930673599243, -0.5139607787132263, -0.4885284900665283, -0.4630962014198303, -0.4376639425754547, -0.4122316539287567, -0.3867993652820587, -0.3613670766353607, -0.3359347879886627, -0.3105025291442871, -0.2850702404975891, -0.2596379518508911, -0.23420564830303192, -0.20877335965633392, -0.18334107100963593, -0.15790879726409912, -0.13247650861740112, -0.10704421997070312, -0.08161193132400513, -0.05617964267730713, -0.03074735403060913, -0.005315067246556282, 0.020117219537496567, 0.045549504458904266, 0.07098179310560226, 0.09641407430171967, 0.12184636294841766, 0.14727865159511566, 0.17271094024181366, 0.19814322888851166, 0.22357551753520966, 0.24900779128074646, 0.27444007992744446, 0.29987236857414246, 0.32530465722084045, 0.35073694586753845, 0.37616923451423645, 0.40160152316093445, 0.42703381180763245, 0.45246610045433044, 0.47789838910102844, 0.503330647945404, 0.528762936592102, 0.5541952252388, 0.579627513885498, 0.605059802532196, 0.630492091178894, 0.655924379825592, 0.68135666847229, 0.706788957118988, 0.732221245765686, 0.757653534412384, 0.783085823059082]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 6.0, 8.0, 7.0, 6.0, 20.0, 9.0, 13.0, 22.0, 24.0, 23.0, 21.0, 26.0, 28.0, 37.0, 25.0, 38.0, 44.0, 56.0, 45.0, 37.0, 45.0, 45.0, 51.0, 25.0, 36.0, 41.0, 34.0, 23.0, 29.0, 24.0, 24.0, 16.0, 11.0, 25.0, 12.0, 15.0, 13.0, 5.0, 7.0, 8.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.45189380645751953, -0.4363543689250946, -0.42081496119499207, -0.40527552366256714, -0.3897360861301422, -0.3741966485977173, -0.35865724086761475, -0.3431178033351898, -0.3275783658027649, -0.31203892827033997, -0.2964995205402374, -0.2809600830078125, -0.2654206454753876, -0.24988122284412384, -0.2343418002128601, -0.21880236268043518, -0.20326295495033264, -0.1877235323190689, -0.17218409478664398, -0.15664467215538025, -0.14110523462295532, -0.1255658119916916, -0.11002638936042786, -0.09448695927858353, -0.0789475291967392, -0.06340809911489487, -0.047868672758340836, -0.032329246401786804, -0.016789816319942474, -0.0012503862380981445, 0.014289036393165588, 0.029828466475009918, 0.04536789655685425, 0.06090732663869858, 0.07644675672054291, 0.09198617935180664, 0.10752560943365097, 0.1230650395154953, 0.13860446214675903, 0.15414389967918396, 0.1696833223104477, 0.18522274494171143, 0.20076218247413635, 0.21630160510540009, 0.23184102773666382, 0.24738046526908875, 0.26291990280151367, 0.2784593105316162, 0.29399874806404114, 0.30953818559646606, 0.3250775933265686, 0.34061703085899353, 0.35615646839141846, 0.371695876121521, 0.3872353136539459, 0.40277475118637085, 0.4183141589164734, 0.4338535964488983, 0.44939300417900085, 0.4649324417114258, 0.4804718792438507, 0.49601131677627563, 0.5115507245063782, 0.5270901322364807, 0.542629599571228]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 7.0, 3.0, 8.0, 17.0, 26.0, 50.0, 56.0, 102.0, 134.0, 209.0, 324.0, 544.0, 780.0, 1301.0, 2102.0, 3485.0, 5940.0, 10299.0, 18379.0, 33586.0, 65381.0, 131556.0, 291931.0, 798314.0, 1688613.0, 650554.0, 249922.0, 114800.0, 56771.0, 29847.0, 16324.0, 8984.0, 5339.0, 3246.0, 1916.0, 1201.0, 820.0, 472.0, 293.0, 203.0, 143.0, 96.0, 56.0, 47.0, 32.0, 23.0, 17.0, 12.0, 10.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.08734130859375, -0.08464622497558594, -0.08195114135742188, -0.07925605773925781, -0.07656097412109375, -0.07386589050292969, -0.07117080688476562, -0.06847572326660156, -0.0657806396484375, -0.06308555603027344, -0.060390472412109375, -0.05769538879394531, -0.05500030517578125, -0.05230522155761719, -0.049610137939453125, -0.04691505432128906, -0.044219970703125, -0.04152488708496094, -0.038829803466796875, -0.03613471984863281, -0.03343963623046875, -0.030744552612304688, -0.028049468994140625, -0.025354385375976562, -0.0226593017578125, -0.019964218139648438, -0.017269134521484375, -0.014574050903320312, -0.01187896728515625, -0.009183883666992188, -0.006488800048828125, -0.0037937164306640625, -0.0010986328125, 0.0015964508056640625, 0.004291534423828125, 0.0069866180419921875, 0.00968170166015625, 0.012376785278320312, 0.015071868896484375, 0.017766952514648438, 0.0204620361328125, 0.023157119750976562, 0.025852203369140625, 0.028547286987304688, 0.03124237060546875, 0.03393745422363281, 0.036632537841796875, 0.03932762145996094, 0.042022705078125, 0.04471778869628906, 0.047412872314453125, 0.05010795593261719, 0.05280303955078125, 0.05549812316894531, 0.058193206787109375, 0.06088829040527344, 0.0635833740234375, 0.06627845764160156, 0.06897354125976562, 0.07166862487792969, 0.07436370849609375, 0.07705879211425781, 0.07975387573242188, 0.08244895935058594, 0.08514404296875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 12.0, 7.0, 7.0, 14.0, 17.0, 8.0, 14.0, 15.0, 16.0, 21.0, 22.0, 28.0, 33.0, 49.0, 42.0, 41.0, 39.0, 41.0, 45.0, 44.0, 60.0, 41.0, 41.0, 43.0, 36.0, 28.0, 36.0, 23.0, 34.0, 33.0, 20.0, 14.0, 11.0, 14.0, 6.0, 11.0, 3.0, 10.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06500244140625, -0.06297492980957031, -0.060947418212890625, -0.05891990661621094, -0.05689239501953125, -0.05486488342285156, -0.052837371826171875, -0.05080986022949219, -0.0487823486328125, -0.04675483703613281, -0.044727325439453125, -0.04269981384277344, -0.04067230224609375, -0.03864479064941406, -0.036617279052734375, -0.03458976745605469, -0.032562255859375, -0.030534744262695312, -0.028507232666015625, -0.026479721069335938, -0.02445220947265625, -0.022424697875976562, -0.020397186279296875, -0.018369674682617188, -0.0163421630859375, -0.014314651489257812, -0.012287139892578125, -0.010259628295898438, -0.00823211669921875, -0.0062046051025390625, -0.004177093505859375, -0.0021495819091796875, -0.0001220703125, 0.0019054412841796875, 0.003932952880859375, 0.0059604644775390625, 0.00798797607421875, 0.010015487670898438, 0.012042999267578125, 0.014070510864257812, 0.0160980224609375, 0.018125534057617188, 0.020153045654296875, 0.022180557250976562, 0.02420806884765625, 0.026235580444335938, 0.028263092041015625, 0.030290603637695312, 0.032318115234375, 0.03434562683105469, 0.036373138427734375, 0.03840065002441406, 0.04042816162109375, 0.04245567321777344, 0.044483184814453125, 0.04651069641113281, 0.0485382080078125, 0.05056571960449219, 0.052593231201171875, 0.05462074279785156, 0.05664825439453125, 0.05867576599121094, 0.060703277587890625, 0.06273078918457031, 0.06475830078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 11.0, 17.0, 21.0, 33.0, 51.0, 76.0, 93.0, 134.0, 208.0, 317.0, 460.0, 799.0, 1175.0, 1949.0, 3317.0, 5876.0, 10637.0, 20967.0, 44726.0, 104743.0, 281692.0, 927074.0, 1844561.0, 598549.0, 198099.0, 77018.0, 34193.0, 16587.0, 8644.0, 4869.0, 2724.0, 1677.0, 1062.0, 656.0, 427.0, 272.0, 170.0, 122.0, 69.0, 62.0, 37.0, 34.0, 17.0, 14.0, 9.0, 6.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0], "bins": [-0.1727294921875, -0.16769790649414062, -0.16266632080078125, -0.15763473510742188, -0.1526031494140625, -0.14757156372070312, -0.14253997802734375, -0.13750839233398438, -0.132476806640625, -0.12744522094726562, -0.12241363525390625, -0.11738204956054688, -0.1123504638671875, -0.10731887817382812, -0.10228729248046875, -0.09725570678710938, -0.09222412109375, -0.08719253540039062, -0.08216094970703125, -0.07712936401367188, -0.0720977783203125, -0.06706619262695312, -0.06203460693359375, -0.057003021240234375, -0.051971435546875, -0.046939849853515625, -0.04190826416015625, -0.036876678466796875, -0.0318450927734375, -0.026813507080078125, -0.02178192138671875, -0.016750335693359375, -0.01171875, -0.006687164306640625, -0.00165557861328125, 0.003376007080078125, 0.0084075927734375, 0.013439178466796875, 0.01847076416015625, 0.023502349853515625, 0.028533935546875, 0.033565521240234375, 0.03859710693359375, 0.043628692626953125, 0.0486602783203125, 0.053691864013671875, 0.05872344970703125, 0.06375503540039062, 0.06878662109375, 0.07381820678710938, 0.07884979248046875, 0.08388137817382812, 0.0889129638671875, 0.09394454956054688, 0.09897613525390625, 0.10400772094726562, 0.109039306640625, 0.11407089233398438, 0.11910247802734375, 0.12413406372070312, 0.1291656494140625, 0.13419723510742188, 0.13922882080078125, 0.14426040649414062, 0.1492919921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 17.0, 8.0, 12.0, 20.0, 26.0, 27.0, 51.0, 84.0, 80.0, 125.0, 177.0, 240.0, 374.0, 599.0, 651.0, 448.0, 327.0, 218.0, 149.0, 122.0, 86.0, 44.0, 47.0, 31.0, 21.0, 18.0, 12.0, 11.0, 10.0, 5.0, 8.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.181640625, -0.17616844177246094, -0.17069625854492188, -0.1652240753173828, -0.15975189208984375, -0.1542797088623047, -0.14880752563476562, -0.14333534240722656, -0.1378631591796875, -0.13239097595214844, -0.12691879272460938, -0.12144660949707031, -0.11597442626953125, -0.11050224304199219, -0.10503005981445312, -0.09955787658691406, -0.094085693359375, -0.08861351013183594, -0.08314132690429688, -0.07766914367675781, -0.07219696044921875, -0.06672477722167969, -0.061252593994140625, -0.05578041076660156, -0.0503082275390625, -0.04483604431152344, -0.039363861083984375, -0.03389167785644531, -0.02841949462890625, -0.022947311401367188, -0.017475128173828125, -0.012002944946289062, -0.00653076171875, -0.0010585784912109375, 0.004413604736328125, 0.009885787963867188, 0.01535797119140625, 0.020830154418945312, 0.026302337646484375, 0.03177452087402344, 0.0372467041015625, 0.04271888732910156, 0.048191070556640625, 0.05366325378417969, 0.05913543701171875, 0.06460762023925781, 0.07007980346679688, 0.07555198669433594, 0.081024169921875, 0.08649635314941406, 0.09196853637695312, 0.09744071960449219, 0.10291290283203125, 0.10838508605957031, 0.11385726928710938, 0.11932945251464844, 0.1248016357421875, 0.13027381896972656, 0.13574600219726562, 0.1412181854248047, 0.14669036865234375, 0.1521625518798828, 0.15763473510742188, 0.16310691833496094, 0.1685791015625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 9.0, 7.0, 6.0, 16.0, 8.0, 15.0, 19.0, 13.0, 19.0, 25.0, 23.0, 37.0, 35.0, 44.0, 37.0, 40.0, 52.0, 55.0, 52.0, 53.0, 65.0, 48.0, 56.0, 27.0, 44.0, 35.0, 25.0, 24.0, 18.0, 17.0, 8.0, 8.0, 14.0, 14.0, 4.0, 7.0, 6.0, 4.0, 3.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.5574355125427246, -0.5417376160621643, -0.526039719581604, -0.5103418231010437, -0.4946439266204834, -0.4789460301399231, -0.4632481336593628, -0.4475502371788025, -0.4318523406982422, -0.4161544442176819, -0.4004565477371216, -0.3847586512565613, -0.369060754776001, -0.3533628582954407, -0.33766496181488037, -0.32196706533432007, -0.3062691390514374, -0.2905712425708771, -0.2748733460903168, -0.25917544960975647, -0.24347755312919617, -0.22777965664863586, -0.21208174526691437, -0.19638384878635406, -0.18068595230579376, -0.16498805582523346, -0.14929015934467316, -0.13359224796295166, -0.11789435893297195, -0.10219646245241165, -0.08649855852127075, -0.07080066204071045, -0.055102765560150146, -0.039404869079589844, -0.023706968873739243, -0.008009068667888641, 0.007688827812671661, 0.023386724293231964, 0.039084628224372864, 0.054782524704933167, 0.07048042118549347, 0.08617831766605377, 0.10187621414661407, 0.11757411807775497, 0.13327202200889587, 0.14896991848945618, 0.16466781497001648, 0.18036571145057678, 0.19606360793113708, 0.2117615044116974, 0.2274594008922577, 0.243157297372818, 0.2588551938533783, 0.2745530903339386, 0.2902510166168213, 0.3059489130973816, 0.3216468095779419, 0.3373447060585022, 0.3530426025390625, 0.3687404990196228, 0.3844383955001831, 0.4001362919807434, 0.4158341884613037, 0.431532084941864, 0.4472299814224243]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 4.0, 7.0, 9.0, 19.0, 9.0, 16.0, 17.0, 26.0, 21.0, 28.0, 29.0, 33.0, 30.0, 41.0, 34.0, 34.0, 46.0, 40.0, 39.0, 43.0, 41.0, 53.0, 28.0, 38.0, 32.0, 35.0, 24.0, 33.0, 21.0, 15.0, 20.0, 20.0, 20.0, 15.0, 17.0, 16.0, 8.0, 6.0, 6.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5136818289756775, -0.49725139141082764, -0.4808209538459778, -0.46439051628112793, -0.4479600787162781, -0.4315296411514282, -0.415099173784256, -0.39866873621940613, -0.3822382986545563, -0.3658078610897064, -0.34937742352485657, -0.3329469859600067, -0.3165165185928345, -0.3000860810279846, -0.28365564346313477, -0.2672252058982849, -0.25079476833343506, -0.2343643307685852, -0.21793389320373535, -0.2015034407377243, -0.18507300317287445, -0.1686425656080246, -0.15221211314201355, -0.1357816755771637, -0.11935123801231384, -0.10292080044746399, -0.08649035543203354, -0.07005991041660309, -0.053629472851753235, -0.03719903528690338, -0.02076859027147293, -0.0043381452560424805, 0.012092232704162598, 0.02852267399430275, 0.0449531152844429, 0.061383556574583054, 0.0778139978647232, 0.09424443542957306, 0.11067488044500351, 0.12710532546043396, 0.1435357630252838, 0.15996620059013367, 0.17639663815498352, 0.19282709062099457, 0.20925752818584442, 0.22568796575069427, 0.24211841821670532, 0.2585488557815552, 0.27497929334640503, 0.2914097309112549, 0.30784016847610474, 0.3242706060409546, 0.34070104360580444, 0.3571314811706543, 0.37356194853782654, 0.3899923861026764, 0.40642282366752625, 0.4228532612323761, 0.43928369879722595, 0.4557141363620758, 0.47214460372924805, 0.4885750412940979, 0.5050054788589478, 0.5214359164237976, 0.5378663539886475]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 9.0, 5.0, 17.0, 21.0, 37.0, 64.0, 80.0, 134.0, 216.0, 321.0, 543.0, 876.0, 1463.0, 2308.0, 3712.0, 6063.0, 9860.0, 16203.0, 26369.0, 44500.0, 79591.0, 156977.0, 283733.0, 192367.0, 93841.0, 51588.0, 30074.0, 18214.0, 11147.0, 6881.0, 4283.0, 2626.0, 1621.0, 968.0, 651.0, 450.0, 301.0, 158.0, 115.0, 58.0, 34.0, 20.0, 21.0, 17.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.13134765625, -0.1270599365234375, -0.122772216796875, -0.1184844970703125, -0.11419677734375, -0.1099090576171875, -0.105621337890625, -0.1013336181640625, -0.0970458984375, -0.0927581787109375, -0.088470458984375, -0.0841827392578125, -0.07989501953125, -0.0756072998046875, -0.071319580078125, -0.0670318603515625, -0.062744140625, -0.0584564208984375, -0.054168701171875, -0.0498809814453125, -0.04559326171875, -0.0413055419921875, -0.037017822265625, -0.0327301025390625, -0.0284423828125, -0.0241546630859375, -0.019866943359375, -0.0155792236328125, -0.01129150390625, -0.0070037841796875, -0.002716064453125, 0.0015716552734375, 0.005859375, 0.0101470947265625, 0.014434814453125, 0.0187225341796875, 0.02301025390625, 0.0272979736328125, 0.031585693359375, 0.0358734130859375, 0.0401611328125, 0.0444488525390625, 0.048736572265625, 0.0530242919921875, 0.05731201171875, 0.0615997314453125, 0.065887451171875, 0.0701751708984375, 0.074462890625, 0.0787506103515625, 0.083038330078125, 0.0873260498046875, 0.09161376953125, 0.0959014892578125, 0.100189208984375, 0.1044769287109375, 0.1087646484375, 0.1130523681640625, 0.117340087890625, 0.1216278076171875, 0.12591552734375, 0.1302032470703125, 0.134490966796875, 0.1387786865234375, 0.14306640625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 7.0, 7.0, 8.0, 9.0, 19.0, 19.0, 19.0, 25.0, 23.0, 13.0, 33.0, 36.0, 27.0, 37.0, 39.0, 41.0, 36.0, 29.0, 37.0, 41.0, 52.0, 38.0, 40.0, 41.0, 37.0, 27.0, 33.0, 27.0, 23.0, 19.0, 25.0, 20.0, 14.0, 8.0, 13.0, 12.0, 9.0, 12.0, 8.0, 3.0, 1.0, 2.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.06768798828125, -0.06564807891845703, -0.06360816955566406, -0.061568260192871094, -0.059528350830078125, -0.057488441467285156, -0.05544853210449219, -0.05340862274169922, -0.05136871337890625, -0.04932880401611328, -0.04728889465332031, -0.045248985290527344, -0.043209075927734375, -0.041169166564941406, -0.03912925720214844, -0.03708934783935547, -0.0350494384765625, -0.03300952911376953, -0.030969619750976562, -0.028929710388183594, -0.026889801025390625, -0.024849891662597656, -0.022809982299804688, -0.02077007293701172, -0.01873016357421875, -0.01669025421142578, -0.014650344848632812, -0.012610435485839844, -0.010570526123046875, -0.008530616760253906, -0.0064907073974609375, -0.004450798034667969, -0.002410888671875, -0.00037097930908203125, 0.0016689300537109375, 0.0037088394165039062, 0.005748748779296875, 0.007788658142089844, 0.009828567504882812, 0.011868476867675781, 0.01390838623046875, 0.01594829559326172, 0.017988204956054688, 0.020028114318847656, 0.022068023681640625, 0.024107933044433594, 0.026147842407226562, 0.02818775177001953, 0.0302276611328125, 0.03226757049560547, 0.03430747985839844, 0.036347389221191406, 0.038387298583984375, 0.040427207946777344, 0.04246711730957031, 0.04450702667236328, 0.04654693603515625, 0.04858684539794922, 0.05062675476074219, 0.052666664123535156, 0.054706573486328125, 0.056746482849121094, 0.05878639221191406, 0.06082630157470703, 0.0628662109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 7.0, 16.0, 13.0, 26.0, 36.0, 48.0, 70.0, 100.0, 141.0, 260.0, 506.0, 1071.0, 2964.0, 8101.0, 23105.0, 67844.0, 245203.0, 496085.0, 136138.0, 42979.0, 14984.0, 5242.0, 1845.0, 788.0, 356.0, 197.0, 123.0, 83.0, 45.0, 46.0, 32.0, 26.0, 13.0, 11.0, 13.0, 9.0, 4.0, 7.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240478515625, -0.23166656494140625, -0.2228546142578125, -0.21404266357421875, -0.205230712890625, -0.19641876220703125, -0.1876068115234375, -0.17879486083984375, -0.16998291015625, -0.16117095947265625, -0.1523590087890625, -0.14354705810546875, -0.134735107421875, -0.12592315673828125, -0.1171112060546875, -0.10829925537109375, -0.0994873046875, -0.09067535400390625, -0.0818634033203125, -0.07305145263671875, -0.064239501953125, -0.05542755126953125, -0.0466156005859375, -0.03780364990234375, -0.02899169921875, -0.02017974853515625, -0.0113677978515625, -0.00255584716796875, 0.006256103515625, 0.01506805419921875, 0.0238800048828125, 0.03269195556640625, 0.04150390625, 0.05031585693359375, 0.0591278076171875, 0.06793975830078125, 0.076751708984375, 0.08556365966796875, 0.0943756103515625, 0.10318756103515625, 0.11199951171875, 0.12081146240234375, 0.1296234130859375, 0.13843536376953125, 0.147247314453125, 0.15605926513671875, 0.1648712158203125, 0.17368316650390625, 0.1824951171875, 0.19130706787109375, 0.2001190185546875, 0.20893096923828125, 0.217742919921875, 0.22655487060546875, 0.2353668212890625, 0.24417877197265625, 0.25299072265625, 0.26180267333984375, 0.2706146240234375, 0.27942657470703125, 0.288238525390625, 0.29705047607421875, 0.3058624267578125, 0.31467437744140625, 0.323486328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 8.0, 7.0, 12.0, 9.0, 14.0, 12.0, 16.0, 20.0, 20.0, 17.0, 20.0, 24.0, 30.0, 27.0, 29.0, 31.0, 38.0, 37.0, 35.0, 34.0, 45.0, 52.0, 40.0, 37.0, 45.0, 28.0, 37.0, 25.0, 29.0, 35.0, 32.0, 29.0, 16.0, 20.0, 12.0, 11.0, 14.0, 6.0, 8.0, 12.0, 7.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2100830078125, -0.20352554321289062, -0.19696807861328125, -0.19041061401367188, -0.1838531494140625, -0.17729568481445312, -0.17073822021484375, -0.16418075561523438, -0.157623291015625, -0.15106582641601562, -0.14450836181640625, -0.13795089721679688, -0.1313934326171875, -0.12483596801757812, -0.11827850341796875, -0.11172103881835938, -0.10516357421875, -0.09860610961914062, -0.09204864501953125, -0.08549118041992188, -0.0789337158203125, -0.07237625122070312, -0.06581878662109375, -0.059261322021484375, -0.052703857421875, -0.046146392822265625, -0.03958892822265625, -0.033031463623046875, -0.0264739990234375, -0.019916534423828125, -0.01335906982421875, -0.006801605224609375, -0.000244140625, 0.006313323974609375, 0.01287078857421875, 0.019428253173828125, 0.0259857177734375, 0.032543182373046875, 0.03910064697265625, 0.045658111572265625, 0.052215576171875, 0.058773040771484375, 0.06533050537109375, 0.07188796997070312, 0.0784454345703125, 0.08500289916992188, 0.09156036376953125, 0.09811782836914062, 0.10467529296875, 0.11123275756835938, 0.11779022216796875, 0.12434768676757812, 0.1309051513671875, 0.13746261596679688, 0.14402008056640625, 0.15057754516601562, 0.157135009765625, 0.16369247436523438, 0.17024993896484375, 0.17680740356445312, 0.1833648681640625, 0.18992233276367188, 0.19647979736328125, 0.20303726196289062, 0.2095947265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 1.0, 8.0, 11.0, 22.0, 32.0, 82.0, 145.0, 287.0, 559.0, 1144.0, 2386.0, 4863.0, 10754.0, 24607.0, 55250.0, 132450.0, 375405.0, 265642.0, 98407.0, 41939.0, 18578.0, 8365.0, 3877.0, 1851.0, 918.0, 438.0, 243.0, 136.0, 65.0, 43.0, 23.0, 13.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0860595703125, -0.08244895935058594, -0.07883834838867188, -0.07522773742675781, -0.07161712646484375, -0.06800651550292969, -0.06439590454101562, -0.06078529357910156, -0.0571746826171875, -0.05356407165527344, -0.049953460693359375, -0.04634284973144531, -0.04273223876953125, -0.03912162780761719, -0.035511016845703125, -0.03190040588378906, -0.028289794921875, -0.024679183959960938, -0.021068572998046875, -0.017457962036132812, -0.01384735107421875, -0.010236740112304688, -0.006626129150390625, -0.0030155181884765625, 0.0005950927734375, 0.0042057037353515625, 0.007816314697265625, 0.011426925659179688, 0.01503753662109375, 0.018648147583007812, 0.022258758544921875, 0.025869369506835938, 0.02947998046875, 0.03309059143066406, 0.036701202392578125, 0.04031181335449219, 0.04392242431640625, 0.04753303527832031, 0.051143646240234375, 0.05475425720214844, 0.0583648681640625, 0.06197547912597656, 0.06558609008789062, 0.06919670104980469, 0.07280731201171875, 0.07641792297363281, 0.08002853393554688, 0.08363914489746094, 0.087249755859375, 0.09086036682128906, 0.09447097778320312, 0.09808158874511719, 0.10169219970703125, 0.10530281066894531, 0.10891342163085938, 0.11252403259277344, 0.1161346435546875, 0.11974525451660156, 0.12335586547851562, 0.1269664764404297, 0.13057708740234375, 0.1341876983642578, 0.13779830932617188, 0.14140892028808594, 0.14501953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 8.0, 8.0, 10.0, 13.0, 13.0, 22.0, 27.0, 34.0, 55.0, 68.0, 103.0, 111.0, 105.0, 100.0, 84.0, 66.0, 35.0, 32.0, 18.0, 15.0, 21.0, 4.0, 11.0, 5.0, 6.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.504753112792969e-05, -3.388989716768265e-05, -3.273226320743561e-05, -3.157462924718857e-05, -3.041699528694153e-05, -2.925936132669449e-05, -2.810172736644745e-05, -2.694409340620041e-05, -2.578645944595337e-05, -2.462882548570633e-05, -2.347119152545929e-05, -2.231355756521225e-05, -2.115592360496521e-05, -1.999828964471817e-05, -1.884065568447113e-05, -1.768302172422409e-05, -1.652538776397705e-05, -1.536775380373001e-05, -1.4210119843482971e-05, -1.3052485883235931e-05, -1.1894851922988892e-05, -1.0737217962741852e-05, -9.579584002494812e-06, -8.421950042247772e-06, -7.264316082000732e-06, -6.106682121753693e-06, -4.949048161506653e-06, -3.791414201259613e-06, -2.6337802410125732e-06, -1.4761462807655334e-06, -3.1851232051849365e-07, 8.391216397285461e-07, 1.996755599975586e-06, 3.1543895602226257e-06, 4.3120235204696655e-06, 5.469657480716705e-06, 6.627291440963745e-06, 7.784925401210785e-06, 8.942559361457825e-06, 1.0100193321704865e-05, 1.1257827281951904e-05, 1.2415461242198944e-05, 1.3573095202445984e-05, 1.4730729162693024e-05, 1.5888363122940063e-05, 1.7045997083187103e-05, 1.8203631043434143e-05, 1.9361265003681183e-05, 2.0518898963928223e-05, 2.1676532924175262e-05, 2.2834166884422302e-05, 2.3991800844669342e-05, 2.5149434804916382e-05, 2.630706876516342e-05, 2.746470272541046e-05, 2.86223366856575e-05, 2.977997064590454e-05, 3.093760460615158e-05, 3.209523856639862e-05, 3.325287252664566e-05, 3.44105064868927e-05, 3.556814044713974e-05, 3.672577440738678e-05, 3.788340836763382e-05, 3.904104232788086e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 9.0, 13.0, 11.0, 24.0, 30.0, 32.0, 48.0, 75.0, 99.0, 160.0, 247.0, 489.0, 1073.0, 2300.0, 5280.0, 12669.0, 31518.0, 80641.0, 219922.0, 422754.0, 165901.0, 62566.0, 24843.0, 9970.0, 4160.0, 1794.0, 852.0, 418.0, 221.0, 140.0, 96.0, 52.0, 39.0, 23.0, 22.0, 13.0, 10.0, 9.0, 6.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1195068359375, -0.11569690704345703, -0.11188697814941406, -0.1080770492553711, -0.10426712036132812, -0.10045719146728516, -0.09664726257324219, -0.09283733367919922, -0.08902740478515625, -0.08521747589111328, -0.08140754699707031, -0.07759761810302734, -0.07378768920898438, -0.0699777603149414, -0.06616783142089844, -0.06235790252685547, -0.0585479736328125, -0.05473804473876953, -0.05092811584472656, -0.047118186950683594, -0.043308258056640625, -0.039498329162597656, -0.03568840026855469, -0.03187847137451172, -0.02806854248046875, -0.02425861358642578, -0.020448684692382812, -0.016638755798339844, -0.012828826904296875, -0.009018898010253906, -0.0052089691162109375, -0.0013990402221679688, 0.002410888671875, 0.006220817565917969, 0.010030746459960938, 0.013840675354003906, 0.017650604248046875, 0.021460533142089844, 0.025270462036132812, 0.02908039093017578, 0.03289031982421875, 0.03670024871826172, 0.04051017761230469, 0.044320106506347656, 0.048130035400390625, 0.051939964294433594, 0.05574989318847656, 0.05955982208251953, 0.0633697509765625, 0.06717967987060547, 0.07098960876464844, 0.0747995376586914, 0.07860946655273438, 0.08241939544677734, 0.08622932434082031, 0.09003925323486328, 0.09384918212890625, 0.09765911102294922, 0.10146903991699219, 0.10527896881103516, 0.10908889770507812, 0.1128988265991211, 0.11670875549316406, 0.12051868438720703, 0.12432861328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 4.0, 8.0, 7.0, 9.0, 16.0, 19.0, 21.0, 22.0, 22.0, 35.0, 49.0, 41.0, 49.0, 94.0, 125.0, 105.0, 72.0, 51.0, 49.0, 45.0, 31.0, 15.0, 25.0, 23.0, 11.0, 8.0, 6.0, 6.0, 6.0, 9.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11474609375, -0.11089515686035156, -0.10704421997070312, -0.10319328308105469, -0.09934234619140625, -0.09549140930175781, -0.09164047241210938, -0.08778953552246094, -0.0839385986328125, -0.08008766174316406, -0.07623672485351562, -0.07238578796386719, -0.06853485107421875, -0.06468391418457031, -0.060832977294921875, -0.05698204040527344, -0.053131103515625, -0.04928016662597656, -0.045429229736328125, -0.04157829284667969, -0.03772735595703125, -0.03387641906738281, -0.030025482177734375, -0.026174545288085938, -0.0223236083984375, -0.018472671508789062, -0.014621734619140625, -0.010770797729492188, -0.00691986083984375, -0.0030689239501953125, 0.000782012939453125, 0.0046329498291015625, 0.00848388671875, 0.012334823608398438, 0.016185760498046875, 0.020036697387695312, 0.02388763427734375, 0.027738571166992188, 0.031589508056640625, 0.03544044494628906, 0.0392913818359375, 0.04314231872558594, 0.046993255615234375, 0.05084419250488281, 0.05469512939453125, 0.05854606628417969, 0.062397003173828125, 0.06624794006347656, 0.070098876953125, 0.07394981384277344, 0.07780075073242188, 0.08165168762207031, 0.08550262451171875, 0.08935356140136719, 0.09320449829101562, 0.09705543518066406, 0.1009063720703125, 0.10475730895996094, 0.10860824584960938, 0.11245918273925781, 0.11631011962890625, 0.12016105651855469, 0.12401199340820312, 0.12786293029785156, 0.1317138671875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 13.0, 20.0, 26.0, 65.0, 94.0, 126.0, 158.0, 150.0, 134.0, 99.0, 57.0, 33.0, 19.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5333600044250488, -1.47694730758667, -1.4205347299575806, -1.3641221523284912, -1.3077094554901123, -1.2512967586517334, -1.194884181022644, -1.1384716033935547, -1.0820589065551758, -1.0256462097167969, -0.9692336320877075, -0.9128209948539734, -0.8564083576202393, -0.7999957203865051, -0.743583083152771, -0.6871704459190369, -0.6307578086853027, -0.5743451714515686, -0.5179325342178345, -0.46151989698410034, -0.4051072597503662, -0.3486946225166321, -0.29228198528289795, -0.23586934804916382, -0.1794567108154297, -0.12304407358169556, -0.06663143634796143, -0.010218799114227295, 0.046193838119506836, 0.10260647535324097, 0.1590191125869751, 0.21543174982070923, 0.27184438705444336, 0.3282570242881775, 0.3846696615219116, 0.44108229875564575, 0.4974949359893799, 0.553907573223114, 0.6103202104568481, 0.6667328476905823, 0.7231454849243164, 0.7795581221580505, 0.8359707593917847, 0.8923833966255188, 0.9487960338592529, 1.0052087306976318, 1.0616213083267212, 1.1180338859558105, 1.1744465827941895, 1.2308592796325684, 1.2872718572616577, 1.343684434890747, 1.400097131729126, 1.4565098285675049, 1.5129224061965942, 1.5693349838256836, 1.6257476806640625, 1.6821603775024414, 1.7385729551315308, 1.7949855327606201, 1.851398229598999, 1.907810926437378, 1.9642235040664673, 2.0206360816955566, 2.0770487785339355]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 2.0, 11.0, 13.0, 11.0, 17.0, 22.0, 24.0, 33.0, 33.0, 27.0, 33.0, 31.0, 29.0, 40.0, 39.0, 43.0, 38.0, 45.0, 49.0, 58.0, 46.0, 36.0, 39.0, 48.0, 33.0, 27.0, 32.0, 32.0, 19.0, 15.0, 18.0, 13.0, 9.0, 11.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7546989321708679, -0.728951096534729, -0.7032032012939453, -0.6774553656578064, -0.6517075300216675, -0.6259596347808838, -0.6002117991447449, -0.574463963508606, -0.5487160682678223, -0.5229682326316833, -0.49722036719322205, -0.47147250175476074, -0.4457246661186218, -0.4199768006801605, -0.3942289352416992, -0.3684810996055603, -0.3427332639694214, -0.3169853985309601, -0.29123756289482117, -0.26548969745635986, -0.23974184691905975, -0.21399399638175964, -0.18824613094329834, -0.16249828040599823, -0.13675042986869812, -0.11100257933139801, -0.0852547213435173, -0.0595068633556366, -0.03375901281833649, -0.008011162281036377, 0.017736703157424927, 0.04348455369472504, 0.06923240423202515, 0.09498025476932526, 0.12072811275720596, 0.14647597074508667, 0.17222382128238678, 0.1979716718196869, 0.2237195372581482, 0.2494673877954483, 0.2752152383327484, 0.3009631037712097, 0.32671093940734863, 0.35245880484580994, 0.37820667028427124, 0.40395450592041016, 0.42970237135887146, 0.45545023679733276, 0.4811980724334717, 0.5069459080696106, 0.5326938033103943, 0.5584416389465332, 0.5841894745826721, 0.609937310218811, 0.6356852054595947, 0.6614330410957336, 0.6871808767318726, 0.7129287123680115, 0.7386766076087952, 0.7644244432449341, 0.790172278881073, 0.8159201145172119, 0.8416680097579956, 0.8674158453941345, 0.8931637406349182]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 12.0, 11.0, 17.0, 34.0, 42.0, 47.0, 67.0, 119.0, 186.0, 256.0, 355.0, 589.0, 948.0, 1514.0, 2660.0, 4438.0, 8298.0, 15967.0, 33208.0, 73202.0, 176049.0, 497234.0, 1781054.0, 1066953.0, 308512.0, 119082.0, 51418.0, 24205.0, 12172.0, 6564.0, 3599.0, 2018.0, 1255.0, 753.0, 505.0, 296.0, 179.0, 147.0, 97.0, 67.0, 35.0, 35.0, 25.0, 21.0, 8.0, 5.0, 2.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.1258544921875, -0.12212944030761719, -0.11840438842773438, -0.11467933654785156, -0.11095428466796875, -0.10722923278808594, -0.10350418090820312, -0.09977912902832031, -0.0960540771484375, -0.09232902526855469, -0.08860397338867188, -0.08487892150878906, -0.08115386962890625, -0.07742881774902344, -0.07370376586914062, -0.06997871398925781, -0.066253662109375, -0.06252861022949219, -0.058803558349609375, -0.05507850646972656, -0.05135345458984375, -0.04762840270996094, -0.043903350830078125, -0.04017829895019531, -0.0364532470703125, -0.03272819519042969, -0.029003143310546875, -0.025278091430664062, -0.02155303955078125, -0.017827987670898438, -0.014102935791015625, -0.010377883911132812, -0.00665283203125, -0.0029277801513671875, 0.000797271728515625, 0.0045223236083984375, 0.00824737548828125, 0.011972427368164062, 0.015697479248046875, 0.019422531127929688, 0.0231475830078125, 0.026872634887695312, 0.030597686767578125, 0.03432273864746094, 0.03804779052734375, 0.04177284240722656, 0.045497894287109375, 0.04922294616699219, 0.052947998046875, 0.05667304992675781, 0.060398101806640625, 0.06412315368652344, 0.06784820556640625, 0.07157325744628906, 0.07529830932617188, 0.07902336120605469, 0.0827484130859375, 0.08647346496582031, 0.09019851684570312, 0.09392356872558594, 0.09764862060546875, 0.10137367248535156, 0.10509872436523438, 0.10882377624511719, 0.112548828125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 11.0, 11.0, 10.0, 21.0, 18.0, 29.0, 30.0, 35.0, 39.0, 30.0, 30.0, 41.0, 46.0, 42.0, 51.0, 46.0, 55.0, 52.0, 41.0, 41.0, 43.0, 29.0, 33.0, 20.0, 22.0, 24.0, 25.0, 22.0, 18.0, 13.0, 8.0, 8.0, 9.0, 7.0, 4.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0770263671875, -0.07459449768066406, -0.07216262817382812, -0.06973075866699219, -0.06729888916015625, -0.06486701965332031, -0.062435150146484375, -0.06000328063964844, -0.0575714111328125, -0.05513954162597656, -0.052707672119140625, -0.05027580261230469, -0.04784393310546875, -0.04541206359863281, -0.042980194091796875, -0.04054832458496094, -0.038116455078125, -0.03568458557128906, -0.033252716064453125, -0.030820846557617188, -0.02838897705078125, -0.025957107543945312, -0.023525238037109375, -0.021093368530273438, -0.0186614990234375, -0.016229629516601562, -0.013797760009765625, -0.011365890502929688, -0.00893402099609375, -0.0065021514892578125, -0.004070281982421875, -0.0016384124755859375, 0.00079345703125, 0.0032253265380859375, 0.005657196044921875, 0.008089065551757812, 0.01052093505859375, 0.012952804565429688, 0.015384674072265625, 0.017816543579101562, 0.0202484130859375, 0.022680282592773438, 0.025112152099609375, 0.027544021606445312, 0.02997589111328125, 0.03240776062011719, 0.034839630126953125, 0.03727149963378906, 0.039703369140625, 0.04213523864746094, 0.044567108154296875, 0.04699897766113281, 0.04943084716796875, 0.05186271667480469, 0.054294586181640625, 0.05672645568847656, 0.0591583251953125, 0.06159019470214844, 0.06402206420898438, 0.06645393371582031, 0.06888580322265625, 0.07131767272949219, 0.07374954223632812, 0.07618141174316406, 0.07861328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 4.0, 2.0, 2.0, 6.0, 11.0, 13.0, 18.0, 28.0, 44.0, 61.0, 84.0, 101.0, 147.0, 214.0, 326.0, 522.0, 843.0, 1538.0, 2940.0, 6192.0, 14862.0, 39602.0, 117059.0, 404921.0, 1840216.0, 1322103.0, 297067.0, 90603.0, 31307.0, 12268.0, 5165.0, 2385.0, 1346.0, 773.0, 497.0, 296.0, 214.0, 140.0, 107.0, 83.0, 54.0, 35.0, 26.0, 17.0, 10.0, 14.0, 4.0, 6.0, 4.0, 1.0, 4.0, 4.0, 0.0, 2.0], "bins": [-0.2406005859375, -0.23370361328125, -0.226806640625, -0.21990966796875, -0.2130126953125, -0.20611572265625, -0.19921875, -0.19232177734375, -0.1854248046875, -0.17852783203125, -0.171630859375, -0.16473388671875, -0.1578369140625, -0.15093994140625, -0.14404296875, -0.13714599609375, -0.1302490234375, -0.12335205078125, -0.116455078125, -0.10955810546875, -0.1026611328125, -0.09576416015625, -0.0888671875, -0.08197021484375, -0.0750732421875, -0.06817626953125, -0.061279296875, -0.05438232421875, -0.0474853515625, -0.04058837890625, -0.03369140625, -0.02679443359375, -0.0198974609375, -0.01300048828125, -0.006103515625, 0.00079345703125, 0.0076904296875, 0.01458740234375, 0.021484375, 0.02838134765625, 0.0352783203125, 0.04217529296875, 0.049072265625, 0.05596923828125, 0.0628662109375, 0.06976318359375, 0.07666015625, 0.08355712890625, 0.0904541015625, 0.09735107421875, 0.104248046875, 0.11114501953125, 0.1180419921875, 0.12493896484375, 0.1318359375, 0.13873291015625, 0.1456298828125, 0.15252685546875, 0.159423828125, 0.16632080078125, 0.1732177734375, 0.18011474609375, 0.18701171875, 0.19390869140625, 0.2008056640625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 7.0, 10.0, 9.0, 28.0, 27.0, 49.0, 89.0, 108.0, 157.0, 204.0, 336.0, 519.0, 732.0, 634.0, 409.0, 253.0, 153.0, 103.0, 80.0, 45.0, 33.0, 24.0, 19.0, 13.0, 7.0, 11.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.225830078125, -0.2184619903564453, -0.21109390258789062, -0.20372581481933594, -0.19635772705078125, -0.18898963928222656, -0.18162155151367188, -0.1742534637451172, -0.1668853759765625, -0.1595172882080078, -0.15214920043945312, -0.14478111267089844, -0.13741302490234375, -0.13004493713378906, -0.12267684936523438, -0.11530876159667969, -0.107940673828125, -0.10057258605957031, -0.09320449829101562, -0.08583641052246094, -0.07846832275390625, -0.07110023498535156, -0.06373214721679688, -0.05636405944824219, -0.0489959716796875, -0.04162788391113281, -0.034259796142578125, -0.026891708374023438, -0.01952362060546875, -0.012155532836914062, -0.004787445068359375, 0.0025806427001953125, 0.00994873046875, 0.017316818237304688, 0.024684906005859375, 0.03205299377441406, 0.03942108154296875, 0.04678916931152344, 0.054157257080078125, 0.06152534484863281, 0.0688934326171875, 0.07626152038574219, 0.08362960815429688, 0.09099769592285156, 0.09836578369140625, 0.10573387145996094, 0.11310195922851562, 0.12047004699707031, 0.127838134765625, 0.1352062225341797, 0.14257431030273438, 0.14994239807128906, 0.15731048583984375, 0.16467857360839844, 0.17204666137695312, 0.1794147491455078, 0.1867828369140625, 0.1941509246826172, 0.20151901245117188, 0.20888710021972656, 0.21625518798828125, 0.22362327575683594, 0.23099136352539062, 0.2383594512939453, 0.2457275390625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 7.0, 18.0, 22.0, 40.0, 46.0, 45.0, 91.0, 102.0, 108.0, 107.0, 103.0, 92.0, 66.0, 61.0, 44.0, 18.0, 17.0, 11.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8653383255004883, -1.8246281147003174, -1.7839179039001465, -1.743207573890686, -1.7024973630905151, -1.6617871522903442, -1.6210768222808838, -1.580366611480713, -1.539656400680542, -1.498946189880371, -1.4582359790802002, -1.4175256490707397, -1.3768154382705688, -1.336105227470398, -1.2953948974609375, -1.2546846866607666, -1.2139744758605957, -1.1732642650604248, -1.132554054260254, -1.0918437242507935, -1.0511335134506226, -1.0104233026504517, -0.969713032245636, -0.9290027618408203, -0.8882925510406494, -0.8475823402404785, -0.8068720698356628, -0.7661617994308472, -0.7254515886306763, -0.6847413778305054, -0.6440311074256897, -0.603320837020874, -0.5626106262207031, -0.5219004154205322, -0.48119014501571655, -0.44047990441322327, -0.39976966381073, -0.3590594232082367, -0.3183491826057434, -0.2776389420032501, -0.23692870140075684, -0.19621846079826355, -0.15550822019577026, -0.11479797959327698, -0.07408773899078369, -0.033377498388290405, 0.007332742214202881, 0.04804298281669617, 0.08875322341918945, 0.12946346402168274, 0.17017370462417603, 0.2108839452266693, 0.2515941858291626, 0.2923044264316559, 0.33301466703414917, 0.37372490763664246, 0.41443514823913574, 0.45514538884162903, 0.4958556294441223, 0.536565899848938, 0.5772761106491089, 0.6179863214492798, 0.6586965918540955, 0.6994068622589111, 0.740117073059082]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 8.0, 6.0, 7.0, 17.0, 10.0, 15.0, 22.0, 24.0, 28.0, 31.0, 35.0, 32.0, 52.0, 52.0, 37.0, 37.0, 44.0, 43.0, 50.0, 40.0, 54.0, 38.0, 32.0, 36.0, 34.0, 33.0, 28.0, 29.0, 23.0, 14.0, 26.0, 11.0, 14.0, 9.0, 6.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.703260064125061, -0.681280255317688, -0.6593004465103149, -0.6373206377029419, -0.6153408288955688, -0.5933610200881958, -0.5713812112808228, -0.5494014024734497, -0.5274215936660767, -0.5054417848587036, -0.48346197605133057, -0.4614821672439575, -0.4395023584365845, -0.4175225496292114, -0.395542711019516, -0.37356290221214294, -0.3515830636024475, -0.32960325479507446, -0.3076234459877014, -0.28564363718032837, -0.2636638283729553, -0.24168400466442108, -0.21970418095588684, -0.1977243721485138, -0.17574456334114075, -0.1537647545337677, -0.13178494572639465, -0.10980512201786041, -0.08782531321048737, -0.06584550440311432, -0.04386568069458008, -0.02188587188720703, 9.387731552124023e-05, 0.022073689848184586, 0.04405350238084793, 0.06603331863880157, 0.08801312744617462, 0.10999293625354767, 0.1319727599620819, 0.15395256876945496, 0.175932377576828, 0.19791218638420105, 0.2198919951915741, 0.24187181890010834, 0.2638516426086426, 0.2858314514160156, 0.30781126022338867, 0.3297910690307617, 0.35177087783813477, 0.3737506866455078, 0.39573049545288086, 0.4177103042602539, 0.43969011306762695, 0.461669921875, 0.48364976048469543, 0.5056295394897461, 0.5276093482971191, 0.5495891571044922, 0.5715689659118652, 0.5935487747192383, 0.6155285835266113, 0.6375083923339844, 0.6594882011413574, 0.6814680099487305, 0.7034478783607483]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 9.0, 10.0, 27.0, 28.0, 40.0, 54.0, 105.0, 150.0, 197.0, 280.0, 391.0, 622.0, 934.0, 1437.0, 2222.0, 3564.0, 5942.0, 10226.0, 17598.0, 32747.0, 66904.0, 195720.0, 427906.0, 154535.0, 57718.0, 28902.0, 16164.0, 9308.0, 5436.0, 3420.0, 2070.0, 1291.0, 811.0, 607.0, 374.0, 258.0, 173.0, 117.0, 79.0, 52.0, 46.0, 28.0, 15.0, 9.0, 9.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1656494140625, -0.16037559509277344, -0.15510177612304688, -0.1498279571533203, -0.14455413818359375, -0.1392803192138672, -0.13400650024414062, -0.12873268127441406, -0.1234588623046875, -0.11818504333496094, -0.11291122436523438, -0.10763740539550781, -0.10236358642578125, -0.09708976745605469, -0.09181594848632812, -0.08654212951660156, -0.081268310546875, -0.07599449157714844, -0.07072067260742188, -0.06544685363769531, -0.06017303466796875, -0.05489921569824219, -0.049625396728515625, -0.04435157775878906, -0.0390777587890625, -0.03380393981933594, -0.028530120849609375, -0.023256301879882812, -0.01798248291015625, -0.012708663940429688, -0.007434844970703125, -0.0021610260009765625, 0.00311279296875, 0.008386611938476562, 0.013660430908203125, 0.018934249877929688, 0.02420806884765625, 0.029481887817382812, 0.034755706787109375, 0.04002952575683594, 0.0453033447265625, 0.05057716369628906, 0.055850982666015625, 0.06112480163574219, 0.06639862060546875, 0.07167243957519531, 0.07694625854492188, 0.08222007751464844, 0.087493896484375, 0.09276771545410156, 0.09804153442382812, 0.10331535339355469, 0.10858917236328125, 0.11386299133300781, 0.11913681030273438, 0.12441062927246094, 0.1296844482421875, 0.13495826721191406, 0.14023208618164062, 0.1455059051513672, 0.15077972412109375, 0.1560535430908203, 0.16132736206054688, 0.16660118103027344, 0.171875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 8.0, 5.0, 4.0, 9.0, 17.0, 12.0, 16.0, 25.0, 22.0, 31.0, 31.0, 42.0, 31.0, 20.0, 35.0, 39.0, 37.0, 40.0, 52.0, 49.0, 53.0, 38.0, 56.0, 42.0, 37.0, 31.0, 39.0, 28.0, 27.0, 28.0, 16.0, 17.0, 10.0, 8.0, 12.0, 9.0, 6.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08428955078125, -0.0815887451171875, -0.078887939453125, -0.0761871337890625, -0.073486328125, -0.0707855224609375, -0.068084716796875, -0.0653839111328125, -0.06268310546875, -0.0599822998046875, -0.057281494140625, -0.0545806884765625, -0.0518798828125, -0.0491790771484375, -0.046478271484375, -0.0437774658203125, -0.04107666015625, -0.0383758544921875, -0.035675048828125, -0.0329742431640625, -0.0302734375, -0.0275726318359375, -0.024871826171875, -0.0221710205078125, -0.01947021484375, -0.0167694091796875, -0.014068603515625, -0.0113677978515625, -0.0086669921875, -0.0059661865234375, -0.003265380859375, -0.0005645751953125, 0.00213623046875, 0.0048370361328125, 0.007537841796875, 0.0102386474609375, 0.012939453125, 0.0156402587890625, 0.018341064453125, 0.0210418701171875, 0.02374267578125, 0.0264434814453125, 0.029144287109375, 0.0318450927734375, 0.0345458984375, 0.0372467041015625, 0.039947509765625, 0.0426483154296875, 0.04534912109375, 0.0480499267578125, 0.050750732421875, 0.0534515380859375, 0.05615234375, 0.0588531494140625, 0.061553955078125, 0.0642547607421875, 0.06695556640625, 0.0696563720703125, 0.072357177734375, 0.0750579833984375, 0.0777587890625, 0.0804595947265625, 0.083160400390625, 0.0858612060546875, 0.08856201171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 5.0, 11.0, 19.0, 22.0, 27.0, 56.0, 87.0, 129.0, 278.0, 531.0, 1131.0, 2614.0, 6366.0, 15826.0, 43130.0, 169967.0, 620492.0, 128162.0, 36082.0, 13593.0, 5484.0, 2446.0, 1009.0, 498.0, 231.0, 133.0, 82.0, 42.0, 32.0, 22.0, 16.0, 8.0, 7.0, 6.0, 7.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.362060546875, -0.3531036376953125, -0.344146728515625, -0.3351898193359375, -0.32623291015625, -0.3172760009765625, -0.308319091796875, -0.2993621826171875, -0.2904052734375, -0.2814483642578125, -0.272491455078125, -0.2635345458984375, -0.25457763671875, -0.2456207275390625, -0.236663818359375, -0.2277069091796875, -0.21875, -0.2097930908203125, -0.200836181640625, -0.1918792724609375, -0.18292236328125, -0.1739654541015625, -0.165008544921875, -0.1560516357421875, -0.1470947265625, -0.1381378173828125, -0.129180908203125, -0.1202239990234375, -0.11126708984375, -0.1023101806640625, -0.093353271484375, -0.0843963623046875, -0.075439453125, -0.0664825439453125, -0.057525634765625, -0.0485687255859375, -0.03961181640625, -0.0306549072265625, -0.021697998046875, -0.0127410888671875, -0.0037841796875, 0.0051727294921875, 0.014129638671875, 0.0230865478515625, 0.03204345703125, 0.0410003662109375, 0.049957275390625, 0.0589141845703125, 0.06787109375, 0.0768280029296875, 0.085784912109375, 0.0947418212890625, 0.10369873046875, 0.1126556396484375, 0.121612548828125, 0.1305694580078125, 0.1395263671875, 0.1484832763671875, 0.157440185546875, 0.1663970947265625, 0.17535400390625, 0.1843109130859375, 0.193267822265625, 0.2022247314453125, 0.211181640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 6.0, 8.0, 8.0, 7.0, 10.0, 14.0, 17.0, 18.0, 27.0, 22.0, 24.0, 26.0, 30.0, 33.0, 32.0, 41.0, 42.0, 43.0, 46.0, 43.0, 50.0, 43.0, 39.0, 37.0, 52.0, 41.0, 34.0, 24.0, 34.0, 21.0, 19.0, 16.0, 18.0, 17.0, 13.0, 10.0, 1.0, 8.0, 4.0, 7.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2333984375, -0.22604942321777344, -0.21870040893554688, -0.2113513946533203, -0.20400238037109375, -0.1966533660888672, -0.18930435180664062, -0.18195533752441406, -0.1746063232421875, -0.16725730895996094, -0.15990829467773438, -0.1525592803955078, -0.14521026611328125, -0.1378612518310547, -0.13051223754882812, -0.12316322326660156, -0.115814208984375, -0.10846519470214844, -0.10111618041992188, -0.09376716613769531, -0.08641815185546875, -0.07906913757324219, -0.07172012329101562, -0.06437110900878906, -0.0570220947265625, -0.04967308044433594, -0.042324066162109375, -0.03497505187988281, -0.02762603759765625, -0.020277023315429688, -0.012928009033203125, -0.0055789947509765625, 0.00177001953125, 0.009119033813476562, 0.016468048095703125, 0.023817062377929688, 0.03116607666015625, 0.03851509094238281, 0.045864105224609375, 0.05321311950683594, 0.0605621337890625, 0.06791114807128906, 0.07526016235351562, 0.08260917663574219, 0.08995819091796875, 0.09730720520019531, 0.10465621948242188, 0.11200523376464844, 0.119354248046875, 0.12670326232910156, 0.13405227661132812, 0.1414012908935547, 0.14875030517578125, 0.1560993194580078, 0.16344833374023438, 0.17079734802246094, 0.1781463623046875, 0.18549537658691406, 0.19284439086914062, 0.2001934051513672, 0.20754241943359375, 0.2148914337158203, 0.22224044799804688, 0.22958946228027344, 0.2369384765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 9.0, 11.0, 24.0, 28.0, 35.0, 73.0, 96.0, 171.0, 231.0, 400.0, 682.0, 1048.0, 1752.0, 2873.0, 4726.0, 7862.0, 13009.0, 22148.0, 38096.0, 66737.0, 130469.0, 305763.0, 226570.0, 96986.0, 53543.0, 30440.0, 17848.0, 10755.0, 6271.0, 3886.0, 2263.0, 1431.0, 861.0, 565.0, 320.0, 208.0, 123.0, 87.0, 64.0, 33.0, 26.0, 8.0, 7.0, 5.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0633544921875, -0.061480045318603516, -0.05960559844970703, -0.05773115158081055, -0.05585670471191406, -0.05398225784301758, -0.052107810974121094, -0.05023336410522461, -0.048358917236328125, -0.04648447036743164, -0.044610023498535156, -0.04273557662963867, -0.04086112976074219, -0.0389866828918457, -0.03711223602294922, -0.035237789154052734, -0.03336334228515625, -0.031488895416259766, -0.02961444854736328, -0.027740001678466797, -0.025865554809570312, -0.023991107940673828, -0.022116661071777344, -0.02024221420288086, -0.018367767333984375, -0.01649332046508789, -0.014618873596191406, -0.012744426727294922, -0.010869979858398438, -0.008995532989501953, -0.007121086120605469, -0.005246639251708984, -0.0033721923828125, -0.0014977455139160156, 0.00037670135498046875, 0.002251148223876953, 0.0041255950927734375, 0.006000041961669922, 0.007874488830566406, 0.00974893569946289, 0.011623382568359375, 0.01349782943725586, 0.015372276306152344, 0.017246723175048828, 0.019121170043945312, 0.020995616912841797, 0.02287006378173828, 0.024744510650634766, 0.02661895751953125, 0.028493404388427734, 0.03036785125732422, 0.0322422981262207, 0.03411674499511719, 0.03599119186401367, 0.037865638732910156, 0.03974008560180664, 0.041614532470703125, 0.04348897933959961, 0.045363426208496094, 0.04723787307739258, 0.04911231994628906, 0.05098676681518555, 0.05286121368408203, 0.054735660552978516, 0.056610107421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 13.0, 8.0, 12.0, 15.0, 23.0, 36.0, 53.0, 61.0, 92.0, 123.0, 120.0, 110.0, 91.0, 56.0, 58.0, 29.0, 19.0, 19.0, 9.0, 3.0, 5.0, 7.0, 7.0, 8.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6716461181640625e-05, -3.57581302523613e-05, -3.479979932308197e-05, -3.384146839380264e-05, -3.2883137464523315e-05, -3.192480653524399e-05, -3.096647560596466e-05, -3.0008144676685333e-05, -2.9049813747406006e-05, -2.809148281812668e-05, -2.713315188884735e-05, -2.6174820959568024e-05, -2.5216490030288696e-05, -2.425815910100937e-05, -2.329982817173004e-05, -2.2341497242450714e-05, -2.1383166313171387e-05, -2.042483538389206e-05, -1.9466504454612732e-05, -1.8508173525333405e-05, -1.7549842596054077e-05, -1.659151166677475e-05, -1.5633180737495422e-05, -1.4674849808216095e-05, -1.3716518878936768e-05, -1.275818794965744e-05, -1.1799857020378113e-05, -1.0841526091098785e-05, -9.883195161819458e-06, -8.92486423254013e-06, -7.966533303260803e-06, -7.008202373981476e-06, -6.0498714447021484e-06, -5.091540515422821e-06, -4.133209586143494e-06, -3.1748786568641663e-06, -2.216547727584839e-06, -1.2582167983055115e-06, -2.998858690261841e-07, 6.584450602531433e-07, 1.6167759895324707e-06, 2.575106918811798e-06, 3.5334378480911255e-06, 4.491768777370453e-06, 5.45009970664978e-06, 6.408430635929108e-06, 7.366761565208435e-06, 8.325092494487762e-06, 9.28342342376709e-06, 1.0241754353046417e-05, 1.1200085282325745e-05, 1.2158416211605072e-05, 1.31167471408844e-05, 1.4075078070163727e-05, 1.5033408999443054e-05, 1.599173992872238e-05, 1.695007085800171e-05, 1.7908401787281036e-05, 1.8866732716560364e-05, 1.982506364583969e-05, 2.078339457511902e-05, 2.1741725504398346e-05, 2.2700056433677673e-05, 2.3658387362957e-05, 2.4616718292236328e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 4.0, 6.0, 12.0, 16.0, 26.0, 39.0, 48.0, 64.0, 106.0, 148.0, 203.0, 343.0, 567.0, 1001.0, 1852.0, 3555.0, 7167.0, 14412.0, 28607.0, 57773.0, 121249.0, 296100.0, 286066.0, 117210.0, 55796.0, 27705.0, 13614.0, 6992.0, 3538.0, 1782.0, 993.0, 579.0, 338.0, 212.0, 122.0, 93.0, 67.0, 39.0, 33.0, 25.0, 10.0, 15.0, 5.0, 7.0, 3.0, 9.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06744384765625, -0.06526660919189453, -0.06308937072753906, -0.060912132263183594, -0.058734893798828125, -0.056557655334472656, -0.05438041687011719, -0.05220317840576172, -0.05002593994140625, -0.04784870147705078, -0.04567146301269531, -0.043494224548339844, -0.041316986083984375, -0.039139747619628906, -0.03696250915527344, -0.03478527069091797, -0.0326080322265625, -0.03043079376220703, -0.028253555297851562, -0.026076316833496094, -0.023899078369140625, -0.021721839904785156, -0.019544601440429688, -0.01736736297607422, -0.01519012451171875, -0.013012886047363281, -0.010835647583007812, -0.008658409118652344, -0.006481170654296875, -0.004303932189941406, -0.0021266937255859375, 5.054473876953125e-05, 0.002227783203125, 0.004405021667480469, 0.0065822601318359375, 0.008759498596191406, 0.010936737060546875, 0.013113975524902344, 0.015291213989257812, 0.01746845245361328, 0.01964569091796875, 0.02182292938232422, 0.024000167846679688, 0.026177406311035156, 0.028354644775390625, 0.030531883239746094, 0.03270912170410156, 0.03488636016845703, 0.0370635986328125, 0.03924083709716797, 0.04141807556152344, 0.043595314025878906, 0.045772552490234375, 0.047949790954589844, 0.05012702941894531, 0.05230426788330078, 0.05448150634765625, 0.05665874481201172, 0.05883598327636719, 0.061013221740722656, 0.06319046020507812, 0.0653676986694336, 0.06754493713378906, 0.06972217559814453, 0.0718994140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 6.0, 3.0, 5.0, 6.0, 8.0, 14.0, 14.0, 14.0, 14.0, 10.0, 18.0, 17.0, 29.0, 35.0, 27.0, 34.0, 55.0, 64.0, 65.0, 63.0, 65.0, 67.0, 56.0, 48.0, 35.0, 41.0, 31.0, 17.0, 19.0, 19.0, 15.0, 12.0, 11.0, 13.0, 4.0, 8.0, 6.0, 1.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05364990234375, -0.051738739013671875, -0.04982757568359375, -0.047916412353515625, -0.0460052490234375, -0.044094085693359375, -0.04218292236328125, -0.040271759033203125, -0.038360595703125, -0.036449432373046875, -0.03453826904296875, -0.032627105712890625, -0.0307159423828125, -0.028804779052734375, -0.02689361572265625, -0.024982452392578125, -0.0230712890625, -0.021160125732421875, -0.01924896240234375, -0.017337799072265625, -0.0154266357421875, -0.013515472412109375, -0.01160430908203125, -0.009693145751953125, -0.007781982421875, -0.005870819091796875, -0.00395965576171875, -0.002048492431640625, -0.0001373291015625, 0.001773834228515625, 0.00368499755859375, 0.005596160888671875, 0.00750732421875, 0.009418487548828125, 0.01132965087890625, 0.013240814208984375, 0.0151519775390625, 0.017063140869140625, 0.01897430419921875, 0.020885467529296875, 0.022796630859375, 0.024707794189453125, 0.02661895751953125, 0.028530120849609375, 0.0304412841796875, 0.032352447509765625, 0.03426361083984375, 0.036174774169921875, 0.0380859375, 0.039997100830078125, 0.04190826416015625, 0.043819427490234375, 0.0457305908203125, 0.047641754150390625, 0.04955291748046875, 0.051464080810546875, 0.053375244140625, 0.055286407470703125, 0.05719757080078125, 0.059108734130859375, 0.0610198974609375, 0.06293106079101562, 0.06484222412109375, 0.06675338745117188, 0.06866455078125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 19.0, 41.0, 84.0, 145.0, 211.0, 220.0, 137.0, 82.0, 37.0, 12.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0237245559692383, -0.959030270576477, -0.894335925579071, -0.829641580581665, -0.7649472951889038, -0.7002530097961426, -0.6355586647987366, -0.5708643198013306, -0.5061700344085693, -0.4414757192134857, -0.3767814040184021, -0.3120870888233185, -0.24739277362823486, -0.18269845843315125, -0.11800414323806763, -0.05330982804298401, 0.01138448715209961, 0.07607880234718323, 0.14077311754226685, 0.20546743273735046, 0.2701617479324341, 0.3348560631275177, 0.3995503783226013, 0.46424469351768494, 0.5289390087127686, 0.5936332941055298, 0.6583276391029358, 0.7230219841003418, 0.787716269493103, 0.8524105548858643, 0.9171048998832703, 0.9817992448806763, 1.0464937686920166, 1.1111880540847778, 1.175882339477539, 1.2405767440795898, 1.305271029472351, 1.3699653148651123, 1.434659719467163, 1.4993540048599243, 1.5640482902526855, 1.6287425756454468, 1.693436861038208, 1.7581312656402588, 1.82282555103302, 1.8875198364257812, 1.952214241027832, 2.0169084072113037, 2.0816028118133545, 2.1462972164154053, 2.210991382598877, 2.2756857872009277, 2.3403801918029785, 2.40507435798645, 2.469768762588501, 2.5344629287719727, 2.5991573333740234, 2.663851737976074, 2.728545904159546, 2.7932403087615967, 2.8579344749450684, 2.922628879547119, 2.98732328414917, 3.0520174503326416, 3.1167118549346924]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 11.0, 10.0, 8.0, 7.0, 8.0, 18.0, 15.0, 28.0, 17.0, 22.0, 21.0, 22.0, 28.0, 27.0, 26.0, 35.0, 41.0, 33.0, 28.0, 33.0, 41.0, 33.0, 41.0, 37.0, 41.0, 35.0, 28.0, 35.0, 34.0, 28.0, 27.0, 17.0, 21.0, 20.0, 18.0, 16.0, 10.0, 10.0, 10.0, 5.0, 8.0, 8.0, 2.0, 2.0, 2.0, 4.0, 1.0, 7.0, 0.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.5539728999137878, -0.5364972949028015, -0.5190216302871704, -0.5015460252761841, -0.48407039046287537, -0.46659475564956665, -0.4491191506385803, -0.4316435158252716, -0.4141678810119629, -0.3966922461986542, -0.37921661138534546, -0.36174100637435913, -0.3442653715610504, -0.3267897367477417, -0.30931413173675537, -0.29183849692344666, -0.27436286211013794, -0.2568872272968292, -0.2394116073846817, -0.22193598747253418, -0.20446035265922546, -0.18698471784591675, -0.16950909793376923, -0.1520334780216217, -0.134557843208313, -0.11708221584558487, -0.09960658848285675, -0.08213096112012863, -0.06465533375740051, -0.047179706394672394, -0.029704079031944275, -0.012228451669216156, 0.005247235298156738, 0.022722862660884857, 0.040198490023612976, 0.057674117386341095, 0.07514974474906921, 0.09262537211179733, 0.11010099947452545, 0.12757661938667297, 0.1450522541999817, 0.1625278890132904, 0.18000350892543793, 0.19747912883758545, 0.21495476365089417, 0.23243039846420288, 0.2499060183763504, 0.2673816382884979, 0.28485727310180664, 0.30233290791511536, 0.3198085427284241, 0.3372841477394104, 0.3547597825527191, 0.37223541736602783, 0.38971102237701416, 0.4071866571903229, 0.4246622920036316, 0.4421379268169403, 0.459613561630249, 0.47708916664123535, 0.49456480145454407, 0.5120404362678528, 0.5295160412788391, 0.5469917058944702, 0.5644673109054565]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 5.0, 9.0, 8.0, 15.0, 26.0, 58.0, 76.0, 123.0, 193.0, 319.0, 575.0, 997.0, 1880.0, 4003.0, 8105.0, 19335.0, 50858.0, 156417.0, 709596.0, 2544984.0, 499282.0, 124361.0, 41856.0, 16440.0, 7289.0, 3475.0, 1728.0, 1008.0, 519.0, 307.0, 157.0, 108.0, 51.0, 35.0, 21.0, 19.0, 10.0, 11.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.180419921875, -0.17467498779296875, -0.1689300537109375, -0.16318511962890625, -0.157440185546875, -0.15169525146484375, -0.1459503173828125, -0.14020538330078125, -0.13446044921875, -0.12871551513671875, -0.1229705810546875, -0.11722564697265625, -0.111480712890625, -0.10573577880859375, -0.0999908447265625, -0.09424591064453125, -0.0885009765625, -0.08275604248046875, -0.0770111083984375, -0.07126617431640625, -0.065521240234375, -0.05977630615234375, -0.0540313720703125, -0.04828643798828125, -0.04254150390625, -0.03679656982421875, -0.0310516357421875, -0.02530670166015625, -0.019561767578125, -0.01381683349609375, -0.0080718994140625, -0.00232696533203125, 0.00341796875, 0.00916290283203125, 0.0149078369140625, 0.02065277099609375, 0.026397705078125, 0.03214263916015625, 0.0378875732421875, 0.04363250732421875, 0.04937744140625, 0.05512237548828125, 0.0608673095703125, 0.06661224365234375, 0.072357177734375, 0.07810211181640625, 0.0838470458984375, 0.08959197998046875, 0.0953369140625, 0.10108184814453125, 0.1068267822265625, 0.11257171630859375, 0.118316650390625, 0.12406158447265625, 0.1298065185546875, 0.13555145263671875, 0.14129638671875, 0.14704132080078125, 0.1527862548828125, 0.15853118896484375, 0.164276123046875, 0.17002105712890625, 0.1757659912109375, 0.18151092529296875, 0.187255859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 10.0, 11.0, 16.0, 19.0, 30.0, 22.0, 28.0, 32.0, 39.0, 37.0, 44.0, 50.0, 48.0, 45.0, 52.0, 56.0, 58.0, 45.0, 39.0, 47.0, 43.0, 35.0, 23.0, 26.0, 15.0, 28.0, 17.0, 23.0, 12.0, 5.0, 13.0, 11.0, 5.0, 4.0, 6.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06231689453125, -0.05953025817871094, -0.056743621826171875, -0.05395698547363281, -0.05117034912109375, -0.04838371276855469, -0.045597076416015625, -0.04281044006347656, -0.0400238037109375, -0.03723716735839844, -0.034450531005859375, -0.03166389465332031, -0.02887725830078125, -0.026090621948242188, -0.023303985595703125, -0.020517349243164062, -0.017730712890625, -0.014944076538085938, -0.012157440185546875, -0.009370803833007812, -0.00658416748046875, -0.0037975311279296875, -0.001010894775390625, 0.0017757415771484375, 0.0045623779296875, 0.0073490142822265625, 0.010135650634765625, 0.012922286987304688, 0.01570892333984375, 0.018495559692382812, 0.021282196044921875, 0.024068832397460938, 0.02685546875, 0.029642105102539062, 0.032428741455078125, 0.03521537780761719, 0.03800201416015625, 0.04078865051269531, 0.043575286865234375, 0.04636192321777344, 0.0491485595703125, 0.05193519592285156, 0.054721832275390625, 0.05750846862792969, 0.06029510498046875, 0.06308174133300781, 0.06586837768554688, 0.06865501403808594, 0.071441650390625, 0.07422828674316406, 0.07701492309570312, 0.07980155944824219, 0.08258819580078125, 0.08537483215332031, 0.08816146850585938, 0.09094810485839844, 0.0937347412109375, 0.09652137756347656, 0.09930801391601562, 0.10209465026855469, 0.10488128662109375, 0.10766792297363281, 0.11045455932617188, 0.11324119567871094, 0.11602783203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 10.0, 11.0, 11.0, 10.0, 16.0, 19.0, 33.0, 41.0, 71.0, 76.0, 104.0, 184.0, 267.0, 396.0, 673.0, 1403.0, 3459.0, 9836.0, 36305.0, 173097.0, 1591053.0, 2106720.0, 209306.0, 42036.0, 11443.0, 3894.0, 1602.0, 813.0, 456.0, 285.0, 194.0, 136.0, 81.0, 62.0, 53.0, 28.0, 23.0, 19.0, 19.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0], "bins": [-0.392333984375, -0.38114166259765625, -0.3699493408203125, -0.35875701904296875, -0.347564697265625, -0.33637237548828125, -0.3251800537109375, -0.31398773193359375, -0.30279541015625, -0.29160308837890625, -0.2804107666015625, -0.26921844482421875, -0.258026123046875, -0.24683380126953125, -0.2356414794921875, -0.22444915771484375, -0.2132568359375, -0.20206451416015625, -0.1908721923828125, -0.17967987060546875, -0.168487548828125, -0.15729522705078125, -0.1461029052734375, -0.13491058349609375, -0.12371826171875, -0.11252593994140625, -0.1013336181640625, -0.09014129638671875, -0.078948974609375, -0.06775665283203125, -0.0565643310546875, -0.04537200927734375, -0.0341796875, -0.02298736572265625, -0.0117950439453125, -0.00060272216796875, 0.010589599609375, 0.02178192138671875, 0.0329742431640625, 0.04416656494140625, 0.05535888671875, 0.06655120849609375, 0.0777435302734375, 0.08893585205078125, 0.100128173828125, 0.11132049560546875, 0.1225128173828125, 0.13370513916015625, 0.1448974609375, 0.15608978271484375, 0.1672821044921875, 0.17847442626953125, 0.189666748046875, 0.20085906982421875, 0.2120513916015625, 0.22324371337890625, 0.23443603515625, 0.24562835693359375, 0.2568206787109375, 0.26801300048828125, 0.279205322265625, 0.29039764404296875, 0.3015899658203125, 0.31278228759765625, 0.323974609375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 14.0, 15.0, 40.0, 38.0, 73.0, 124.0, 206.0, 376.0, 710.0, 1095.0, 596.0, 326.0, 174.0, 101.0, 65.0, 37.0, 31.0, 7.0, 10.0, 8.0, 9.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385986328125, -0.3753929138183594, -0.36479949951171875, -0.3542060852050781, -0.3436126708984375, -0.3330192565917969, -0.32242584228515625, -0.3118324279785156, -0.301239013671875, -0.2906455993652344, -0.28005218505859375, -0.2694587707519531, -0.2588653564453125, -0.24827194213867188, -0.23767852783203125, -0.22708511352539062, -0.21649169921875, -0.20589828491210938, -0.19530487060546875, -0.18471145629882812, -0.1741180419921875, -0.16352462768554688, -0.15293121337890625, -0.14233779907226562, -0.131744384765625, -0.12115097045898438, -0.11055755615234375, -0.09996414184570312, -0.0893707275390625, -0.07877731323242188, -0.06818389892578125, -0.057590484619140625, -0.0469970703125, -0.036403656005859375, -0.02581024169921875, -0.015216827392578125, -0.0046234130859375, 0.005970001220703125, 0.01656341552734375, 0.027156829833984375, 0.037750244140625, 0.048343658447265625, 0.05893707275390625, 0.06953048706054688, 0.0801239013671875, 0.09071731567382812, 0.10131072998046875, 0.11190414428710938, 0.12249755859375, 0.13309097290039062, 0.14368438720703125, 0.15427780151367188, 0.1648712158203125, 0.17546463012695312, 0.18605804443359375, 0.19665145874023438, 0.207244873046875, 0.21783828735351562, 0.22843170166015625, 0.23902511596679688, 0.2496185302734375, 0.2602119445800781, 0.27080535888671875, 0.2813987731933594, 0.2919921875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 8.0, 3.0, 4.0, 8.0, 13.0, 27.0, 40.0, 56.0, 79.0, 85.0, 110.0, 109.0, 115.0, 98.0, 84.0, 64.0, 30.0, 32.0, 14.0, 13.0, 4.0, 2.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2572760581970215, -1.2133593559265137, -1.1694425344467163, -1.1255258321762085, -1.0816090106964111, -1.0376923084259033, -0.9937755465507507, -0.9498587846755981, -0.9059420228004456, -0.862025260925293, -0.8181084990501404, -0.7741917371749878, -0.73027503490448, -0.6863582134246826, -0.6424415111541748, -0.5985247492790222, -0.5546079874038696, -0.510691225528717, -0.46677446365356445, -0.42285773158073425, -0.37894096970558167, -0.3350242078304291, -0.2911074757575989, -0.2471907138824463, -0.2032739520072937, -0.1593571901321411, -0.11544044315814972, -0.07152369618415833, -0.027606934309005737, 0.01630982756614685, 0.06022655963897705, 0.10414332151412964, 0.14806020259857178, 0.19197696447372437, 0.23589371144771576, 0.27981045842170715, 0.32372722029685974, 0.36764398217201233, 0.41156071424484253, 0.4554774761199951, 0.4993942379951477, 0.5433109998703003, 0.5872277617454529, 0.6311445236206055, 0.6750612258911133, 0.7189780473709106, 0.7628947496414185, 0.806811511516571, 0.8507282733917236, 0.8946450352668762, 0.9385617971420288, 0.9824784994125366, 1.026395320892334, 1.0703120231628418, 1.1142287254333496, 1.158145546913147, 1.2020623683929443, 1.2459790706634521, 1.2898958921432495, 1.3338125944137573, 1.3777294158935547, 1.4216461181640625, 1.4655628204345703, 1.5094796419143677, 1.5533963441848755]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 8.0, 11.0, 18.0, 19.0, 12.0, 22.0, 24.0, 23.0, 35.0, 33.0, 35.0, 37.0, 36.0, 49.0, 50.0, 47.0, 47.0, 60.0, 46.0, 48.0, 46.0, 48.0, 42.0, 32.0, 21.0, 29.0, 16.0, 24.0, 15.0, 21.0, 10.0, 7.0, 5.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7898635864257812, -0.764848530292511, -0.7398334741592407, -0.7148184180259705, -0.6898033618927002, -0.6647883057594299, -0.6397732496261597, -0.6147582530975342, -0.5897431373596191, -0.5647280812263489, -0.5397130250930786, -0.5146979689598083, -0.4896829128265381, -0.4646678566932678, -0.43965283036231995, -0.4146377742290497, -0.3896227478981018, -0.36460769176483154, -0.3395926356315613, -0.314577579498291, -0.28956252336502075, -0.2645474672317505, -0.2395324409008026, -0.21451738476753235, -0.18950232863426208, -0.16448727250099182, -0.13947221636772156, -0.11445717513561249, -0.08944211900234222, -0.06442706286907196, -0.03941202163696289, -0.014396965503692627, 0.010618150234222412, 0.03563320264220238, 0.06064825505018234, 0.08566330373287201, 0.11067835986614227, 0.13569341599941254, 0.1607084572315216, 0.18572351336479187, 0.21073856949806213, 0.2357536256313324, 0.26076868176460266, 0.28578370809555054, 0.3107987642288208, 0.33581382036209106, 0.36082887649536133, 0.3858439326286316, 0.41085898876190186, 0.4358740448951721, 0.4608891010284424, 0.48590415716171265, 0.5109192132949829, 0.5359342694282532, 0.5609493255615234, 0.5859643220901489, 0.610979437828064, 0.6359944939613342, 0.6610095500946045, 0.6860246062278748, 0.711039662361145, 0.7360547184944153, 0.7610697746276855, 0.786084771156311, 0.8110998272895813]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 12.0, 11.0, 9.0, 21.0, 31.0, 43.0, 67.0, 101.0, 154.0, 212.0, 288.0, 425.0, 650.0, 902.0, 1367.0, 2148.0, 3124.0, 4833.0, 7551.0, 12273.0, 21428.0, 44231.0, 121603.0, 340056.0, 298019.0, 99832.0, 38426.0, 19228.0, 11183.0, 6961.0, 4434.0, 2976.0, 2060.0, 1295.0, 788.0, 513.0, 366.0, 300.0, 207.0, 119.0, 93.0, 70.0, 47.0, 38.0, 22.0, 21.0, 10.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1583251953125, -0.1533641815185547, -0.14840316772460938, -0.14344215393066406, -0.13848114013671875, -0.13352012634277344, -0.12855911254882812, -0.12359809875488281, -0.1186370849609375, -0.11367607116699219, -0.10871505737304688, -0.10375404357910156, -0.09879302978515625, -0.09383201599121094, -0.08887100219726562, -0.08390998840332031, -0.078948974609375, -0.07398796081542969, -0.06902694702148438, -0.06406593322753906, -0.05910491943359375, -0.05414390563964844, -0.049182891845703125, -0.04422187805175781, -0.0392608642578125, -0.03429985046386719, -0.029338836669921875, -0.024377822875976562, -0.01941680908203125, -0.014455795288085938, -0.009494781494140625, -0.0045337677001953125, 0.00042724609375, 0.0053882598876953125, 0.010349273681640625, 0.015310287475585938, 0.02027130126953125, 0.025232315063476562, 0.030193328857421875, 0.03515434265136719, 0.0401153564453125, 0.04507637023925781, 0.050037384033203125, 0.05499839782714844, 0.05995941162109375, 0.06492042541503906, 0.06988143920898438, 0.07484245300292969, 0.079803466796875, 0.08476448059082031, 0.08972549438476562, 0.09468650817871094, 0.09964752197265625, 0.10460853576660156, 0.10956954956054688, 0.11453056335449219, 0.1194915771484375, 0.12445259094238281, 0.12941360473632812, 0.13437461853027344, 0.13933563232421875, 0.14429664611816406, 0.14925765991210938, 0.1542186737060547, 0.1591796875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 7.0, 2.0, 7.0, 8.0, 14.0, 11.0, 18.0, 22.0, 30.0, 32.0, 31.0, 30.0, 39.0, 41.0, 39.0, 44.0, 50.0, 46.0, 43.0, 44.0, 44.0, 54.0, 42.0, 41.0, 35.0, 33.0, 28.0, 31.0, 31.0, 10.0, 15.0, 15.0, 10.0, 6.0, 10.0, 9.0, 3.0, 5.0, 10.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0975341796875, -0.09446144104003906, -0.09138870239257812, -0.08831596374511719, -0.08524322509765625, -0.08217048645019531, -0.07909774780273438, -0.07602500915527344, -0.0729522705078125, -0.06987953186035156, -0.06680679321289062, -0.06373405456542969, -0.06066131591796875, -0.05758857727050781, -0.054515838623046875, -0.05144309997558594, -0.048370361328125, -0.04529762268066406, -0.042224884033203125, -0.03915214538574219, -0.03607940673828125, -0.03300666809082031, -0.029933929443359375, -0.026861190795898438, -0.0237884521484375, -0.020715713500976562, -0.017642974853515625, -0.014570236206054688, -0.01149749755859375, -0.008424758911132812, -0.005352020263671875, -0.0022792816162109375, 0.00079345703125, 0.0038661956787109375, 0.006938934326171875, 0.010011672973632812, 0.01308441162109375, 0.016157150268554688, 0.019229888916015625, 0.022302627563476562, 0.0253753662109375, 0.028448104858398438, 0.031520843505859375, 0.03459358215332031, 0.03766632080078125, 0.04073905944824219, 0.043811798095703125, 0.04688453674316406, 0.049957275390625, 0.05303001403808594, 0.056102752685546875, 0.05917549133300781, 0.06224822998046875, 0.06532096862792969, 0.06839370727539062, 0.07146644592285156, 0.0745391845703125, 0.07761192321777344, 0.08068466186523438, 0.08375740051269531, 0.08683013916015625, 0.08990287780761719, 0.09297561645507812, 0.09604835510253906, 0.09912109375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 7.0, 6.0, 18.0, 23.0, 23.0, 28.0, 45.0, 59.0, 106.0, 155.0, 308.0, 522.0, 1084.0, 2161.0, 4647.0, 10281.0, 25804.0, 91919.0, 484155.0, 331240.0, 60350.0, 19803.0, 8262.0, 3775.0, 1702.0, 878.0, 466.0, 256.0, 163.0, 81.0, 67.0, 39.0, 25.0, 22.0, 18.0, 7.0, 8.0, 5.0, 5.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.267578125, -0.2596759796142578, -0.2517738342285156, -0.24387168884277344, -0.23596954345703125, -0.22806739807128906, -0.22016525268554688, -0.2122631072998047, -0.2043609619140625, -0.1964588165283203, -0.18855667114257812, -0.18065452575683594, -0.17275238037109375, -0.16485023498535156, -0.15694808959960938, -0.1490459442138672, -0.141143798828125, -0.1332416534423828, -0.12533950805664062, -0.11743736267089844, -0.10953521728515625, -0.10163307189941406, -0.09373092651367188, -0.08582878112792969, -0.0779266357421875, -0.07002449035644531, -0.062122344970703125, -0.05422019958496094, -0.04631805419921875, -0.03841590881347656, -0.030513763427734375, -0.022611618041992188, -0.01470947265625, -0.0068073272705078125, 0.001094818115234375, 0.008996963500976562, 0.01689910888671875, 0.024801254272460938, 0.032703399658203125, 0.04060554504394531, 0.0485076904296875, 0.05640983581542969, 0.06431198120117188, 0.07221412658691406, 0.08011627197265625, 0.08801841735839844, 0.09592056274414062, 0.10382270812988281, 0.111724853515625, 0.11962699890136719, 0.12752914428710938, 0.13543128967285156, 0.14333343505859375, 0.15123558044433594, 0.15913772583007812, 0.1670398712158203, 0.1749420166015625, 0.1828441619873047, 0.19074630737304688, 0.19864845275878906, 0.20655059814453125, 0.21445274353027344, 0.22235488891601562, 0.2302570343017578, 0.2381591796875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 7.0, 9.0, 5.0, 13.0, 17.0, 19.0, 20.0, 26.0, 29.0, 22.0, 42.0, 39.0, 47.0, 51.0, 46.0, 50.0, 59.0, 46.0, 55.0, 50.0, 49.0, 41.0, 42.0, 31.0, 34.0, 27.0, 24.0, 18.0, 13.0, 13.0, 14.0, 12.0, 6.0, 7.0, 4.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.306640625, -0.2970619201660156, -0.28748321533203125, -0.2779045104980469, -0.2683258056640625, -0.2587471008300781, -0.24916839599609375, -0.23958969116210938, -0.230010986328125, -0.22043228149414062, -0.21085357666015625, -0.20127487182617188, -0.1916961669921875, -0.18211746215820312, -0.17253875732421875, -0.16296005249023438, -0.15338134765625, -0.14380264282226562, -0.13422393798828125, -0.12464523315429688, -0.1150665283203125, -0.10548782348632812, -0.09590911865234375, -0.08633041381835938, -0.076751708984375, -0.06717300415039062, -0.05759429931640625, -0.048015594482421875, -0.0384368896484375, -0.028858184814453125, -0.01927947998046875, -0.009700775146484375, -0.0001220703125, 0.009456634521484375, 0.01903533935546875, 0.028614044189453125, 0.0381927490234375, 0.047771453857421875, 0.05735015869140625, 0.06692886352539062, 0.076507568359375, 0.08608627319335938, 0.09566497802734375, 0.10524368286132812, 0.1148223876953125, 0.12440109252929688, 0.13397979736328125, 0.14355850219726562, 0.15313720703125, 0.16271591186523438, 0.17229461669921875, 0.18187332153320312, 0.1914520263671875, 0.20103073120117188, 0.21060943603515625, 0.22018814086914062, 0.229766845703125, 0.23934555053710938, 0.24892425537109375, 0.2585029602050781, 0.2680816650390625, 0.2776603698730469, 0.28723907470703125, 0.2968177795410156, 0.306396484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 11.0, 15.0, 13.0, 23.0, 34.0, 41.0, 78.0, 85.0, 126.0, 228.0, 365.0, 570.0, 963.0, 1731.0, 3201.0, 5670.0, 10525.0, 20120.0, 40919.0, 103503.0, 309942.0, 339972.0, 118212.0, 44937.0, 21966.0, 11460.0, 5974.0, 3295.0, 1786.0, 1062.0, 639.0, 402.0, 239.0, 152.0, 96.0, 67.0, 38.0, 21.0, 22.0, 10.0, 16.0, 7.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0819091796875, -0.07943153381347656, -0.07695388793945312, -0.07447624206542969, -0.07199859619140625, -0.06952095031738281, -0.06704330444335938, -0.06456565856933594, -0.0620880126953125, -0.05961036682128906, -0.057132720947265625, -0.05465507507324219, -0.05217742919921875, -0.04969978332519531, -0.047222137451171875, -0.04474449157714844, -0.042266845703125, -0.03978919982910156, -0.037311553955078125, -0.03483390808105469, -0.03235626220703125, -0.029878616333007812, -0.027400970458984375, -0.024923324584960938, -0.0224456787109375, -0.019968032836914062, -0.017490386962890625, -0.015012741088867188, -0.01253509521484375, -0.010057449340820312, -0.007579803466796875, -0.0051021575927734375, -0.00262451171875, -0.0001468658447265625, 0.002330780029296875, 0.0048084259033203125, 0.00728607177734375, 0.009763717651367188, 0.012241363525390625, 0.014719009399414062, 0.0171966552734375, 0.019674301147460938, 0.022151947021484375, 0.024629592895507812, 0.02710723876953125, 0.029584884643554688, 0.032062530517578125, 0.03454017639160156, 0.037017822265625, 0.03949546813964844, 0.041973114013671875, 0.04445075988769531, 0.04692840576171875, 0.04940605163574219, 0.051883697509765625, 0.05436134338378906, 0.0568389892578125, 0.05931663513183594, 0.061794281005859375, 0.06427192687988281, 0.06674957275390625, 0.06922721862792969, 0.07170486450195312, 0.07418251037597656, 0.07666015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 9.0, 6.0, 7.0, 3.0, 16.0, 13.0, 14.0, 19.0, 36.0, 62.0, 69.0, 92.0, 123.0, 132.0, 115.0, 96.0, 62.0, 33.0, 19.0, 11.0, 17.0, 7.0, 7.0, 7.0, 2.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.5033950805664062e-05, -2.411752939224243e-05, -2.32011079788208e-05, -2.228468656539917e-05, -2.136826515197754e-05, -2.0451843738555908e-05, -1.9535422325134277e-05, -1.8619000911712646e-05, -1.7702579498291016e-05, -1.6786158084869385e-05, -1.5869736671447754e-05, -1.4953315258026123e-05, -1.4036893844604492e-05, -1.3120472431182861e-05, -1.220405101776123e-05, -1.12876296043396e-05, -1.0371208190917969e-05, -9.454786777496338e-06, -8.538365364074707e-06, -7.621943950653076e-06, -6.705522537231445e-06, -5.7891011238098145e-06, -4.872679710388184e-06, -3.956258296966553e-06, -3.039836883544922e-06, -2.123415470123291e-06, -1.2069940567016602e-06, -2.905726432800293e-07, 6.258487701416016e-07, 1.5422701835632324e-06, 2.4586915969848633e-06, 3.375113010406494e-06, 4.291534423828125e-06, 5.207955837249756e-06, 6.124377250671387e-06, 7.040798664093018e-06, 7.957220077514648e-06, 8.87364149093628e-06, 9.79006290435791e-06, 1.0706484317779541e-05, 1.1622905731201172e-05, 1.2539327144622803e-05, 1.3455748558044434e-05, 1.4372169971466064e-05, 1.5288591384887695e-05, 1.6205012798309326e-05, 1.7121434211730957e-05, 1.8037855625152588e-05, 1.895427703857422e-05, 1.987069845199585e-05, 2.078711986541748e-05, 2.170354127883911e-05, 2.2619962692260742e-05, 2.3536384105682373e-05, 2.4452805519104004e-05, 2.5369226932525635e-05, 2.6285648345947266e-05, 2.7202069759368896e-05, 2.8118491172790527e-05, 2.9034912586212158e-05, 2.995133399963379e-05, 3.086775541305542e-05, 3.178417682647705e-05, 3.270059823989868e-05, 3.361701965332031e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 6.0, 8.0, 19.0, 17.0, 42.0, 51.0, 59.0, 100.0, 158.0, 243.0, 369.0, 650.0, 1004.0, 1821.0, 3114.0, 5770.0, 10982.0, 21628.0, 47249.0, 126828.0, 330576.0, 303057.0, 110083.0, 42465.0, 19616.0, 10056.0, 5437.0, 2875.0, 1627.0, 1006.0, 575.0, 345.0, 231.0, 144.0, 106.0, 69.0, 48.0, 35.0, 28.0, 13.0, 13.0, 3.0, 12.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.076171875, -0.07362747192382812, -0.07108306884765625, -0.06853866577148438, -0.0659942626953125, -0.06344985961914062, -0.06090545654296875, -0.058361053466796875, -0.055816650390625, -0.053272247314453125, -0.05072784423828125, -0.048183441162109375, -0.0456390380859375, -0.043094635009765625, -0.04055023193359375, -0.038005828857421875, -0.03546142578125, -0.032917022705078125, -0.03037261962890625, -0.027828216552734375, -0.0252838134765625, -0.022739410400390625, -0.02019500732421875, -0.017650604248046875, -0.015106201171875, -0.012561798095703125, -0.01001739501953125, -0.007472991943359375, -0.0049285888671875, -0.002384185791015625, 0.00016021728515625, 0.002704620361328125, 0.0052490234375, 0.007793426513671875, 0.01033782958984375, 0.012882232666015625, 0.0154266357421875, 0.017971038818359375, 0.02051544189453125, 0.023059844970703125, 0.025604248046875, 0.028148651123046875, 0.03069305419921875, 0.033237457275390625, 0.0357818603515625, 0.038326263427734375, 0.04087066650390625, 0.043415069580078125, 0.04595947265625, 0.048503875732421875, 0.05104827880859375, 0.053592681884765625, 0.0561370849609375, 0.058681488037109375, 0.06122589111328125, 0.06377029418945312, 0.066314697265625, 0.06885910034179688, 0.07140350341796875, 0.07394790649414062, 0.0764923095703125, 0.07903671264648438, 0.08158111572265625, 0.08412551879882812, 0.086669921875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 3.0, 3.0, 10.0, 9.0, 6.0, 13.0, 8.0, 28.0, 34.0, 41.0, 39.0, 46.0, 77.0, 82.0, 76.0, 83.0, 81.0, 67.0, 65.0, 40.0, 40.0, 24.0, 15.0, 19.0, 10.0, 14.0, 11.0, 6.0, 2.0, 6.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.071533203125, -0.06906509399414062, -0.06659698486328125, -0.06412887573242188, -0.0616607666015625, -0.059192657470703125, -0.05672454833984375, -0.054256439208984375, -0.051788330078125, -0.049320220947265625, -0.04685211181640625, -0.044384002685546875, -0.0419158935546875, -0.039447784423828125, -0.03697967529296875, -0.034511566162109375, -0.03204345703125, -0.029575347900390625, -0.02710723876953125, -0.024639129638671875, -0.0221710205078125, -0.019702911376953125, -0.01723480224609375, -0.014766693115234375, -0.012298583984375, -0.009830474853515625, -0.00736236572265625, -0.004894256591796875, -0.0024261474609375, 4.1961669921875e-05, 0.00251007080078125, 0.004978179931640625, 0.0074462890625, 0.009914398193359375, 0.01238250732421875, 0.014850616455078125, 0.0173187255859375, 0.019786834716796875, 0.02225494384765625, 0.024723052978515625, 0.027191162109375, 0.029659271240234375, 0.03212738037109375, 0.034595489501953125, 0.0370635986328125, 0.039531707763671875, 0.04199981689453125, 0.044467926025390625, 0.04693603515625, 0.049404144287109375, 0.05187225341796875, 0.054340362548828125, 0.0568084716796875, 0.059276580810546875, 0.06174468994140625, 0.06421279907226562, 0.066680908203125, 0.06914901733398438, 0.07161712646484375, 0.07408523559570312, 0.0765533447265625, 0.07902145385742188, 0.08148956298828125, 0.08395767211914062, 0.08642578125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 14.0, 26.0, 42.0, 70.0, 108.0, 154.0, 179.0, 137.0, 88.0, 76.0, 46.0, 23.0, 19.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1050565242767334, -1.060091257095337, -1.0151258707046509, -0.9701606035232544, -0.9251952767372131, -0.8802299499511719, -0.8352646827697754, -0.7902993559837341, -0.7453340291976929, -0.7003687024116516, -0.6554033756256104, -0.6104381084442139, -0.5654727816581726, -0.5205074548721313, -0.4755421578884125, -0.4305768609046936, -0.38561153411865234, -0.3406462073326111, -0.2956809103488922, -0.25071561336517334, -0.20575028657913208, -0.16078497469425201, -0.11581966280937195, -0.07085436582565308, -0.025889039039611816, 0.01907627284526825, 0.06404158473014832, 0.10900689661502838, 0.15397220849990845, 0.1989375203847885, 0.24390283226966858, 0.28886812925338745, 0.3338334560394287, 0.37879878282546997, 0.42376407980918884, 0.4687293767929077, 0.513694703578949, 0.5586600303649902, 0.6036252975463867, 0.648590624332428, 0.6935559511184692, 0.7385212779045105, 0.7834866046905518, 0.8284518718719482, 0.8734171986579895, 0.9183825254440308, 0.9633477926254272, 1.0083131790161133, 1.0532784461975098, 1.0982437133789062, 1.1432090997695923, 1.1881743669509888, 1.2331397533416748, 1.2781050205230713, 1.3230702877044678, 1.3680355548858643, 1.4130009412765503, 1.4579662084579468, 1.5029315948486328, 1.5478968620300293, 1.5928621292114258, 1.6378275156021118, 1.6827927827835083, 1.7277581691741943, 1.7727234363555908]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 5.0, 9.0, 15.0, 18.0, 18.0, 25.0, 26.0, 42.0, 28.0, 35.0, 47.0, 56.0, 45.0, 70.0, 46.0, 54.0, 62.0, 51.0, 55.0, 45.0, 39.0, 38.0, 30.0, 33.0, 25.0, 22.0, 14.0, 11.0, 4.0, 10.0, 7.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8780883550643921, -0.8491085171699524, -0.8201287388801575, -0.7911489009857178, -0.7621691226959229, -0.7331892848014832, -0.7042094469070435, -0.6752296686172485, -0.6462498903274536, -0.6172700524330139, -0.588290274143219, -0.5593104362487793, -0.5303306579589844, -0.5013508200645447, -0.47237101197242737, -0.44339120388031006, -0.41441136598587036, -0.38543155789375305, -0.35645174980163574, -0.32747191190719604, -0.2984921336174011, -0.2695122957229614, -0.24053248763084412, -0.2115526795387268, -0.1825728714466095, -0.1535930633544922, -0.12461324781179428, -0.09563343226909637, -0.06665362417697906, -0.037673816084861755, -0.008693993091583252, 0.020285815000534058, 0.04926556348800659, 0.0782453715801239, 0.10722518712282181, 0.13620500266551971, 0.16518481075763702, 0.19416461884975433, 0.22314444184303284, 0.25212424993515015, 0.28110405802726746, 0.31008386611938477, 0.3390636742115021, 0.3680434823036194, 0.3970233201980591, 0.426003098487854, 0.4549829363822937, 0.483962744474411, 0.5129425525665283, 0.541922390460968, 0.5709021687507629, 0.5998820066452026, 0.6288617849349976, 0.6578416228294373, 0.686821460723877, 0.7158012390136719, 0.7447810173034668, 0.7737608551979065, 0.8027406334877014, 0.8317204713821411, 0.860700249671936, 0.8896800875663757, 0.9186599254608154, 0.9476397037506104, 0.97661954164505]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 14.0, 13.0, 24.0, 19.0, 41.0, 46.0, 84.0, 125.0, 187.0, 273.0, 468.0, 791.0, 1374.0, 2453.0, 4732.0, 9865.0, 22504.0, 57876.0, 174489.0, 687833.0, 2243846.0, 709107.0, 176736.0, 58010.0, 22708.0, 9816.0, 4910.0, 2485.0, 1369.0, 777.0, 460.0, 285.0, 193.0, 123.0, 89.0, 43.0, 28.0, 29.0, 14.0, 15.0, 12.0, 4.0, 1.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.19189453125, -0.1859912872314453, -0.18008804321289062, -0.17418479919433594, -0.16828155517578125, -0.16237831115722656, -0.15647506713867188, -0.1505718231201172, -0.1446685791015625, -0.1387653350830078, -0.13286209106445312, -0.12695884704589844, -0.12105560302734375, -0.11515235900878906, -0.10924911499023438, -0.10334587097167969, -0.097442626953125, -0.09153938293457031, -0.08563613891601562, -0.07973289489746094, -0.07382965087890625, -0.06792640686035156, -0.062023162841796875, -0.05611991882324219, -0.0502166748046875, -0.04431343078613281, -0.038410186767578125, -0.03250694274902344, -0.02660369873046875, -0.020700454711914062, -0.014797210693359375, -0.008893966674804688, -0.00299072265625, 0.0029125213623046875, 0.008815765380859375, 0.014719009399414062, 0.02062225341796875, 0.026525497436523438, 0.032428741455078125, 0.03833198547363281, 0.0442352294921875, 0.05013847351074219, 0.056041717529296875, 0.06194496154785156, 0.06784820556640625, 0.07375144958496094, 0.07965469360351562, 0.08555793762207031, 0.091461181640625, 0.09736442565917969, 0.10326766967773438, 0.10917091369628906, 0.11507415771484375, 0.12097740173339844, 0.12688064575195312, 0.1327838897705078, 0.1386871337890625, 0.1445903778076172, 0.15049362182617188, 0.15639686584472656, 0.16230010986328125, 0.16820335388183594, 0.17410659790039062, 0.1800098419189453, 0.1859130859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 16.0, 15.0, 11.0, 11.0, 20.0, 21.0, 24.0, 24.0, 33.0, 33.0, 34.0, 35.0, 34.0, 50.0, 30.0, 37.0, 43.0, 35.0, 43.0, 53.0, 48.0, 32.0, 30.0, 36.0, 32.0, 27.0, 22.0, 13.0, 24.0, 17.0, 14.0, 14.0, 16.0, 8.0, 11.0, 11.0, 5.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0823974609375, -0.07973957061767578, -0.07708168029785156, -0.07442378997802734, -0.07176589965820312, -0.0691080093383789, -0.06645011901855469, -0.06379222869873047, -0.06113433837890625, -0.05847644805908203, -0.05581855773925781, -0.053160667419433594, -0.050502777099609375, -0.047844886779785156, -0.04518699645996094, -0.04252910614013672, -0.0398712158203125, -0.03721332550048828, -0.03455543518066406, -0.031897544860839844, -0.029239654541015625, -0.026581764221191406, -0.023923873901367188, -0.02126598358154297, -0.01860809326171875, -0.01595020294189453, -0.013292312622070312, -0.010634422302246094, -0.007976531982421875, -0.005318641662597656, -0.0026607513427734375, -2.86102294921875e-06, 0.002655029296875, 0.005312919616699219, 0.007970809936523438, 0.010628700256347656, 0.013286590576171875, 0.015944480895996094, 0.018602371215820312, 0.02126026153564453, 0.02391815185546875, 0.02657604217529297, 0.029233932495117188, 0.031891822814941406, 0.034549713134765625, 0.037207603454589844, 0.03986549377441406, 0.04252338409423828, 0.0451812744140625, 0.04783916473388672, 0.05049705505371094, 0.053154945373535156, 0.055812835693359375, 0.058470726013183594, 0.06112861633300781, 0.06378650665283203, 0.06644439697265625, 0.06910228729248047, 0.07176017761230469, 0.0744180679321289, 0.07707595825195312, 0.07973384857177734, 0.08239173889160156, 0.08504962921142578, 0.08770751953125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 2.0, 5.0, 10.0, 13.0, 8.0, 31.0, 42.0, 59.0, 79.0, 115.0, 199.0, 280.0, 451.0, 681.0, 1140.0, 2053.0, 3845.0, 7354.0, 14908.0, 32802.0, 75355.0, 191019.0, 578936.0, 1943287.0, 896143.0, 263347.0, 100215.0, 42535.0, 19151.0, 9201.0, 4749.0, 2653.0, 1342.0, 834.0, 506.0, 317.0, 180.0, 128.0, 100.0, 58.0, 47.0, 31.0, 21.0, 18.0, 9.0, 4.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0], "bins": [-0.1875, -0.18175888061523438, -0.17601776123046875, -0.17027664184570312, -0.1645355224609375, -0.15879440307617188, -0.15305328369140625, -0.14731216430664062, -0.141571044921875, -0.13582992553710938, -0.13008880615234375, -0.12434768676757812, -0.1186065673828125, -0.11286544799804688, -0.10712432861328125, -0.10138320922851562, -0.09564208984375, -0.08990097045898438, -0.08415985107421875, -0.07841873168945312, -0.0726776123046875, -0.06693649291992188, -0.06119537353515625, -0.055454254150390625, -0.049713134765625, -0.043972015380859375, -0.03823089599609375, -0.032489776611328125, -0.0267486572265625, -0.021007537841796875, -0.01526641845703125, -0.009525299072265625, -0.0037841796875, 0.001956939697265625, 0.00769805908203125, 0.013439178466796875, 0.0191802978515625, 0.024921417236328125, 0.03066253662109375, 0.036403656005859375, 0.042144775390625, 0.047885894775390625, 0.05362701416015625, 0.059368133544921875, 0.0651092529296875, 0.07085037231445312, 0.07659149169921875, 0.08233261108398438, 0.08807373046875, 0.09381484985351562, 0.09955596923828125, 0.10529708862304688, 0.1110382080078125, 0.11677932739257812, 0.12252044677734375, 0.12826156616210938, 0.134002685546875, 0.13974380493164062, 0.14548492431640625, 0.15122604370117188, 0.1569671630859375, 0.16270828247070312, 0.16844940185546875, 0.17419052124023438, 0.179931640625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 16.0, 11.0, 18.0, 33.0, 39.0, 39.0, 65.0, 79.0, 120.0, 155.0, 248.0, 351.0, 549.0, 658.0, 508.0, 335.0, 203.0, 180.0, 133.0, 87.0, 57.0, 49.0, 35.0, 32.0, 15.0, 6.0, 14.0, 5.0, 6.0, 5.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26220703125, -0.25460052490234375, -0.2469940185546875, -0.23938751220703125, -0.231781005859375, -0.22417449951171875, -0.2165679931640625, -0.20896148681640625, -0.20135498046875, -0.19374847412109375, -0.1861419677734375, -0.17853546142578125, -0.170928955078125, -0.16332244873046875, -0.1557159423828125, -0.14810943603515625, -0.1405029296875, -0.13289642333984375, -0.1252899169921875, -0.11768341064453125, -0.110076904296875, -0.10247039794921875, -0.0948638916015625, -0.08725738525390625, -0.07965087890625, -0.07204437255859375, -0.0644378662109375, -0.05683135986328125, -0.049224853515625, -0.04161834716796875, -0.0340118408203125, -0.02640533447265625, -0.018798828125, -0.01119232177734375, -0.0035858154296875, 0.00402069091796875, 0.011627197265625, 0.01923370361328125, 0.0268402099609375, 0.03444671630859375, 0.04205322265625, 0.04965972900390625, 0.0572662353515625, 0.06487274169921875, 0.072479248046875, 0.08008575439453125, 0.0876922607421875, 0.09529876708984375, 0.1029052734375, 0.11051177978515625, 0.1181182861328125, 0.12572479248046875, 0.133331298828125, 0.14093780517578125, 0.1485443115234375, 0.15615081787109375, 0.16375732421875, 0.17136383056640625, 0.1789703369140625, 0.18657684326171875, 0.194183349609375, 0.20178985595703125, 0.2093963623046875, 0.21700286865234375, 0.224609375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 9.0, 3.0, 15.0, 15.0, 27.0, 34.0, 51.0, 65.0, 95.0, 111.0, 103.0, 92.0, 96.0, 90.0, 56.0, 45.0, 34.0, 16.0, 12.0, 11.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2269476652145386, -1.1849476099014282, -1.1429476737976074, -1.100947618484497, -1.0589475631713867, -1.0169475078582764, -0.9749475121498108, -0.9329475164413452, -0.8909474611282349, -0.8489474058151245, -0.8069474101066589, -0.7649474143981934, -0.722947359085083, -0.6809473037719727, -0.6389473080635071, -0.5969473123550415, -0.5549472570419312, -0.5129472017288208, -0.4709472060203552, -0.42894718050956726, -0.3869471549987793, -0.34494712948799133, -0.30294710397720337, -0.2609470784664154, -0.21894705295562744, -0.17694702744483948, -0.1349470019340515, -0.09294697642326355, -0.050946950912475586, -0.008946925401687622, 0.03305310010910034, 0.0750531256198883, 0.11705327033996582, 0.15905329585075378, 0.20105332136154175, 0.2430533468723297, 0.2850533723831177, 0.32705339789390564, 0.3690534234046936, 0.41105344891548157, 0.45305347442626953, 0.4950534999370575, 0.5370535254478455, 0.579053521156311, 0.6210535764694214, 0.6630536317825317, 0.7050536274909973, 0.7470536231994629, 0.7890536785125732, 0.8310537338256836, 0.8730537295341492, 0.9150537252426147, 0.9570537805557251, 0.9990538358688354, 1.0410537719726562, 1.0830538272857666, 1.125053882598877, 1.1670539379119873, 1.2090539932250977, 1.2510539293289185, 1.2930539846420288, 1.3350540399551392, 1.37705397605896, 1.4190540313720703, 1.4610540866851807]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 0.0, 3.0, 2.0, 5.0, 7.0, 13.0, 9.0, 16.0, 10.0, 20.0, 21.0, 18.0, 33.0, 19.0, 28.0, 21.0, 30.0, 31.0, 36.0, 47.0, 35.0, 35.0, 37.0, 44.0, 36.0, 39.0, 34.0, 31.0, 33.0, 33.0, 28.0, 31.0, 32.0, 22.0, 26.0, 21.0, 19.0, 12.0, 16.0, 10.0, 11.0, 12.0, 4.0, 6.0, 5.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.6769410371780396, -0.6567697525024414, -0.6365984678268433, -0.6164271831512451, -0.596255898475647, -0.5760846138000488, -0.5559133291244507, -0.5357420444488525, -0.5155707597732544, -0.49539947509765625, -0.4752281904220581, -0.45505690574645996, -0.4348856210708618, -0.41471433639526367, -0.3945430517196655, -0.3743717670440674, -0.3542005121707916, -0.3340292274951935, -0.31385794281959534, -0.2936866581439972, -0.27351537346839905, -0.2533440887928009, -0.23317281901836395, -0.2130015343427658, -0.19283024966716766, -0.17265896499156952, -0.15248768031597137, -0.13231641054153442, -0.11214511841535568, -0.09197383373975754, -0.07180255651473999, -0.051631271839141846, -0.0314599871635437, -0.011288704350590706, 0.00888257846236229, 0.029053859412670135, 0.04922514408826828, 0.06939642876386642, 0.08956770598888397, 0.10973899066448212, 0.12991027534008026, 0.1500815600156784, 0.17025284469127655, 0.1904241144657135, 0.21059539914131165, 0.2307666838169098, 0.25093796849250793, 0.2711092531681061, 0.2912805378437042, 0.31145182251930237, 0.3316231071949005, 0.35179439187049866, 0.3719656765460968, 0.39213696122169495, 0.4123082160949707, 0.43247950077056885, 0.452650785446167, 0.47282207012176514, 0.4929933547973633, 0.5131646394729614, 0.5333359241485596, 0.5535072088241577, 0.5736784934997559, 0.593849778175354, 0.6140210628509521]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 9.0, 19.0, 19.0, 28.0, 59.0, 82.0, 131.0, 195.0, 331.0, 509.0, 645.0, 1075.0, 1481.0, 2217.0, 3442.0, 5070.0, 7705.0, 12424.0, 21664.0, 47173.0, 201714.0, 512967.0, 139462.0, 38844.0, 18936.0, 11179.0, 7092.0, 4691.0, 3113.0, 2056.0, 1463.0, 959.0, 585.0, 414.0, 286.0, 171.0, 129.0, 59.0, 49.0, 33.0, 26.0, 11.0, 7.0, 9.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0], "bins": [-0.259521484375, -0.25197601318359375, -0.2444305419921875, -0.23688507080078125, -0.229339599609375, -0.22179412841796875, -0.2142486572265625, -0.20670318603515625, -0.19915771484375, -0.19161224365234375, -0.1840667724609375, -0.17652130126953125, -0.168975830078125, -0.16143035888671875, -0.1538848876953125, -0.14633941650390625, -0.1387939453125, -0.13124847412109375, -0.1237030029296875, -0.11615753173828125, -0.108612060546875, -0.10106658935546875, -0.0935211181640625, -0.08597564697265625, -0.07843017578125, -0.07088470458984375, -0.0633392333984375, -0.05579376220703125, -0.048248291015625, -0.04070281982421875, -0.0331573486328125, -0.02561187744140625, -0.01806640625, -0.01052093505859375, -0.0029754638671875, 0.00457000732421875, 0.012115478515625, 0.01966094970703125, 0.0272064208984375, 0.03475189208984375, 0.04229736328125, 0.04984283447265625, 0.0573883056640625, 0.06493377685546875, 0.072479248046875, 0.08002471923828125, 0.0875701904296875, 0.09511566162109375, 0.1026611328125, 0.11020660400390625, 0.1177520751953125, 0.12529754638671875, 0.132843017578125, 0.14038848876953125, 0.1479339599609375, 0.15547943115234375, 0.16302490234375, 0.17057037353515625, 0.1781158447265625, 0.18566131591796875, 0.193206787109375, 0.20075225830078125, 0.2082977294921875, 0.21584320068359375, 0.223388671875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 4.0, 7.0, 6.0, 9.0, 14.0, 10.0, 18.0, 17.0, 16.0, 29.0, 22.0, 24.0, 45.0, 35.0, 36.0, 36.0, 47.0, 52.0, 44.0, 52.0, 51.0, 35.0, 37.0, 39.0, 43.0, 31.0, 40.0, 44.0, 27.0, 29.0, 16.0, 18.0, 14.0, 13.0, 8.0, 11.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.089111328125, -0.08586883544921875, -0.0826263427734375, -0.07938385009765625, -0.076141357421875, -0.07289886474609375, -0.0696563720703125, -0.06641387939453125, -0.06317138671875, -0.05992889404296875, -0.0566864013671875, -0.05344390869140625, -0.050201416015625, -0.04695892333984375, -0.0437164306640625, -0.04047393798828125, -0.0372314453125, -0.03398895263671875, -0.0307464599609375, -0.02750396728515625, -0.024261474609375, -0.02101898193359375, -0.0177764892578125, -0.01453399658203125, -0.01129150390625, -0.00804901123046875, -0.0048065185546875, -0.00156402587890625, 0.001678466796875, 0.00492095947265625, 0.0081634521484375, 0.01140594482421875, 0.0146484375, 0.01789093017578125, 0.0211334228515625, 0.02437591552734375, 0.027618408203125, 0.03086090087890625, 0.0341033935546875, 0.03734588623046875, 0.04058837890625, 0.04383087158203125, 0.0470733642578125, 0.05031585693359375, 0.053558349609375, 0.05680084228515625, 0.0600433349609375, 0.06328582763671875, 0.0665283203125, 0.06977081298828125, 0.0730133056640625, 0.07625579833984375, 0.079498291015625, 0.08274078369140625, 0.0859832763671875, 0.08922576904296875, 0.09246826171875, 0.09571075439453125, 0.0989532470703125, 0.10219573974609375, 0.105438232421875, 0.10868072509765625, 0.1119232177734375, 0.11516571044921875, 0.118408203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 11.0, 17.0, 22.0, 28.0, 44.0, 52.0, 76.0, 107.0, 213.0, 410.0, 842.0, 1498.0, 3371.0, 8089.0, 19264.0, 53407.0, 411955.0, 457105.0, 56760.0, 20312.0, 8107.0, 3454.0, 1616.0, 782.0, 407.0, 213.0, 130.0, 76.0, 63.0, 43.0, 23.0, 13.0, 10.0, 8.0, 6.0, 5.0, 3.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.303466796875, -0.2918052673339844, -0.28014373779296875, -0.2684822082519531, -0.2568206787109375, -0.24515914916992188, -0.23349761962890625, -0.22183609008789062, -0.210174560546875, -0.19851303100585938, -0.18685150146484375, -0.17518997192382812, -0.1635284423828125, -0.15186691284179688, -0.14020538330078125, -0.12854385375976562, -0.11688232421875, -0.10522079467773438, -0.09355926513671875, -0.08189773559570312, -0.0702362060546875, -0.058574676513671875, -0.04691314697265625, -0.035251617431640625, -0.023590087890625, -0.011928558349609375, -0.00026702880859375, 0.011394500732421875, 0.0230560302734375, 0.034717559814453125, 0.04637908935546875, 0.058040618896484375, 0.0697021484375, 0.08136367797851562, 0.09302520751953125, 0.10468673706054688, 0.1163482666015625, 0.12800979614257812, 0.13967132568359375, 0.15133285522460938, 0.162994384765625, 0.17465591430664062, 0.18631744384765625, 0.19797897338867188, 0.2096405029296875, 0.22130203247070312, 0.23296356201171875, 0.24462509155273438, 0.25628662109375, 0.2679481506347656, 0.27960968017578125, 0.2912712097167969, 0.3029327392578125, 0.3145942687988281, 0.32625579833984375, 0.3379173278808594, 0.349578857421875, 0.3612403869628906, 0.37290191650390625, 0.3845634460449219, 0.3962249755859375, 0.4078865051269531, 0.41954803466796875, 0.4312095642089844, 0.44287109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 6.0, 5.0, 7.0, 6.0, 8.0, 14.0, 7.0, 12.0, 13.0, 21.0, 19.0, 22.0, 16.0, 29.0, 32.0, 33.0, 43.0, 32.0, 39.0, 47.0, 54.0, 31.0, 44.0, 48.0, 44.0, 37.0, 36.0, 36.0, 40.0, 35.0, 29.0, 27.0, 20.0, 16.0, 18.0, 16.0, 18.0, 4.0, 10.0, 12.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.26904296875, -0.26088714599609375, -0.2527313232421875, -0.24457550048828125, -0.236419677734375, -0.22826385498046875, -0.2201080322265625, -0.21195220947265625, -0.20379638671875, -0.19564056396484375, -0.1874847412109375, -0.17932891845703125, -0.171173095703125, -0.16301727294921875, -0.1548614501953125, -0.14670562744140625, -0.1385498046875, -0.13039398193359375, -0.1222381591796875, -0.11408233642578125, -0.105926513671875, -0.09777069091796875, -0.0896148681640625, -0.08145904541015625, -0.07330322265625, -0.06514739990234375, -0.0569915771484375, -0.04883575439453125, -0.040679931640625, -0.03252410888671875, -0.0243682861328125, -0.01621246337890625, -0.008056640625, 9.918212890625e-05, 0.0082550048828125, 0.01641082763671875, 0.024566650390625, 0.03272247314453125, 0.0408782958984375, 0.04903411865234375, 0.05718994140625, 0.06534576416015625, 0.0735015869140625, 0.08165740966796875, 0.089813232421875, 0.09796905517578125, 0.1061248779296875, 0.11428070068359375, 0.1224365234375, 0.13059234619140625, 0.1387481689453125, 0.14690399169921875, 0.155059814453125, 0.16321563720703125, 0.1713714599609375, 0.17952728271484375, 0.18768310546875, 0.19583892822265625, 0.2039947509765625, 0.21215057373046875, 0.220306396484375, 0.22846221923828125, 0.2366180419921875, 0.24477386474609375, 0.2529296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 9.0, 7.0, 15.0, 26.0, 34.0, 55.0, 88.0, 134.0, 180.0, 317.0, 515.0, 806.0, 1318.0, 2204.0, 3755.0, 6460.0, 11778.0, 23316.0, 59223.0, 199980.0, 461631.0, 175797.0, 53260.0, 21625.0, 10866.0, 6048.0, 3606.0, 2071.0, 1287.0, 799.0, 504.0, 295.0, 184.0, 123.0, 75.0, 49.0, 34.0, 31.0, 12.0, 10.0, 7.0, 8.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09490966796875, -0.0920724868774414, -0.08923530578613281, -0.08639812469482422, -0.08356094360351562, -0.08072376251220703, -0.07788658142089844, -0.07504940032958984, -0.07221221923828125, -0.06937503814697266, -0.06653785705566406, -0.06370067596435547, -0.060863494873046875, -0.05802631378173828, -0.05518913269042969, -0.052351951599121094, -0.0495147705078125, -0.046677589416503906, -0.04384040832519531, -0.04100322723388672, -0.038166046142578125, -0.03532886505126953, -0.03249168395996094, -0.029654502868652344, -0.02681732177734375, -0.023980140686035156, -0.021142959594726562, -0.01830577850341797, -0.015468597412109375, -0.012631416320800781, -0.009794235229492188, -0.006957054138183594, -0.004119873046875, -0.0012826919555664062, 0.0015544891357421875, 0.004391670227050781, 0.007228851318359375, 0.010066032409667969, 0.012903213500976562, 0.015740394592285156, 0.01857757568359375, 0.021414756774902344, 0.024251937866210938, 0.02708911895751953, 0.029926300048828125, 0.03276348114013672, 0.03560066223144531, 0.038437843322753906, 0.0412750244140625, 0.044112205505371094, 0.04694938659667969, 0.04978656768798828, 0.052623748779296875, 0.05546092987060547, 0.05829811096191406, 0.061135292053222656, 0.06397247314453125, 0.06680965423583984, 0.06964683532714844, 0.07248401641845703, 0.07532119750976562, 0.07815837860107422, 0.08099555969238281, 0.0838327407836914, 0.086669921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 7.0, 4.0, 4.0, 7.0, 11.0, 21.0, 42.0, 77.0, 120.0, 203.0, 183.0, 149.0, 61.0, 36.0, 25.0, 11.0, 7.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.780292510986328e-05, -4.6351924538612366e-05, -4.490092396736145e-05, -4.3449923396110535e-05, -4.199892282485962e-05, -4.0547922253608704e-05, -3.909692168235779e-05, -3.764592111110687e-05, -3.619492053985596e-05, -3.474391996860504e-05, -3.3292919397354126e-05, -3.184191882610321e-05, -3.0390918254852295e-05, -2.893991768360138e-05, -2.7488917112350464e-05, -2.603791654109955e-05, -2.4586915969848633e-05, -2.3135915398597717e-05, -2.1684914827346802e-05, -2.0233914256095886e-05, -1.878291368484497e-05, -1.7331913113594055e-05, -1.588091254234314e-05, -1.4429911971092224e-05, -1.2978911399841309e-05, -1.1527910828590393e-05, -1.0076910257339478e-05, -8.625909686088562e-06, -7.1749091148376465e-06, -5.723908543586731e-06, -4.2729079723358154e-06, -2.8219074010849e-06, -1.3709068298339844e-06, 8.009374141693115e-08, 1.5310943126678467e-06, 2.982094883918762e-06, 4.433095455169678e-06, 5.884096026420593e-06, 7.335096597671509e-06, 8.786097168922424e-06, 1.023709774017334e-05, 1.1688098311424255e-05, 1.3139098882675171e-05, 1.4590099453926086e-05, 1.6041100025177002e-05, 1.7492100596427917e-05, 1.8943101167678833e-05, 2.039410173892975e-05, 2.1845102310180664e-05, 2.329610288143158e-05, 2.4747103452682495e-05, 2.619810402393341e-05, 2.7649104595184326e-05, 2.9100105166435242e-05, 3.055110573768616e-05, 3.200210630893707e-05, 3.345310688018799e-05, 3.4904107451438904e-05, 3.635510802268982e-05, 3.7806108593940735e-05, 3.925710916519165e-05, 4.0708109736442566e-05, 4.215911030769348e-05, 4.36101108789444e-05, 4.506111145019531e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 8.0, 12.0, 19.0, 22.0, 31.0, 53.0, 62.0, 110.0, 178.0, 369.0, 710.0, 1345.0, 2772.0, 6164.0, 14202.0, 37100.0, 115449.0, 329567.0, 346768.0, 125545.0, 40348.0, 15134.0, 6438.0, 3052.0, 1452.0, 705.0, 356.0, 219.0, 132.0, 66.0, 35.0, 37.0, 27.0, 16.0, 11.0, 9.0, 4.0, 5.0, 4.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09613037109375, -0.09338665008544922, -0.09064292907714844, -0.08789920806884766, -0.08515548706054688, -0.0824117660522461, -0.07966804504394531, -0.07692432403564453, -0.07418060302734375, -0.07143688201904297, -0.06869316101074219, -0.0659494400024414, -0.06320571899414062, -0.060461997985839844, -0.05771827697753906, -0.05497455596923828, -0.0522308349609375, -0.04948711395263672, -0.04674339294433594, -0.043999671936035156, -0.041255950927734375, -0.038512229919433594, -0.03576850891113281, -0.03302478790283203, -0.03028106689453125, -0.02753734588623047, -0.024793624877929688, -0.022049903869628906, -0.019306182861328125, -0.016562461853027344, -0.013818740844726562, -0.011075019836425781, -0.008331298828125, -0.005587577819824219, -0.0028438568115234375, -0.00010013580322265625, 0.002643585205078125, 0.005387306213378906, 0.008131027221679688, 0.010874748229980469, 0.01361846923828125, 0.01636219024658203, 0.019105911254882812, 0.021849632263183594, 0.024593353271484375, 0.027337074279785156, 0.030080795288085938, 0.03282451629638672, 0.0355682373046875, 0.03831195831298828, 0.04105567932128906, 0.043799400329589844, 0.046543121337890625, 0.049286842346191406, 0.05203056335449219, 0.05477428436279297, 0.05751800537109375, 0.06026172637939453, 0.06300544738769531, 0.0657491683959961, 0.06849288940429688, 0.07123661041259766, 0.07398033142089844, 0.07672405242919922, 0.0794677734375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 6.0, 6.0, 8.0, 6.0, 6.0, 13.0, 11.0, 15.0, 15.0, 28.0, 39.0, 49.0, 53.0, 45.0, 80.0, 92.0, 74.0, 97.0, 81.0, 62.0, 29.0, 38.0, 29.0, 21.0, 24.0, 10.0, 10.0, 14.0, 11.0, 8.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0870361328125, -0.08456897735595703, -0.08210182189941406, -0.0796346664428711, -0.07716751098632812, -0.07470035552978516, -0.07223320007324219, -0.06976604461669922, -0.06729888916015625, -0.06483173370361328, -0.06236457824707031, -0.059897422790527344, -0.057430267333984375, -0.054963111877441406, -0.05249595642089844, -0.05002880096435547, -0.0475616455078125, -0.04509449005126953, -0.04262733459472656, -0.040160179138183594, -0.037693023681640625, -0.035225868225097656, -0.03275871276855469, -0.03029155731201172, -0.02782440185546875, -0.02535724639892578, -0.022890090942382812, -0.020422935485839844, -0.017955780029296875, -0.015488624572753906, -0.013021469116210938, -0.010554313659667969, -0.008087158203125, -0.005620002746582031, -0.0031528472900390625, -0.0006856918334960938, 0.001781463623046875, 0.004248619079589844, 0.0067157745361328125, 0.009182929992675781, 0.01165008544921875, 0.014117240905761719, 0.016584396362304688, 0.019051551818847656, 0.021518707275390625, 0.023985862731933594, 0.026453018188476562, 0.02892017364501953, 0.0313873291015625, 0.03385448455810547, 0.03632164001464844, 0.038788795471191406, 0.041255950927734375, 0.043723106384277344, 0.04619026184082031, 0.04865741729736328, 0.05112457275390625, 0.05359172821044922, 0.05605888366699219, 0.058526039123535156, 0.060993194580078125, 0.0634603500366211, 0.06592750549316406, 0.06839466094970703, 0.07086181640625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 10.0, 9.0, 14.0, 34.0, 45.0, 49.0, 72.0, 103.0, 94.0, 100.0, 103.0, 81.0, 63.0, 69.0, 59.0, 31.0, 26.0, 7.0, 10.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2977625131607056, -1.260359525680542, -1.222956657409668, -1.1855536699295044, -1.1481506824493408, -1.1107478141784668, -1.0733448266983032, -1.0359418392181396, -0.9985389709472656, -0.9611360430717468, -0.9237330555915833, -0.8863301277160645, -0.8489271998405457, -0.8115242719650269, -0.7741212844848633, -0.7367183566093445, -0.6993153691291809, -0.6619124412536621, -0.6245094537734985, -0.5871065258979797, -0.5497035980224609, -0.5123006105422974, -0.47489768266677856, -0.43749475479125977, -0.4000917971134186, -0.3626888394355774, -0.3252859115600586, -0.2878829538822174, -0.2504799962043762, -0.21307706832885742, -0.17567411065101624, -0.13827118277549744, -0.10086822509765625, -0.06346528232097626, -0.026062332093715668, 0.011340618133544922, 0.048743560910224915, 0.08614650368690491, 0.1235494613647461, 0.1609523892402649, 0.19835534691810608, 0.23575828969478607, 0.27316123247146606, 0.31056419014930725, 0.34796714782714844, 0.38537007570266724, 0.4227730333805084, 0.4601759612560272, 0.4975789189338684, 0.5349818468093872, 0.5723848342895508, 0.6097877621650696, 0.6471906900405884, 0.684593677520752, 0.7219966053962708, 0.7593995332717896, 0.7968025207519531, 0.8342054486274719, 0.8716084361076355, 0.9090113639831543, 0.9464142918586731, 0.9838172197341919, 1.0212202072143555, 1.0586230754852295, 1.096026062965393]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 9.0, 6.0, 9.0, 19.0, 6.0, 12.0, 23.0, 19.0, 16.0, 25.0, 31.0, 32.0, 31.0, 27.0, 38.0, 48.0, 35.0, 38.0, 40.0, 46.0, 34.0, 49.0, 40.0, 38.0, 33.0, 31.0, 34.0, 27.0, 25.0, 27.0, 33.0, 17.0, 21.0, 19.0, 11.0, 17.0, 8.0, 2.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62393718957901, -0.6016092896461487, -0.5792813301086426, -0.5569534301757812, -0.5346255302429199, -0.5122975707054138, -0.4899696707725525, -0.4676417410373688, -0.44531381130218506, -0.42298588156700134, -0.4006579518318176, -0.3783300518989563, -0.3560021221637726, -0.33367419242858887, -0.31134629249572754, -0.2890183627605438, -0.2666904330253601, -0.2443625032901764, -0.22203458845615387, -0.19970667362213135, -0.17737874388694763, -0.15505081415176392, -0.1327228993177414, -0.11039498448371887, -0.08806705474853516, -0.06573913246393204, -0.04341121017932892, -0.0210832878947258, 0.0012446343898773193, 0.023572556674480438, 0.04590047895908356, 0.06822839379310608, 0.09055638313293457, 0.11288430541753769, 0.1352122277021408, 0.15754014253616333, 0.17986807227134705, 0.20219600200653076, 0.22452391684055328, 0.2468518316745758, 0.2691797614097595, 0.29150769114494324, 0.31383562088012695, 0.3361635208129883, 0.358491450548172, 0.3808193802833557, 0.40314728021621704, 0.42547520995140076, 0.4478031396865845, 0.4701310694217682, 0.4924589991569519, 0.5147868990898132, 0.5371148586273193, 0.5594427585601807, 0.581770658493042, 0.6040985584259033, 0.6264265179634094, 0.6487544178962708, 0.6710823774337769, 0.6934102773666382, 0.7157381772994995, 0.7380661368370056, 0.7603940367698669, 0.782721996307373, 0.8050498962402344]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 7.0, 3.0, 5.0, 7.0, 9.0, 18.0, 32.0, 38.0, 82.0, 102.0, 164.0, 246.0, 424.0, 691.0, 1184.0, 2005.0, 3677.0, 6942.0, 13583.0, 27373.0, 56756.0, 130917.0, 357540.0, 1264236.0, 1563851.0, 469059.0, 161663.0, 68844.0, 31949.0, 15648.0, 7789.0, 4090.0, 2168.0, 1310.0, 668.0, 463.0, 262.0, 183.0, 110.0, 55.0, 58.0, 28.0, 23.0, 10.0, 7.0, 8.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1207275390625, -0.11627388000488281, -0.11182022094726562, -0.10736656188964844, -0.10291290283203125, -0.09845924377441406, -0.09400558471679688, -0.08955192565917969, -0.0850982666015625, -0.08064460754394531, -0.07619094848632812, -0.07173728942871094, -0.06728363037109375, -0.06282997131347656, -0.058376312255859375, -0.05392265319824219, -0.049468994140625, -0.04501533508300781, -0.040561676025390625, -0.03610801696777344, -0.03165435791015625, -0.027200698852539062, -0.022747039794921875, -0.018293380737304688, -0.0138397216796875, -0.009386062622070312, -0.004932403564453125, -0.0004787445068359375, 0.00397491455078125, 0.008428573608398438, 0.012882232666015625, 0.017335891723632812, 0.02178955078125, 0.026243209838867188, 0.030696868896484375, 0.03515052795410156, 0.03960418701171875, 0.04405784606933594, 0.048511505126953125, 0.05296516418457031, 0.0574188232421875, 0.06187248229980469, 0.06632614135742188, 0.07077980041503906, 0.07523345947265625, 0.07968711853027344, 0.08414077758789062, 0.08859443664550781, 0.093048095703125, 0.09750175476074219, 0.10195541381835938, 0.10640907287597656, 0.11086273193359375, 0.11531639099121094, 0.11977005004882812, 0.12422370910644531, 0.1286773681640625, 0.1331310272216797, 0.13758468627929688, 0.14203834533691406, 0.14649200439453125, 0.15094566345214844, 0.15539932250976562, 0.1598529815673828, 0.164306640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 5.0, 10.0, 15.0, 9.0, 10.0, 14.0, 7.0, 20.0, 21.0, 24.0, 21.0, 28.0, 27.0, 30.0, 44.0, 19.0, 28.0, 29.0, 47.0, 37.0, 46.0, 42.0, 31.0, 35.0, 32.0, 42.0, 38.0, 22.0, 29.0, 28.0, 30.0, 23.0, 29.0, 25.0, 16.0, 15.0, 11.0, 11.0, 12.0, 10.0, 8.0, 5.0, 3.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08245849609375, -0.0798044204711914, -0.07715034484863281, -0.07449626922607422, -0.07184219360351562, -0.06918811798095703, -0.06653404235839844, -0.06387996673583984, -0.06122589111328125, -0.058571815490722656, -0.05591773986816406, -0.05326366424560547, -0.050609588623046875, -0.04795551300048828, -0.04530143737792969, -0.042647361755371094, -0.0399932861328125, -0.037339210510253906, -0.03468513488769531, -0.03203105926513672, -0.029376983642578125, -0.02672290802001953, -0.024068832397460938, -0.021414756774902344, -0.01876068115234375, -0.016106605529785156, -0.013452529907226562, -0.010798454284667969, -0.008144378662109375, -0.005490303039550781, -0.0028362274169921875, -0.00018215179443359375, 0.002471923828125, 0.005125999450683594, 0.0077800750732421875, 0.010434150695800781, 0.013088226318359375, 0.01574230194091797, 0.018396377563476562, 0.021050453186035156, 0.02370452880859375, 0.026358604431152344, 0.029012680053710938, 0.03166675567626953, 0.034320831298828125, 0.03697490692138672, 0.03962898254394531, 0.042283058166503906, 0.0449371337890625, 0.047591209411621094, 0.05024528503417969, 0.05289936065673828, 0.055553436279296875, 0.05820751190185547, 0.06086158752441406, 0.06351566314697266, 0.06616973876953125, 0.06882381439208984, 0.07147789001464844, 0.07413196563720703, 0.07678604125976562, 0.07944011688232422, 0.08209419250488281, 0.0847482681274414, 0.08740234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 7.0, 3.0, 9.0, 13.0, 18.0, 23.0, 44.0, 34.0, 60.0, 94.0, 182.0, 276.0, 522.0, 1042.0, 2109.0, 4697.0, 12316.0, 33060.0, 98516.0, 343919.0, 1827191.0, 1450238.0, 286922.0, 84635.0, 28938.0, 10882.0, 4391.0, 1936.0, 945.0, 471.0, 277.0, 171.0, 122.0, 70.0, 49.0, 36.0, 22.0, 7.0, 12.0, 7.0, 7.0, 2.0, 0.0, 6.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.282470703125, -0.2748222351074219, -0.26717376708984375, -0.2595252990722656, -0.2518768310546875, -0.24422836303710938, -0.23657989501953125, -0.22893142700195312, -0.221282958984375, -0.21363449096679688, -0.20598602294921875, -0.19833755493164062, -0.1906890869140625, -0.18304061889648438, -0.17539215087890625, -0.16774368286132812, -0.16009521484375, -0.15244674682617188, -0.14479827880859375, -0.13714981079101562, -0.1295013427734375, -0.12185287475585938, -0.11420440673828125, -0.10655593872070312, -0.098907470703125, -0.09125900268554688, -0.08361053466796875, -0.07596206665039062, -0.0683135986328125, -0.060665130615234375, -0.05301666259765625, -0.045368194580078125, -0.0377197265625, -0.030071258544921875, -0.02242279052734375, -0.014774322509765625, -0.0071258544921875, 0.000522613525390625, 0.00817108154296875, 0.015819549560546875, 0.023468017578125, 0.031116485595703125, 0.03876495361328125, 0.046413421630859375, 0.0540618896484375, 0.061710357666015625, 0.06935882568359375, 0.07700729370117188, 0.08465576171875, 0.09230422973632812, 0.09995269775390625, 0.10760116577148438, 0.1152496337890625, 0.12289810180664062, 0.13054656982421875, 0.13819503784179688, 0.145843505859375, 0.15349197387695312, 0.16114044189453125, 0.16878890991210938, 0.1764373779296875, 0.18408584594726562, 0.19173431396484375, 0.19938278198242188, 0.20703125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 3.0, 5.0, 6.0, 17.0, 18.0, 28.0, 36.0, 62.0, 77.0, 85.0, 149.0, 210.0, 282.0, 428.0, 694.0, 613.0, 405.0, 267.0, 177.0, 137.0, 92.0, 65.0, 54.0, 43.0, 27.0, 17.0, 20.0, 12.0, 11.0, 7.0, 14.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.199462890625, -0.19144821166992188, -0.18343353271484375, -0.17541885375976562, -0.1674041748046875, -0.15938949584960938, -0.15137481689453125, -0.14336013793945312, -0.135345458984375, -0.12733078002929688, -0.11931610107421875, -0.11130142211914062, -0.1032867431640625, -0.09527206420898438, -0.08725738525390625, -0.07924270629882812, -0.07122802734375, -0.06321334838867188, -0.05519866943359375, -0.047183990478515625, -0.0391693115234375, -0.031154632568359375, -0.02313995361328125, -0.015125274658203125, -0.007110595703125, 0.000904083251953125, 0.00891876220703125, 0.016933441162109375, 0.0249481201171875, 0.032962799072265625, 0.04097747802734375, 0.048992156982421875, 0.0570068359375, 0.06502151489257812, 0.07303619384765625, 0.08105087280273438, 0.0890655517578125, 0.09708023071289062, 0.10509490966796875, 0.11310958862304688, 0.121124267578125, 0.12913894653320312, 0.13715362548828125, 0.14516830444335938, 0.1531829833984375, 0.16119766235351562, 0.16921234130859375, 0.17722702026367188, 0.18524169921875, 0.19325637817382812, 0.20127105712890625, 0.20928573608398438, 0.2173004150390625, 0.22531509399414062, 0.23332977294921875, 0.24134445190429688, 0.249359130859375, 0.2573738098144531, 0.26538848876953125, 0.2734031677246094, 0.2814178466796875, 0.2894325256347656, 0.29744720458984375, 0.3054618835449219, 0.3134765625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 20.0, 47.0, 114.0, 166.0, 199.0, 185.0, 121.0, 66.0, 37.0, 20.0, 11.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.713821530342102, -1.6270647048950195, -1.540307879447937, -1.4535510540008545, -1.366794228553772, -1.2800374031066895, -1.1932806968688965, -1.1065237522125244, -1.0197670459747314, -0.9330102205276489, -0.8462533950805664, -0.7594965696334839, -0.6727397441864014, -0.5859829187393188, -0.4992261528968811, -0.4124693274497986, -0.3257124423980713, -0.23895561695098877, -0.15219880640506744, -0.06544199585914612, 0.0213148295879364, 0.10807165503501892, 0.19482845067977905, 0.2815852761268616, 0.3683421015739441, 0.4550989270210266, 0.5418557524681091, 0.6286125183105469, 0.7153693437576294, 0.8021261692047119, 0.8888829946517944, 0.975639820098877, 1.06239652633667, 1.1491533517837524, 1.235910177230835, 1.3226670026779175, 1.409423828125, 1.4961806535720825, 1.582937479019165, 1.669694185256958, 1.75645112991333, 1.8432079553604126, 1.9299647808074951, 2.016721487045288, 2.10347843170166, 2.190235137939453, 2.276992082595825, 2.363748788833618, 2.4505057334899902, 2.537262439727783, 2.6240193843841553, 2.7107760906219482, 2.7975330352783203, 2.8842897415161133, 2.9710466861724854, 3.0578033924102783, 3.1445600986480713, 3.2313168048858643, 3.3180737495422363, 3.4048304557800293, 3.4915874004364014, 3.5783441066741943, 3.6651010513305664, 3.7518577575683594, 3.8386147022247314]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 5.0, 5.0, 3.0, 6.0, 9.0, 7.0, 11.0, 16.0, 21.0, 28.0, 16.0, 19.0, 26.0, 32.0, 31.0, 33.0, 26.0, 49.0, 51.0, 49.0, 41.0, 33.0, 41.0, 34.0, 34.0, 49.0, 45.0, 37.0, 32.0, 24.0, 27.0, 25.0, 20.0, 17.0, 19.0, 11.0, 13.0, 7.0, 10.0, 11.0, 4.0, 6.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6711521148681641, -0.6478146314620972, -0.6244771480560303, -0.6011396646499634, -0.5778021812438965, -0.5544647574424744, -0.5311272740364075, -0.5077897906303406, -0.4844523072242737, -0.4611148238182068, -0.4377773404121399, -0.4144398868083954, -0.3911024034023285, -0.3677649199962616, -0.3444274663925171, -0.3210899829864502, -0.2977524995803833, -0.2744150161743164, -0.2510775327682495, -0.227740079164505, -0.2044025957584381, -0.18106511235237122, -0.15772764384746552, -0.13439017534255981, -0.11105269193649292, -0.08771521598100662, -0.06437774002552032, -0.04104026407003403, -0.01770278811454773, 0.005634687840938568, 0.028972163796424866, 0.052309632301330566, 0.07564717531204224, 0.09898465126752853, 0.12232212722301483, 0.14565959572792053, 0.16899707913398743, 0.19233456254005432, 0.21567203104496002, 0.23900949954986572, 0.2623469829559326, 0.2856844663619995, 0.3090219497680664, 0.3323594033718109, 0.3556968867778778, 0.3790343701839447, 0.4023718237876892, 0.4257093071937561, 0.449046790599823, 0.4723842740058899, 0.4957217574119568, 0.5190592408180237, 0.5423966646194458, 0.5657341480255127, 0.5890716314315796, 0.6124091148376465, 0.6357465982437134, 0.6590840816497803, 0.6824215650558472, 0.7057590484619141, 0.729096531867981, 0.7524339556694031, 0.77577143907547, 0.7991089224815369, 0.8224464058876038]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 4.0, 9.0, 10.0, 25.0, 30.0, 54.0, 78.0, 120.0, 219.0, 334.0, 473.0, 710.0, 1189.0, 2005.0, 3237.0, 4885.0, 7610.0, 12253.0, 19152.0, 32382.0, 74343.0, 272735.0, 394294.0, 117989.0, 42028.0, 22963.0, 14267.0, 9191.0, 5884.0, 3693.0, 2307.0, 1482.0, 944.0, 631.0, 364.0, 221.0, 144.0, 88.0, 68.0, 33.0, 38.0, 17.0, 15.0, 9.0, 5.0, 10.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193359375, -0.18695449829101562, -0.18054962158203125, -0.17414474487304688, -0.1677398681640625, -0.16133499145507812, -0.15493011474609375, -0.14852523803710938, -0.142120361328125, -0.13571548461914062, -0.12931060791015625, -0.12290573120117188, -0.1165008544921875, -0.11009597778320312, -0.10369110107421875, -0.09728622436523438, -0.09088134765625, -0.08447647094726562, -0.07807159423828125, -0.07166671752929688, -0.0652618408203125, -0.058856964111328125, -0.05245208740234375, -0.046047210693359375, -0.039642333984375, -0.033237457275390625, -0.02683258056640625, -0.020427703857421875, -0.0140228271484375, -0.007617950439453125, -0.00121307373046875, 0.005191802978515625, 0.0115966796875, 0.018001556396484375, 0.02440643310546875, 0.030811309814453125, 0.0372161865234375, 0.043621063232421875, 0.05002593994140625, 0.056430816650390625, 0.062835693359375, 0.06924057006835938, 0.07564544677734375, 0.08205032348632812, 0.0884552001953125, 0.09486007690429688, 0.10126495361328125, 0.10766983032226562, 0.11407470703125, 0.12047958374023438, 0.12688446044921875, 0.13328933715820312, 0.1396942138671875, 0.14609909057617188, 0.15250396728515625, 0.15890884399414062, 0.165313720703125, 0.17171859741210938, 0.17812347412109375, 0.18452835083007812, 0.1909332275390625, 0.19733810424804688, 0.20374298095703125, 0.21014785766601562, 0.216552734375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 9.0, 6.0, 7.0, 12.0, 7.0, 12.0, 16.0, 17.0, 26.0, 16.0, 31.0, 31.0, 32.0, 20.0, 53.0, 38.0, 38.0, 42.0, 41.0, 44.0, 42.0, 60.0, 45.0, 35.0, 46.0, 37.0, 32.0, 28.0, 34.0, 25.0, 22.0, 18.0, 15.0, 18.0, 10.0, 10.0, 6.0, 8.0, 4.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1168212890625, -0.11362743377685547, -0.11043357849121094, -0.1072397232055664, -0.10404586791992188, -0.10085201263427734, -0.09765815734863281, -0.09446430206298828, -0.09127044677734375, -0.08807659149169922, -0.08488273620605469, -0.08168888092041016, -0.07849502563476562, -0.0753011703491211, -0.07210731506347656, -0.06891345977783203, -0.0657196044921875, -0.06252574920654297, -0.05933189392089844, -0.056138038635253906, -0.052944183349609375, -0.049750328063964844, -0.04655647277832031, -0.04336261749267578, -0.04016876220703125, -0.03697490692138672, -0.03378105163574219, -0.030587196350097656, -0.027393341064453125, -0.024199485778808594, -0.021005630493164062, -0.01781177520751953, -0.014617919921875, -0.011424064636230469, -0.008230209350585938, -0.005036354064941406, -0.001842498779296875, 0.0013513565063476562, 0.0045452117919921875, 0.007739067077636719, 0.01093292236328125, 0.014126777648925781, 0.017320632934570312, 0.020514488220214844, 0.023708343505859375, 0.026902198791503906, 0.030096054077148438, 0.03328990936279297, 0.0364837646484375, 0.03967761993408203, 0.04287147521972656, 0.046065330505371094, 0.049259185791015625, 0.052453041076660156, 0.05564689636230469, 0.05884075164794922, 0.06203460693359375, 0.06522846221923828, 0.06842231750488281, 0.07161617279052734, 0.07481002807617188, 0.0780038833618164, 0.08119773864746094, 0.08439159393310547, 0.08758544921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 7.0, 9.0, 9.0, 14.0, 21.0, 28.0, 44.0, 58.0, 80.0, 115.0, 217.0, 368.0, 693.0, 1385.0, 2981.0, 7562.0, 18578.0, 55147.0, 442724.0, 432452.0, 54399.0, 18320.0, 7145.0, 3075.0, 1435.0, 668.0, 392.0, 229.0, 136.0, 74.0, 49.0, 45.0, 24.0, 19.0, 9.0, 8.0, 8.0, 5.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.374267578125, -0.3617897033691406, -0.34931182861328125, -0.3368339538574219, -0.3243560791015625, -0.3118782043457031, -0.29940032958984375, -0.2869224548339844, -0.274444580078125, -0.2619667053222656, -0.24948883056640625, -0.23701095581054688, -0.2245330810546875, -0.21205520629882812, -0.19957733154296875, -0.18709945678710938, -0.17462158203125, -0.16214370727539062, -0.14966583251953125, -0.13718795776367188, -0.1247100830078125, -0.11223220825195312, -0.09975433349609375, -0.08727645874023438, -0.074798583984375, -0.062320709228515625, -0.04984283447265625, -0.037364959716796875, -0.0248870849609375, -0.012409210205078125, 6.866455078125e-05, 0.012546539306640625, 0.0250244140625, 0.037502288818359375, 0.04998016357421875, 0.062458038330078125, 0.0749359130859375, 0.08741378784179688, 0.09989166259765625, 0.11236953735351562, 0.124847412109375, 0.13732528686523438, 0.14980316162109375, 0.16228103637695312, 0.1747589111328125, 0.18723678588867188, 0.19971466064453125, 0.21219253540039062, 0.22467041015625, 0.23714828491210938, 0.24962615966796875, 0.2621040344238281, 0.2745819091796875, 0.2870597839355469, 0.29953765869140625, 0.3120155334472656, 0.324493408203125, 0.3369712829589844, 0.34944915771484375, 0.3619270324707031, 0.3744049072265625, 0.3868827819824219, 0.39936065673828125, 0.4118385314941406, 0.42431640625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 6.0, 14.0, 12.0, 12.0, 9.0, 13.0, 10.0, 16.0, 35.0, 28.0, 24.0, 21.0, 37.0, 29.0, 35.0, 48.0, 34.0, 27.0, 40.0, 38.0, 31.0, 47.0, 45.0, 36.0, 47.0, 42.0, 25.0, 28.0, 26.0, 20.0, 19.0, 9.0, 20.0, 21.0, 14.0, 11.0, 9.0, 9.0, 12.0, 12.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 4.0], "bins": [-0.28515625, -0.27623748779296875, -0.2673187255859375, -0.25839996337890625, -0.249481201171875, -0.24056243896484375, -0.2316436767578125, -0.22272491455078125, -0.21380615234375, -0.20488739013671875, -0.1959686279296875, -0.18704986572265625, -0.178131103515625, -0.16921234130859375, -0.1602935791015625, -0.15137481689453125, -0.1424560546875, -0.13353729248046875, -0.1246185302734375, -0.11569976806640625, -0.106781005859375, -0.09786224365234375, -0.0889434814453125, -0.08002471923828125, -0.07110595703125, -0.06218719482421875, -0.0532684326171875, -0.04434967041015625, -0.035430908203125, -0.02651214599609375, -0.0175933837890625, -0.00867462158203125, 0.000244140625, 0.00916290283203125, 0.0180816650390625, 0.02700042724609375, 0.035919189453125, 0.04483795166015625, 0.0537567138671875, 0.06267547607421875, 0.07159423828125, 0.08051300048828125, 0.0894317626953125, 0.09835052490234375, 0.107269287109375, 0.11618804931640625, 0.1251068115234375, 0.13402557373046875, 0.1429443359375, 0.15186309814453125, 0.1607818603515625, 0.16970062255859375, 0.178619384765625, 0.18753814697265625, 0.1964569091796875, 0.20537567138671875, 0.21429443359375, 0.22321319580078125, 0.2321319580078125, 0.24105072021484375, 0.249969482421875, 0.25888824462890625, 0.2678070068359375, 0.27672576904296875, 0.28564453125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 12.0, 6.0, 10.0, 15.0, 17.0, 31.0, 38.0, 75.0, 99.0, 145.0, 275.0, 417.0, 651.0, 1129.0, 1884.0, 3031.0, 5307.0, 9716.0, 19084.0, 40004.0, 100168.0, 374468.0, 327644.0, 88754.0, 36567.0, 17508.0, 9014.0, 5195.0, 2885.0, 1690.0, 1017.0, 649.0, 398.0, 223.0, 171.0, 96.0, 44.0, 39.0, 25.0, 21.0, 14.0, 3.0, 7.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.1163330078125, -0.11300373077392578, -0.10967445373535156, -0.10634517669677734, -0.10301589965820312, -0.0996866226196289, -0.09635734558105469, -0.09302806854248047, -0.08969879150390625, -0.08636951446533203, -0.08304023742675781, -0.0797109603881836, -0.07638168334960938, -0.07305240631103516, -0.06972312927246094, -0.06639385223388672, -0.0630645751953125, -0.05973529815673828, -0.05640602111816406, -0.053076744079589844, -0.049747467041015625, -0.046418190002441406, -0.04308891296386719, -0.03975963592529297, -0.03643035888671875, -0.03310108184814453, -0.029771804809570312, -0.026442527770996094, -0.023113250732421875, -0.019783973693847656, -0.016454696655273438, -0.013125419616699219, -0.009796142578125, -0.006466865539550781, -0.0031375885009765625, 0.00019168853759765625, 0.003520965576171875, 0.006850242614746094, 0.010179519653320312, 0.013508796691894531, 0.01683807373046875, 0.02016735076904297, 0.023496627807617188, 0.026825904846191406, 0.030155181884765625, 0.033484458923339844, 0.03681373596191406, 0.04014301300048828, 0.0434722900390625, 0.04680156707763672, 0.05013084411621094, 0.053460121154785156, 0.056789398193359375, 0.060118675231933594, 0.06344795227050781, 0.06677722930908203, 0.07010650634765625, 0.07343578338623047, 0.07676506042480469, 0.0800943374633789, 0.08342361450195312, 0.08675289154052734, 0.09008216857910156, 0.09341144561767578, 0.09674072265625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 3.0, 3.0, 8.0, 9.0, 13.0, 12.0, 31.0, 49.0, 132.0, 261.0, 237.0, 110.0, 53.0, 18.0, 12.0, 10.0, 9.0, 9.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.628036499023438e-05, -6.39054924249649e-05, -6.153061985969543e-05, -5.9155747294425964e-05, -5.6780874729156494e-05, -5.4406002163887024e-05, -5.2031129598617554e-05, -4.9656257033348083e-05, -4.728138446807861e-05, -4.490651190280914e-05, -4.253163933753967e-05, -4.01567667722702e-05, -3.778189420700073e-05, -3.540702164173126e-05, -3.303214907646179e-05, -3.065727651119232e-05, -2.828240394592285e-05, -2.590753138065338e-05, -2.353265881538391e-05, -2.115778625011444e-05, -1.878291368484497e-05, -1.64080411195755e-05, -1.403316855430603e-05, -1.165829598903656e-05, -9.28342342376709e-06, -6.90855085849762e-06, -4.533678293228149e-06, -2.158805727958679e-06, 2.1606683731079102e-07, 2.5909394025802612e-06, 4.9658119678497314e-06, 7.340684533119202e-06, 9.715557098388672e-06, 1.2090429663658142e-05, 1.4465302228927612e-05, 1.6840174794197083e-05, 1.9215047359466553e-05, 2.1589919924736023e-05, 2.3964792490005493e-05, 2.6339665055274963e-05, 2.8714537620544434e-05, 3.1089410185813904e-05, 3.3464282751083374e-05, 3.5839155316352844e-05, 3.8214027881622314e-05, 4.0588900446891785e-05, 4.2963773012161255e-05, 4.5338645577430725e-05, 4.7713518142700195e-05, 5.0088390707969666e-05, 5.2463263273239136e-05, 5.4838135838508606e-05, 5.7213008403778076e-05, 5.9587880969047546e-05, 6.196275353431702e-05, 6.433762609958649e-05, 6.671249866485596e-05, 6.908737123012543e-05, 7.14622437953949e-05, 7.383711636066437e-05, 7.621198892593384e-05, 7.858686149120331e-05, 8.096173405647278e-05, 8.333660662174225e-05, 8.571147918701172e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 8.0, 10.0, 11.0, 18.0, 27.0, 33.0, 71.0, 100.0, 124.0, 239.0, 455.0, 913.0, 2102.0, 5060.0, 13753.0, 40766.0, 135862.0, 482298.0, 262154.0, 68449.0, 22453.0, 7825.0, 3058.0, 1312.0, 625.0, 316.0, 187.0, 127.0, 75.0, 38.0, 28.0, 18.0, 9.0, 12.0, 8.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11224365234375, -0.10819530487060547, -0.10414695739746094, -0.1000986099243164, -0.09605026245117188, -0.09200191497802734, -0.08795356750488281, -0.08390522003173828, -0.07985687255859375, -0.07580852508544922, -0.07176017761230469, -0.06771183013916016, -0.06366348266601562, -0.059615135192871094, -0.05556678771972656, -0.05151844024658203, -0.0474700927734375, -0.04342174530029297, -0.03937339782714844, -0.035325050354003906, -0.031276702880859375, -0.027228355407714844, -0.023180007934570312, -0.01913166046142578, -0.01508331298828125, -0.011034965515136719, -0.0069866180419921875, -0.0029382705688476562, 0.001110076904296875, 0.005158424377441406, 0.009206771850585938, 0.013255119323730469, 0.017303466796875, 0.02135181427001953, 0.025400161743164062, 0.029448509216308594, 0.033496856689453125, 0.037545204162597656, 0.04159355163574219, 0.04564189910888672, 0.04969024658203125, 0.05373859405517578, 0.05778694152832031, 0.061835289001464844, 0.06588363647460938, 0.0699319839477539, 0.07398033142089844, 0.07802867889404297, 0.0820770263671875, 0.08612537384033203, 0.09017372131347656, 0.0942220687866211, 0.09827041625976562, 0.10231876373291016, 0.10636711120605469, 0.11041545867919922, 0.11446380615234375, 0.11851215362548828, 0.12256050109863281, 0.12660884857177734, 0.13065719604492188, 0.1347055435180664, 0.13875389099121094, 0.14280223846435547, 0.1468505859375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 9.0, 4.0, 7.0, 7.0, 9.0, 16.0, 13.0, 10.0, 22.0, 26.0, 49.0, 41.0, 58.0, 74.0, 130.0, 114.0, 87.0, 79.0, 58.0, 42.0, 29.0, 22.0, 15.0, 19.0, 11.0, 10.0, 4.0, 6.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.14111328125, -0.1373291015625, -0.133544921875, -0.1297607421875, -0.1259765625, -0.1221923828125, -0.118408203125, -0.1146240234375, -0.11083984375, -0.1070556640625, -0.103271484375, -0.0994873046875, -0.095703125, -0.0919189453125, -0.088134765625, -0.0843505859375, -0.08056640625, -0.0767822265625, -0.072998046875, -0.0692138671875, -0.0654296875, -0.0616455078125, -0.057861328125, -0.0540771484375, -0.05029296875, -0.0465087890625, -0.042724609375, -0.0389404296875, -0.03515625, -0.0313720703125, -0.027587890625, -0.0238037109375, -0.02001953125, -0.0162353515625, -0.012451171875, -0.0086669921875, -0.0048828125, -0.0010986328125, 0.002685546875, 0.0064697265625, 0.01025390625, 0.0140380859375, 0.017822265625, 0.0216064453125, 0.025390625, 0.0291748046875, 0.032958984375, 0.0367431640625, 0.04052734375, 0.0443115234375, 0.048095703125, 0.0518798828125, 0.0556640625, 0.0594482421875, 0.063232421875, 0.0670166015625, 0.07080078125, 0.0745849609375, 0.078369140625, 0.0821533203125, 0.0859375, 0.0897216796875, 0.093505859375, 0.0972900390625, 0.10107421875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 11.0, 28.0, 57.0, 103.0, 146.0, 204.0, 158.0, 124.0, 80.0, 42.0, 20.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.64121413230896, -1.5720226764678955, -1.502831220626831, -1.4336397647857666, -1.3644483089447021, -1.2952568531036377, -1.2260655164718628, -1.1568740606307983, -1.0876826047897339, -1.0184911489486694, -0.949299693107605, -0.8801082968711853, -0.8109168410301208, -0.7417253851890564, -0.6725339889526367, -0.6033425331115723, -0.5341510772705078, -0.46495962142944336, -0.3957681953907013, -0.32657676935195923, -0.2573853135108948, -0.18819385766983032, -0.11900243163108826, -0.04981100559234619, 0.01938045024871826, 0.08857189118862152, 0.15776333212852478, 0.22695477306842804, 0.2961462140083313, 0.36533766984939575, 0.4345290958881378, 0.5037205219268799, 0.5729122161865234, 0.6421036720275879, 0.7112951278686523, 0.780486524105072, 0.8496779799461365, 0.9188694357872009, 0.9880608320236206, 1.057252287864685, 1.1264437437057495, 1.195635199546814, 1.2648266553878784, 1.3340181112289429, 1.4032094478607178, 1.4724009037017822, 1.5415923595428467, 1.6107838153839111, 1.6799752712249756, 1.74916672706604, 1.8183581829071045, 1.887549638748169, 1.9567410945892334, 2.025932550430298, 2.0951240062713623, 2.1643152236938477, 2.233506679534912, 2.3026981353759766, 2.371889591217041, 2.4410810470581055, 2.51027250289917, 2.5794639587402344, 2.648655414581299, 2.7178468704223633, 2.7870383262634277]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 5.0, 12.0, 10.0, 9.0, 14.0, 12.0, 13.0, 20.0, 16.0, 18.0, 24.0, 34.0, 38.0, 34.0, 48.0, 42.0, 52.0, 38.0, 46.0, 45.0, 43.0, 37.0, 39.0, 40.0, 43.0, 36.0, 26.0, 33.0, 27.0, 28.0, 18.0, 24.0, 14.0, 18.0, 14.0, 6.0, 9.0, 9.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.005620002746582, -0.9786669015884399, -0.9517138004302979, -0.9247607588768005, -0.8978076577186584, -0.8708545565605164, -0.843901515007019, -0.816948413848877, -0.7899953126907349, -0.7630422115325928, -0.7360891103744507, -0.7091360688209534, -0.6821829676628113, -0.6552298665046692, -0.6282768249511719, -0.6013237237930298, -0.5743706226348877, -0.5474175214767456, -0.5204644203186035, -0.4935113787651062, -0.4665582776069641, -0.439605176448822, -0.4126521050930023, -0.3856990337371826, -0.3587459325790405, -0.33179283142089844, -0.30483976006507874, -0.27788668870925903, -0.25093358755111694, -0.22398050129413605, -0.19702741503715515, -0.17007432878017426, -0.14312124252319336, -0.11616815626621246, -0.08921507000923157, -0.06226198375225067, -0.035308897495269775, -0.00835581123828888, 0.018597275018692017, 0.04555036127567291, 0.07250344753265381, 0.0994565337896347, 0.1264096200466156, 0.1533627063035965, 0.1803157925605774, 0.2072688788175583, 0.23422196507453918, 0.2611750364303589, 0.288128137588501, 0.31508123874664307, 0.34203431010246277, 0.36898738145828247, 0.39594048261642456, 0.42289358377456665, 0.44984665513038635, 0.47679972648620605, 0.5037528276443481, 0.5307059288024902, 0.5576590299606323, 0.5846120715141296, 0.6115651726722717, 0.6385182738304138, 0.6654713153839111, 0.6924244165420532, 0.7193775177001953]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 16.0, 25.0, 24.0, 55.0, 68.0, 119.0, 186.0, 307.0, 473.0, 819.0, 1341.0, 2084.0, 3528.0, 6344.0, 10839.0, 19013.0, 34293.0, 63790.0, 123523.0, 264833.0, 646864.0, 1299127.0, 951314.0, 402989.0, 175153.0, 85333.0, 44568.0, 24516.0, 13475.0, 7753.0, 4493.0, 2723.0, 1607.0, 993.0, 646.0, 376.0, 249.0, 149.0, 96.0, 67.0, 30.0, 23.0, 19.0, 10.0, 10.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10504150390625, -0.1017303466796875, -0.098419189453125, -0.0951080322265625, -0.091796875, -0.0884857177734375, -0.085174560546875, -0.0818634033203125, -0.07855224609375, -0.0752410888671875, -0.071929931640625, -0.0686187744140625, -0.0653076171875, -0.0619964599609375, -0.058685302734375, -0.0553741455078125, -0.05206298828125, -0.0487518310546875, -0.045440673828125, -0.0421295166015625, -0.038818359375, -0.0355072021484375, -0.032196044921875, -0.0288848876953125, -0.02557373046875, -0.0222625732421875, -0.018951416015625, -0.0156402587890625, -0.0123291015625, -0.0090179443359375, -0.005706787109375, -0.0023956298828125, 0.00091552734375, 0.0042266845703125, 0.007537841796875, 0.0108489990234375, 0.01416015625, 0.0174713134765625, 0.020782470703125, 0.0240936279296875, 0.02740478515625, 0.0307159423828125, 0.034027099609375, 0.0373382568359375, 0.0406494140625, 0.0439605712890625, 0.047271728515625, 0.0505828857421875, 0.05389404296875, 0.0572052001953125, 0.060516357421875, 0.0638275146484375, 0.067138671875, 0.0704498291015625, 0.073760986328125, 0.0770721435546875, 0.08038330078125, 0.0836944580078125, 0.087005615234375, 0.0903167724609375, 0.0936279296875, 0.0969390869140625, 0.100250244140625, 0.1035614013671875, 0.10687255859375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 11.0, 9.0, 7.0, 10.0, 12.0, 18.0, 17.0, 20.0, 30.0, 28.0, 32.0, 30.0, 32.0, 34.0, 37.0, 51.0, 42.0, 53.0, 53.0, 48.0, 51.0, 53.0, 55.0, 39.0, 32.0, 24.0, 34.0, 22.0, 15.0, 29.0, 12.0, 15.0, 11.0, 8.0, 7.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09716796875, -0.09373092651367188, -0.09029388427734375, -0.08685684204101562, -0.0834197998046875, -0.07998275756835938, -0.07654571533203125, -0.07310867309570312, -0.069671630859375, -0.06623458862304688, -0.06279754638671875, -0.059360504150390625, -0.0559234619140625, -0.052486419677734375, -0.04904937744140625, -0.045612335205078125, -0.04217529296875, -0.038738250732421875, -0.03530120849609375, -0.031864166259765625, -0.0284271240234375, -0.024990081787109375, -0.02155303955078125, -0.018115997314453125, -0.014678955078125, -0.011241912841796875, -0.00780487060546875, -0.004367828369140625, -0.0009307861328125, 0.002506256103515625, 0.00594329833984375, 0.009380340576171875, 0.0128173828125, 0.016254425048828125, 0.01969146728515625, 0.023128509521484375, 0.0265655517578125, 0.030002593994140625, 0.03343963623046875, 0.036876678466796875, 0.040313720703125, 0.043750762939453125, 0.04718780517578125, 0.050624847412109375, 0.0540618896484375, 0.057498931884765625, 0.06093597412109375, 0.06437301635742188, 0.06781005859375, 0.07124710083007812, 0.07468414306640625, 0.07812118530273438, 0.0815582275390625, 0.08499526977539062, 0.08843231201171875, 0.09186935424804688, 0.095306396484375, 0.09874343872070312, 0.10218048095703125, 0.10561752319335938, 0.1090545654296875, 0.11249160766601562, 0.11592864990234375, 0.11936569213867188, 0.122802734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 8.0, 9.0, 20.0, 23.0, 40.0, 73.0, 115.0, 214.0, 375.0, 671.0, 1406.0, 3376.0, 9306.0, 31309.0, 122305.0, 588885.0, 2563303.0, 683528.0, 137372.0, 34671.0, 10425.0, 3630.0, 1553.0, 742.0, 400.0, 220.0, 128.0, 74.0, 34.0, 24.0, 16.0, 9.0, 8.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252197265625, -0.24269485473632812, -0.23319244384765625, -0.22369003295898438, -0.2141876220703125, -0.20468521118164062, -0.19518280029296875, -0.18568038940429688, -0.176177978515625, -0.16667556762695312, -0.15717315673828125, -0.14767074584960938, -0.1381683349609375, -0.12866592407226562, -0.11916351318359375, -0.10966110229492188, -0.10015869140625, -0.09065628051757812, -0.08115386962890625, -0.07165145874023438, -0.0621490478515625, -0.052646636962890625, -0.04314422607421875, -0.033641815185546875, -0.024139404296875, -0.014636993408203125, -0.00513458251953125, 0.004367828369140625, 0.0138702392578125, 0.023372650146484375, 0.03287506103515625, 0.042377471923828125, 0.0518798828125, 0.061382293701171875, 0.07088470458984375, 0.08038711547851562, 0.0898895263671875, 0.09939193725585938, 0.10889434814453125, 0.11839675903320312, 0.127899169921875, 0.13740158081054688, 0.14690399169921875, 0.15640640258789062, 0.1659088134765625, 0.17541122436523438, 0.18491363525390625, 0.19441604614257812, 0.20391845703125, 0.21342086791992188, 0.22292327880859375, 0.23242568969726562, 0.2419281005859375, 0.2514305114746094, 0.26093292236328125, 0.2704353332519531, 0.279937744140625, 0.2894401550292969, 0.29894256591796875, 0.3084449768066406, 0.3179473876953125, 0.3274497985839844, 0.33695220947265625, 0.3464546203613281, 0.35595703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 5.0, 7.0, 8.0, 14.0, 27.0, 23.0, 31.0, 43.0, 66.0, 75.0, 118.0, 171.0, 221.0, 369.0, 499.0, 637.0, 551.0, 346.0, 224.0, 168.0, 131.0, 106.0, 67.0, 38.0, 29.0, 28.0, 29.0, 12.0, 5.0, 5.0, 8.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269287109375, -0.2607612609863281, -0.25223541259765625, -0.24370956420898438, -0.2351837158203125, -0.22665786743164062, -0.21813201904296875, -0.20960617065429688, -0.201080322265625, -0.19255447387695312, -0.18402862548828125, -0.17550277709960938, -0.1669769287109375, -0.15845108032226562, -0.14992523193359375, -0.14139938354492188, -0.13287353515625, -0.12434768676757812, -0.11582183837890625, -0.10729598999023438, -0.0987701416015625, -0.09024429321289062, -0.08171844482421875, -0.07319259643554688, -0.064666748046875, -0.056140899658203125, -0.04761505126953125, -0.039089202880859375, -0.0305633544921875, -0.022037506103515625, -0.01351165771484375, -0.004985809326171875, 0.0035400390625, 0.012065887451171875, 0.02059173583984375, 0.029117584228515625, 0.0376434326171875, 0.046169281005859375, 0.05469512939453125, 0.06322097778320312, 0.071746826171875, 0.08027267456054688, 0.08879852294921875, 0.09732437133789062, 0.1058502197265625, 0.11437606811523438, 0.12290191650390625, 0.13142776489257812, 0.13995361328125, 0.14847946166992188, 0.15700531005859375, 0.16553115844726562, 0.1740570068359375, 0.18258285522460938, 0.19110870361328125, 0.19963455200195312, 0.208160400390625, 0.21668624877929688, 0.22521209716796875, 0.23373794555664062, 0.2422637939453125, 0.2507896423339844, 0.25931549072265625, 0.2678413391113281, 0.2763671875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 14.0, 20.0, 36.0, 49.0, 65.0, 93.0, 116.0, 132.0, 112.0, 121.0, 88.0, 58.0, 34.0, 18.0, 15.0, 10.0, 1.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9978046417236328, -1.9423831701278687, -1.8869616985321045, -1.8315402269363403, -1.7761187553405762, -1.720697283744812, -1.6652758121490479, -1.6098544597625732, -1.5544328689575195, -1.4990113973617554, -1.4435899257659912, -1.388168454170227, -1.332746982574463, -1.2773255109786987, -1.2219040393829346, -1.16648268699646, -1.1110612154006958, -1.0556397438049316, -1.0002182722091675, -0.9447968006134033, -0.8893753290176392, -0.833953857421875, -0.7785324454307556, -0.7231109738349915, -0.6676895022392273, -0.6122680306434631, -0.556846559047699, -0.5014251470565796, -0.44600364565849304, -0.3905821740627289, -0.3351607322692871, -0.27973926067352295, -0.22431766986846924, -0.16889619827270508, -0.11347474157810211, -0.058053284883499146, -0.0026318132877349854, 0.052789658308029175, 0.10821110010147095, 0.1636325716972351, 0.21905404329299927, 0.2744755148887634, 0.3298969864845276, 0.38531842827796936, 0.4407398998737335, 0.4961613714694977, 0.5515828132629395, 0.6070042848587036, 0.6624257564544678, 0.7178472280502319, 0.7732686996459961, 0.8286901712417603, 0.8841116428375244, 0.9395331144332886, 0.994954526424408, 1.0503759384155273, 1.105797529220581, 1.1612190008163452, 1.2166404724121094, 1.2720619440078735, 1.3274834156036377, 1.3829048871994019, 1.438326358795166, 1.4937477111816406, 1.5491691827774048]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 6.0, 8.0, 16.0, 9.0, 9.0, 18.0, 17.0, 17.0, 32.0, 22.0, 26.0, 37.0, 38.0, 52.0, 40.0, 50.0, 38.0, 37.0, 30.0, 45.0, 35.0, 29.0, 32.0, 35.0, 53.0, 23.0, 32.0, 29.0, 20.0, 25.0, 26.0, 18.0, 13.0, 9.0, 13.0, 12.0, 16.0, 5.0, 4.0, 3.0, 1.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.8304241299629211, -0.8052428960800171, -0.7800617218017578, -0.7548804879188538, -0.7296993136405945, -0.7045180797576904, -0.6793369054794312, -0.6541556715965271, -0.628974437713623, -0.603793203830719, -0.5786120295524597, -0.5534307956695557, -0.5282496213912964, -0.5030683875083923, -0.47788718342781067, -0.452705979347229, -0.42752477526664734, -0.4023435711860657, -0.377162367105484, -0.35198116302490234, -0.3267999291419983, -0.3016187250614166, -0.27643752098083496, -0.2512562870979309, -0.22607509791851044, -0.20089389383792877, -0.1757126748561859, -0.15053147077560425, -0.12535026669502258, -0.10016904771327972, -0.07498784363269806, -0.0498066246509552, -0.024625420570373535, 0.0005557890981435776, 0.02573699876666069, 0.050918206572532654, 0.07609941810369492, 0.10128062963485718, 0.12646183371543884, 0.1516430526971817, 0.17682425677776337, 0.20200546085834503, 0.2271866798400879, 0.25236788392066956, 0.2775490880012512, 0.3027303218841553, 0.32791149616241455, 0.3530927300453186, 0.37827393412590027, 0.40345513820648193, 0.4286363422870636, 0.45381754636764526, 0.4789987802505493, 0.5041799545288086, 0.5293611884117126, 0.5545424222946167, 0.579723596572876, 0.60490483045578, 0.6300860047340393, 0.6552672386169434, 0.6804484128952026, 0.7056296467781067, 0.7308108806610107, 0.75599205493927, 0.7811732888221741]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 12.0, 7.0, 21.0, 35.0, 46.0, 87.0, 124.0, 230.0, 371.0, 614.0, 1117.0, 1998.0, 3261.0, 5795.0, 9867.0, 17198.0, 31162.0, 65839.0, 185834.0, 392505.0, 191375.0, 67709.0, 32080.0, 17337.0, 9974.0, 5869.0, 3395.0, 1923.0, 1079.0, 707.0, 381.0, 245.0, 151.0, 84.0, 55.0, 29.0, 19.0, 12.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24169921875, -0.23525619506835938, -0.22881317138671875, -0.22237014770507812, -0.2159271240234375, -0.20948410034179688, -0.20304107666015625, -0.19659805297851562, -0.190155029296875, -0.18371200561523438, -0.17726898193359375, -0.17082595825195312, -0.1643829345703125, -0.15793991088867188, -0.15149688720703125, -0.14505386352539062, -0.13861083984375, -0.13216781616210938, -0.12572479248046875, -0.11928176879882812, -0.1128387451171875, -0.10639572143554688, -0.09995269775390625, -0.09350967407226562, -0.087066650390625, -0.08062362670898438, -0.07418060302734375, -0.06773757934570312, -0.0612945556640625, -0.054851531982421875, -0.04840850830078125, -0.041965484619140625, -0.0355224609375, -0.029079437255859375, -0.02263641357421875, -0.016193389892578125, -0.0097503662109375, -0.003307342529296875, 0.00313568115234375, 0.009578704833984375, 0.016021728515625, 0.022464752197265625, 0.02890777587890625, 0.035350799560546875, 0.0417938232421875, 0.048236846923828125, 0.05467987060546875, 0.061122894287109375, 0.06756591796875, 0.07400894165039062, 0.08045196533203125, 0.08689498901367188, 0.0933380126953125, 0.09978103637695312, 0.10622406005859375, 0.11266708374023438, 0.119110107421875, 0.12555313110351562, 0.13199615478515625, 0.13843917846679688, 0.1448822021484375, 0.15132522583007812, 0.15776824951171875, 0.16421127319335938, 0.170654296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 11.0, 3.0, 4.0, 9.0, 14.0, 15.0, 13.0, 13.0, 20.0, 17.0, 24.0, 33.0, 30.0, 39.0, 39.0, 52.0, 32.0, 40.0, 41.0, 40.0, 53.0, 41.0, 41.0, 39.0, 33.0, 35.0, 33.0, 39.0, 42.0, 14.0, 25.0, 22.0, 18.0, 19.0, 13.0, 15.0, 6.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10174560546875, -0.09845352172851562, -0.09516143798828125, -0.09186935424804688, -0.0885772705078125, -0.08528518676757812, -0.08199310302734375, -0.07870101928710938, -0.075408935546875, -0.07211685180664062, -0.06882476806640625, -0.06553268432617188, -0.0622406005859375, -0.058948516845703125, -0.05565643310546875, -0.052364349365234375, -0.049072265625, -0.045780181884765625, -0.04248809814453125, -0.039196014404296875, -0.0359039306640625, -0.032611846923828125, -0.02931976318359375, -0.026027679443359375, -0.022735595703125, -0.019443511962890625, -0.01615142822265625, -0.012859344482421875, -0.0095672607421875, -0.006275177001953125, -0.00298309326171875, 0.000308990478515625, 0.00360107421875, 0.006893157958984375, 0.01018524169921875, 0.013477325439453125, 0.0167694091796875, 0.020061492919921875, 0.02335357666015625, 0.026645660400390625, 0.029937744140625, 0.033229827880859375, 0.03652191162109375, 0.039813995361328125, 0.0431060791015625, 0.046398162841796875, 0.04969024658203125, 0.052982330322265625, 0.0562744140625, 0.059566497802734375, 0.06285858154296875, 0.06615066528320312, 0.0694427490234375, 0.07273483276367188, 0.07602691650390625, 0.07931900024414062, 0.082611083984375, 0.08590316772460938, 0.08919525146484375, 0.09248733520507812, 0.0957794189453125, 0.09907150268554688, 0.10236358642578125, 0.10565567016601562, 0.10894775390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 11.0, 10.0, 14.0, 16.0, 28.0, 33.0, 32.0, 70.0, 102.0, 169.0, 238.0, 498.0, 775.0, 1527.0, 3329.0, 7458.0, 16822.0, 41146.0, 130714.0, 497668.0, 242104.0, 62719.0, 23809.0, 10124.0, 4625.0, 2046.0, 1027.0, 533.0, 308.0, 204.0, 118.0, 75.0, 53.0, 37.0, 30.0, 13.0, 13.0, 11.0, 12.0, 7.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.29638671875, -0.2870368957519531, -0.27768707275390625, -0.2683372497558594, -0.2589874267578125, -0.24963760375976562, -0.24028778076171875, -0.23093795776367188, -0.221588134765625, -0.21223831176757812, -0.20288848876953125, -0.19353866577148438, -0.1841888427734375, -0.17483901977539062, -0.16548919677734375, -0.15613937377929688, -0.14678955078125, -0.13743972778320312, -0.12808990478515625, -0.11874008178710938, -0.1093902587890625, -0.10004043579101562, -0.09069061279296875, -0.08134078979492188, -0.071990966796875, -0.06264114379882812, -0.05329132080078125, -0.043941497802734375, -0.0345916748046875, -0.025241851806640625, -0.01589202880859375, -0.006542205810546875, 0.0028076171875, 0.012157440185546875, 0.02150726318359375, 0.030857086181640625, 0.0402069091796875, 0.049556732177734375, 0.05890655517578125, 0.06825637817382812, 0.077606201171875, 0.08695602416992188, 0.09630584716796875, 0.10565567016601562, 0.1150054931640625, 0.12435531616210938, 0.13370513916015625, 0.14305496215820312, 0.15240478515625, 0.16175460815429688, 0.17110443115234375, 0.18045425415039062, 0.1898040771484375, 0.19915390014648438, 0.20850372314453125, 0.21785354614257812, 0.227203369140625, 0.23655319213867188, 0.24590301513671875, 0.2552528381347656, 0.2646026611328125, 0.2739524841308594, 0.28330230712890625, 0.2926521301269531, 0.302001953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 5.0, 3.0, 10.0, 5.0, 9.0, 6.0, 13.0, 19.0, 31.0, 23.0, 22.0, 20.0, 32.0, 44.0, 37.0, 36.0, 34.0, 32.0, 43.0, 48.0, 40.0, 34.0, 28.0, 30.0, 45.0, 35.0, 37.0, 41.0, 27.0, 24.0, 23.0, 31.0, 26.0, 18.0, 16.0, 15.0, 13.0, 6.0, 8.0, 10.0, 6.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.31005859375, -0.3011817932128906, -0.29230499267578125, -0.2834281921386719, -0.2745513916015625, -0.2656745910644531, -0.25679779052734375, -0.24792098999023438, -0.239044189453125, -0.23016738891601562, -0.22129058837890625, -0.21241378784179688, -0.2035369873046875, -0.19466018676757812, -0.18578338623046875, -0.17690658569335938, -0.16802978515625, -0.15915298461914062, -0.15027618408203125, -0.14139938354492188, -0.1325225830078125, -0.12364578247070312, -0.11476898193359375, -0.10589218139648438, -0.097015380859375, -0.08813858032226562, -0.07926177978515625, -0.07038497924804688, -0.0615081787109375, -0.052631378173828125, -0.04375457763671875, -0.034877777099609375, -0.0260009765625, -0.017124176025390625, -0.00824737548828125, 0.000629425048828125, 0.0095062255859375, 0.018383026123046875, 0.02725982666015625, 0.036136627197265625, 0.045013427734375, 0.053890228271484375, 0.06276702880859375, 0.07164382934570312, 0.0805206298828125, 0.08939743041992188, 0.09827423095703125, 0.10715103149414062, 0.11602783203125, 0.12490463256835938, 0.13378143310546875, 0.14265823364257812, 0.1515350341796875, 0.16041183471679688, 0.16928863525390625, 0.17816543579101562, 0.187042236328125, 0.19591903686523438, 0.20479583740234375, 0.21367263793945312, 0.2225494384765625, 0.23142623901367188, 0.24030303955078125, 0.24917984008789062, 0.258056640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 8.0, 14.0, 20.0, 30.0, 45.0, 66.0, 81.0, 156.0, 180.0, 293.0, 448.0, 709.0, 1142.0, 2021.0, 3750.0, 7562.0, 15601.0, 33318.0, 87061.0, 314077.0, 397638.0, 107895.0, 39939.0, 17732.0, 8610.0, 4335.0, 2278.0, 1298.0, 738.0, 511.0, 297.0, 219.0, 150.0, 105.0, 60.0, 49.0, 41.0, 21.0, 9.0, 10.0, 5.0, 4.0, 3.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11639404296875, -0.11252689361572266, -0.10865974426269531, -0.10479259490966797, -0.10092544555664062, -0.09705829620361328, -0.09319114685058594, -0.0893239974975586, -0.08545684814453125, -0.0815896987915039, -0.07772254943847656, -0.07385540008544922, -0.06998825073242188, -0.06612110137939453, -0.06225395202636719, -0.058386802673339844, -0.0545196533203125, -0.050652503967285156, -0.04678535461425781, -0.04291820526123047, -0.039051055908203125, -0.03518390655517578, -0.03131675720214844, -0.027449607849121094, -0.02358245849609375, -0.019715309143066406, -0.015848159790039062, -0.011981010437011719, -0.008113861083984375, -0.004246711730957031, -0.0003795623779296875, 0.0034875869750976562, 0.007354736328125, 0.011221885681152344, 0.015089035034179688, 0.01895618438720703, 0.022823333740234375, 0.02669048309326172, 0.030557632446289062, 0.034424781799316406, 0.03829193115234375, 0.042159080505371094, 0.04602622985839844, 0.04989337921142578, 0.053760528564453125, 0.05762767791748047, 0.06149482727050781, 0.06536197662353516, 0.0692291259765625, 0.07309627532958984, 0.07696342468261719, 0.08083057403564453, 0.08469772338867188, 0.08856487274169922, 0.09243202209472656, 0.0962991714477539, 0.10016632080078125, 0.1040334701538086, 0.10790061950683594, 0.11176776885986328, 0.11563491821289062, 0.11950206756591797, 0.12336921691894531, 0.12723636627197266, 0.131103515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 8.0, 3.0, 5.0, 3.0, 6.0, 7.0, 10.0, 12.0, 16.0, 23.0, 25.0, 38.0, 53.0, 74.0, 140.0, 156.0, 147.0, 81.0, 52.0, 40.0, 33.0, 17.0, 10.0, 14.0, 11.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.786252975463867e-05, -4.624016582965851e-05, -4.4617801904678345e-05, -4.299543797969818e-05, -4.137307405471802e-05, -3.9750710129737854e-05, -3.812834620475769e-05, -3.650598227977753e-05, -3.488361835479736e-05, -3.32612544298172e-05, -3.1638890504837036e-05, -3.0016526579856873e-05, -2.839416265487671e-05, -2.6771798729896545e-05, -2.5149434804916382e-05, -2.3527070879936218e-05, -2.1904706954956055e-05, -2.028234302997589e-05, -1.8659979104995728e-05, -1.7037615180015564e-05, -1.54152512550354e-05, -1.3792887330055237e-05, -1.2170523405075073e-05, -1.054815948009491e-05, -8.925795555114746e-06, -7.3034316301345825e-06, -5.681067705154419e-06, -4.058703780174255e-06, -2.436339855194092e-06, -8.139759302139282e-07, 8.083879947662354e-07, 2.430751919746399e-06, 4.0531158447265625e-06, 5.675479769706726e-06, 7.29784369468689e-06, 8.920207619667053e-06, 1.0542571544647217e-05, 1.216493546962738e-05, 1.3787299394607544e-05, 1.5409663319587708e-05, 1.703202724456787e-05, 1.8654391169548035e-05, 2.0276755094528198e-05, 2.1899119019508362e-05, 2.3521482944488525e-05, 2.514384686946869e-05, 2.6766210794448853e-05, 2.8388574719429016e-05, 3.001093864440918e-05, 3.163330256938934e-05, 3.325566649436951e-05, 3.487803041934967e-05, 3.6500394344329834e-05, 3.812275826931e-05, 3.974512219429016e-05, 4.1367486119270325e-05, 4.298985004425049e-05, 4.461221396923065e-05, 4.6234577894210815e-05, 4.785694181919098e-05, 4.947930574417114e-05, 5.1101669669151306e-05, 5.272403359413147e-05, 5.434639751911163e-05, 5.59687614440918e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 6.0, 10.0, 13.0, 23.0, 29.0, 35.0, 72.0, 102.0, 156.0, 201.0, 414.0, 677.0, 1115.0, 2186.0, 4582.0, 13752.0, 54174.0, 310676.0, 527593.0, 97405.0, 21998.0, 6873.0, 2901.0, 1457.0, 829.0, 479.0, 258.0, 175.0, 136.0, 59.0, 48.0, 35.0, 17.0, 9.0, 11.0, 11.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.2054443359375, -0.20006370544433594, -0.19468307495117188, -0.1893024444580078, -0.18392181396484375, -0.1785411834716797, -0.17316055297851562, -0.16777992248535156, -0.1623992919921875, -0.15701866149902344, -0.15163803100585938, -0.1462574005126953, -0.14087677001953125, -0.1354961395263672, -0.13011550903320312, -0.12473487854003906, -0.119354248046875, -0.11397361755371094, -0.10859298706054688, -0.10321235656738281, -0.09783172607421875, -0.09245109558105469, -0.08707046508789062, -0.08168983459472656, -0.0763092041015625, -0.07092857360839844, -0.06554794311523438, -0.06016731262207031, -0.05478668212890625, -0.04940605163574219, -0.044025421142578125, -0.03864479064941406, -0.03326416015625, -0.027883529663085938, -0.022502899169921875, -0.017122268676757812, -0.01174163818359375, -0.0063610076904296875, -0.000980377197265625, 0.0044002532958984375, 0.0097808837890625, 0.015161514282226562, 0.020542144775390625, 0.025922775268554688, 0.03130340576171875, 0.03668403625488281, 0.042064666748046875, 0.04744529724121094, 0.052825927734375, 0.05820655822753906, 0.06358718872070312, 0.06896781921386719, 0.07434844970703125, 0.07972908020019531, 0.08510971069335938, 0.09049034118652344, 0.0958709716796875, 0.10125160217285156, 0.10663223266601562, 0.11201286315917969, 0.11739349365234375, 0.12277412414550781, 0.12815475463867188, 0.13353538513183594, 0.138916015625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 7.0, 10.0, 3.0, 20.0, 15.0, 16.0, 24.0, 38.0, 57.0, 87.0, 89.0, 98.0, 109.0, 94.0, 72.0, 61.0, 43.0, 38.0, 21.0, 16.0, 14.0, 12.0, 10.0, 5.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.12188720703125, -0.11784076690673828, -0.11379432678222656, -0.10974788665771484, -0.10570144653320312, -0.1016550064086914, -0.09760856628417969, -0.09356212615966797, -0.08951568603515625, -0.08546924591064453, -0.08142280578613281, -0.0773763656616211, -0.07332992553710938, -0.06928348541259766, -0.06523704528808594, -0.06119060516357422, -0.0571441650390625, -0.05309772491455078, -0.04905128479003906, -0.045004844665527344, -0.040958404541015625, -0.036911964416503906, -0.03286552429199219, -0.02881908416748047, -0.02477264404296875, -0.02072620391845703, -0.016679763793945312, -0.012633323669433594, -0.008586883544921875, -0.004540443420410156, -0.0004940032958984375, 0.0035524368286132812, 0.007598876953125, 0.011645317077636719, 0.015691757202148438, 0.019738197326660156, 0.023784637451171875, 0.027831077575683594, 0.03187751770019531, 0.03592395782470703, 0.03997039794921875, 0.04401683807373047, 0.04806327819824219, 0.052109718322753906, 0.056156158447265625, 0.060202598571777344, 0.06424903869628906, 0.06829547882080078, 0.0723419189453125, 0.07638835906982422, 0.08043479919433594, 0.08448123931884766, 0.08852767944335938, 0.0925741195678711, 0.09662055969238281, 0.10066699981689453, 0.10471343994140625, 0.10875988006591797, 0.11280632019042969, 0.1168527603149414, 0.12089920043945312, 0.12494564056396484, 0.12899208068847656, 0.13303852081298828, 0.1370849609375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 2.0, 16.0, 24.0, 30.0, 41.0, 82.0, 113.0, 109.0, 136.0, 121.0, 107.0, 92.0, 52.0, 30.0, 20.0, 9.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9583238363265991, -1.9062167406082153, -1.8541096448898315, -1.8020026683807373, -1.7498955726623535, -1.6977884769439697, -1.645681381225586, -1.5935742855072021, -1.5414671897888184, -1.4893600940704346, -1.4372529983520508, -1.385145902633667, -1.3330389261245728, -1.280931830406189, -1.2288247346878052, -1.1767176389694214, -1.1246106624603271, -1.0725035667419434, -1.0203964710235596, -0.9682894349098206, -0.9161823987960815, -0.8640753030776978, -0.811968207359314, -0.7598611116409302, -0.7077540755271912, -0.6556469798088074, -0.6035399436950684, -0.5514328479766846, -0.49932578206062317, -0.44721871614456177, -0.395111620426178, -0.3430045545101166, -0.2908976078033447, -0.23879054188728333, -0.18668346107006073, -0.13457638025283813, -0.08246931433677673, -0.030362248420715332, 0.021744847297668457, 0.07385191321372986, 0.12595897912979126, 0.17806604504585266, 0.23017312586307526, 0.28228020668029785, 0.33438727259635925, 0.38649433851242065, 0.43860143423080444, 0.49070850014686584, 0.5428155660629272, 0.594922661781311, 0.64702969789505, 0.6991367936134338, 0.7512438297271729, 0.8033509254455566, 0.8554580211639404, 0.9075651168823242, 0.9596721529960632, 1.0117791891098022, 1.063886284828186, 1.1159933805465698, 1.1681004762649536, 1.2202074527740479, 1.2723145484924316, 1.3244216442108154, 1.3765287399291992]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 3.0, 4.0, 12.0, 12.0, 9.0, 16.0, 14.0, 14.0, 14.0, 27.0, 29.0, 25.0, 31.0, 29.0, 38.0, 39.0, 40.0, 40.0, 33.0, 43.0, 40.0, 54.0, 33.0, 57.0, 33.0, 30.0, 29.0, 39.0, 31.0, 23.0, 19.0, 16.0, 18.0, 26.0, 13.0, 9.0, 8.0, 15.0, 6.0, 9.0, 4.0, 3.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.7946980595588684, -0.7698838710784912, -0.7450696229934692, -0.7202553749084473, -0.6954411864280701, -0.6706269979476929, -0.6458127498626709, -0.6209985017776489, -0.5961843132972717, -0.5713701248168945, -0.5465558767318726, -0.5217416286468506, -0.4969274401664734, -0.4721132218837738, -0.4472990036010742, -0.42248478531837463, -0.39767056703567505, -0.37285634875297546, -0.3480421304702759, -0.3232279121875763, -0.2984136939048767, -0.2735994756221771, -0.24878525733947754, -0.22397103905677795, -0.19915682077407837, -0.17434260249137878, -0.1495283842086792, -0.12471416592597961, -0.09989994764328003, -0.07508572936058044, -0.05027151107788086, -0.025457292795181274, -0.0006430149078369141, 0.02417120337486267, 0.048985421657562256, 0.07379963994026184, 0.09861385822296143, 0.12342807650566101, 0.1482422947883606, 0.17305651307106018, 0.19787073135375977, 0.22268494963645935, 0.24749916791915894, 0.2723133862018585, 0.2971276044845581, 0.3219418227672577, 0.3467560410499573, 0.37157025933265686, 0.39638447761535645, 0.42119869589805603, 0.4460129141807556, 0.4708271324634552, 0.4956413507461548, 0.5204555988311768, 0.545269787311554, 0.5700839757919312, 0.5948982238769531, 0.6197124719619751, 0.6445266604423523, 0.6693408489227295, 0.6941550970077515, 0.7189693450927734, 0.7437835335731506, 0.7685977220535278, 0.7934119701385498]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 10.0, 10.0, 20.0, 25.0, 36.0, 58.0, 72.0, 135.0, 248.0, 379.0, 584.0, 951.0, 1613.0, 2957.0, 5310.0, 10258.0, 20202.0, 42152.0, 93665.0, 229506.0, 652838.0, 1515789.0, 1006909.0, 357184.0, 137305.0, 59370.0, 27508.0, 13374.0, 6818.0, 3596.0, 2102.0, 1301.0, 730.0, 454.0, 289.0, 166.0, 125.0, 84.0, 52.0, 40.0, 24.0, 13.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.119384765625, -0.11549758911132812, -0.11161041259765625, -0.10772323608398438, -0.1038360595703125, -0.09994888305664062, -0.09606170654296875, -0.09217453002929688, -0.088287353515625, -0.08440017700195312, -0.08051300048828125, -0.07662582397460938, -0.0727386474609375, -0.06885147094726562, -0.06496429443359375, -0.061077117919921875, -0.05718994140625, -0.053302764892578125, -0.04941558837890625, -0.045528411865234375, -0.0416412353515625, -0.037754058837890625, -0.03386688232421875, -0.029979705810546875, -0.026092529296875, -0.022205352783203125, -0.01831817626953125, -0.014430999755859375, -0.0105438232421875, -0.006656646728515625, -0.00276947021484375, 0.001117706298828125, 0.0050048828125, 0.008892059326171875, 0.01277923583984375, 0.016666412353515625, 0.0205535888671875, 0.024440765380859375, 0.02832794189453125, 0.032215118408203125, 0.036102294921875, 0.039989471435546875, 0.04387664794921875, 0.047763824462890625, 0.0516510009765625, 0.055538177490234375, 0.05942535400390625, 0.06331253051757812, 0.06719970703125, 0.07108688354492188, 0.07497406005859375, 0.07886123657226562, 0.0827484130859375, 0.08663558959960938, 0.09052276611328125, 0.09440994262695312, 0.098297119140625, 0.10218429565429688, 0.10607147216796875, 0.10995864868164062, 0.1138458251953125, 0.11773300170898438, 0.12162017822265625, 0.12550735473632812, 0.12939453125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 7.0, 6.0, 5.0, 9.0, 9.0, 14.0, 11.0, 17.0, 17.0, 16.0, 26.0, 26.0, 40.0, 35.0, 35.0, 36.0, 48.0, 64.0, 41.0, 45.0, 46.0, 40.0, 44.0, 50.0, 48.0, 41.0, 32.0, 31.0, 31.0, 26.0, 26.0, 17.0, 20.0, 7.0, 4.0, 9.0, 5.0, 9.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1131591796875, -0.10970211029052734, -0.10624504089355469, -0.10278797149658203, -0.09933090209960938, -0.09587383270263672, -0.09241676330566406, -0.0889596939086914, -0.08550262451171875, -0.0820455551147461, -0.07858848571777344, -0.07513141632080078, -0.07167434692382812, -0.06821727752685547, -0.06476020812988281, -0.061303138732910156, -0.0578460693359375, -0.054388999938964844, -0.05093193054199219, -0.04747486114501953, -0.044017791748046875, -0.04056072235107422, -0.03710365295410156, -0.033646583557128906, -0.03018951416015625, -0.026732444763183594, -0.023275375366210938, -0.01981830596923828, -0.016361236572265625, -0.012904167175292969, -0.009447097778320312, -0.005990028381347656, -0.002532958984375, 0.0009241104125976562, 0.0043811798095703125, 0.007838249206542969, 0.011295318603515625, 0.014752388000488281, 0.018209457397460938, 0.021666526794433594, 0.02512359619140625, 0.028580665588378906, 0.03203773498535156, 0.03549480438232422, 0.038951873779296875, 0.04240894317626953, 0.04586601257324219, 0.049323081970214844, 0.0527801513671875, 0.056237220764160156, 0.05969429016113281, 0.06315135955810547, 0.06660842895507812, 0.07006549835205078, 0.07352256774902344, 0.0769796371459961, 0.08043670654296875, 0.0838937759399414, 0.08735084533691406, 0.09080791473388672, 0.09426498413085938, 0.09772205352783203, 0.10117912292480469, 0.10463619232177734, 0.10809326171875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 13.0, 15.0, 30.0, 36.0, 49.0, 103.0, 152.0, 230.0, 392.0, 792.0, 1466.0, 3280.0, 8899.0, 29216.0, 131525.0, 881619.0, 2668688.0, 371283.0, 68795.0, 17181.0, 5780.0, 2312.0, 1066.0, 534.0, 299.0, 215.0, 109.0, 70.0, 42.0, 30.0, 16.0, 16.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.4033203125, -0.3922080993652344, -0.38109588623046875, -0.3699836730957031, -0.3588714599609375, -0.3477592468261719, -0.33664703369140625, -0.3255348205566406, -0.314422607421875, -0.3033103942871094, -0.29219818115234375, -0.2810859680175781, -0.2699737548828125, -0.2588615417480469, -0.24774932861328125, -0.23663711547851562, -0.22552490234375, -0.21441268920898438, -0.20330047607421875, -0.19218826293945312, -0.1810760498046875, -0.16996383666992188, -0.15885162353515625, -0.14773941040039062, -0.136627197265625, -0.12551498413085938, -0.11440277099609375, -0.10329055786132812, -0.0921783447265625, -0.08106613159179688, -0.06995391845703125, -0.058841705322265625, -0.0477294921875, -0.036617279052734375, -0.02550506591796875, -0.014392852783203125, -0.0032806396484375, 0.007831573486328125, 0.01894378662109375, 0.030055999755859375, 0.041168212890625, 0.052280426025390625, 0.06339263916015625, 0.07450485229492188, 0.0856170654296875, 0.09672927856445312, 0.10784149169921875, 0.11895370483398438, 0.13006591796875, 0.14117813110351562, 0.15229034423828125, 0.16340255737304688, 0.1745147705078125, 0.18562698364257812, 0.19673919677734375, 0.20785140991210938, 0.218963623046875, 0.23007583618164062, 0.24118804931640625, 0.2523002624511719, 0.2634124755859375, 0.2745246887207031, 0.28563690185546875, 0.2967491149902344, 0.307861328125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 10.0, 13.0, 18.0, 21.0, 30.0, 54.0, 88.0, 137.0, 180.0, 311.0, 490.0, 846.0, 737.0, 428.0, 261.0, 137.0, 89.0, 73.0, 52.0, 25.0, 16.0, 15.0, 8.0, 14.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.320556640625, -0.30941009521484375, -0.2982635498046875, -0.28711700439453125, -0.275970458984375, -0.26482391357421875, -0.2536773681640625, -0.24253082275390625, -0.23138427734375, -0.22023773193359375, -0.2090911865234375, -0.19794464111328125, -0.186798095703125, -0.17565155029296875, -0.1645050048828125, -0.15335845947265625, -0.1422119140625, -0.13106536865234375, -0.1199188232421875, -0.10877227783203125, -0.097625732421875, -0.08647918701171875, -0.0753326416015625, -0.06418609619140625, -0.05303955078125, -0.04189300537109375, -0.0307464599609375, -0.01959991455078125, -0.008453369140625, 0.00269317626953125, 0.0138397216796875, 0.02498626708984375, 0.0361328125, 0.04727935791015625, 0.0584259033203125, 0.06957244873046875, 0.080718994140625, 0.09186553955078125, 0.1030120849609375, 0.11415863037109375, 0.12530517578125, 0.13645172119140625, 0.1475982666015625, 0.15874481201171875, 0.169891357421875, 0.18103790283203125, 0.1921844482421875, 0.20333099365234375, 0.2144775390625, 0.22562408447265625, 0.2367706298828125, 0.24791717529296875, 0.259063720703125, 0.27021026611328125, 0.2813568115234375, 0.29250335693359375, 0.30364990234375, 0.31479644775390625, 0.3259429931640625, 0.33708953857421875, 0.348236083984375, 0.35938262939453125, 0.3705291748046875, 0.38167572021484375, 0.392822265625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 17.0, 23.0, 64.0, 139.0, 162.0, 180.0, 186.0, 103.0, 71.0, 27.0, 9.0, 9.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8788681030273438, -3.780748128890991, -3.6826281547546387, -3.5845084190368652, -3.4863884449005127, -3.38826847076416, -3.2901484966278076, -3.192028522491455, -3.0939085483551025, -2.99578857421875, -2.8976686000823975, -2.799548625946045, -2.7014288902282715, -2.603308916091919, -2.5051889419555664, -2.407068967819214, -2.3089489936828613, -2.210829019546509, -2.1127090454101562, -2.014589309692383, -1.9164692163467407, -1.8183493614196777, -1.7202293872833252, -1.6221094131469727, -1.5239896774291992, -1.4258697032928467, -1.3277498483657837, -1.2296298742294312, -1.1315099000930786, -1.0333900451660156, -0.9352700710296631, -0.8371500968933105, -0.739030122756958, -0.6409102082252502, -0.5427902340888977, -0.44467031955718994, -0.3465503752231598, -0.24843043088912964, -0.15031051635742188, -0.052190542221069336, 0.04592937231063843, 0.14404931664466858, 0.24216924607753754, 0.3402891755104065, 0.43840911984443665, 0.5365290641784668, 0.6346489787101746, 0.7327689528465271, 0.8308888673782349, 0.9290087819099426, 1.0271286964416504, 1.125248670578003, 1.2233686447143555, 1.321488618850708, 1.419608473777771, 1.5177284479141235, 1.6158483028411865, 1.713968276977539, 1.812088131904602, 1.9102081060409546, 2.0083279609680176, 2.10644793510437, 2.2045679092407227, 2.302687883377075, 2.4008078575134277]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 5.0, 13.0, 7.0, 16.0, 17.0, 11.0, 15.0, 13.0, 23.0, 24.0, 29.0, 35.0, 35.0, 42.0, 39.0, 40.0, 53.0, 42.0, 44.0, 41.0, 41.0, 48.0, 41.0, 40.0, 41.0, 32.0, 24.0, 31.0, 27.0, 23.0, 18.0, 14.0, 15.0, 7.0, 12.0, 15.0, 10.0, 6.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.9571223258972168, -0.9280504584312439, -0.8989786505699158, -0.8699067831039429, -0.8408349752426147, -0.8117631077766418, -0.782691240310669, -0.7536194324493408, -0.7245475649833679, -0.695475697517395, -0.6664038896560669, -0.637332022190094, -0.6082601547241211, -0.579188346862793, -0.5501164793968201, -0.5210446119308472, -0.49197280406951904, -0.46290096640586853, -0.433829128742218, -0.4047572612762451, -0.3756854236125946, -0.3466135859489441, -0.3175417184829712, -0.2884698808193207, -0.25939804315567017, -0.23032620549201965, -0.20125435292720795, -0.17218250036239624, -0.14311066269874573, -0.11403882503509521, -0.08496697247028351, -0.0558951199054718, -0.026823222637176514, 0.002248622477054596, 0.031320467591285706, 0.060392312705516815, 0.08946415781974792, 0.11853599548339844, 0.14760784804821014, 0.17667970061302185, 0.20575153827667236, 0.23482337594032288, 0.2638952136039734, 0.2929670810699463, 0.3220389187335968, 0.3511107563972473, 0.3801826238632202, 0.4092544615268707, 0.43832629919052124, 0.46739813685417175, 0.49646997451782227, 0.5255418419837952, 0.5546137094497681, 0.5836855173110962, 0.6127573847770691, 0.641829252243042, 0.6709010601043701, 0.699972927570343, 0.7290447354316711, 0.758116602897644, 0.7871884107589722, 0.8162602782249451, 0.845332145690918, 0.8744039535522461, 0.903475821018219]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 9.0, 27.0, 48.0, 74.0, 121.0, 219.0, 378.0, 718.0, 1389.0, 2639.0, 5290.0, 11864.0, 30949.0, 94042.0, 262112.0, 360826.0, 181160.0, 59348.0, 20570.0, 8436.0, 4009.0, 1963.0, 1051.0, 540.0, 346.0, 169.0, 89.0, 58.0, 33.0, 24.0, 10.0, 10.0, 4.0, 4.0, 1.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1861572265625, -0.1795787811279297, -0.17300033569335938, -0.16642189025878906, -0.15984344482421875, -0.15326499938964844, -0.14668655395507812, -0.1401081085205078, -0.1335296630859375, -0.1269512176513672, -0.12037277221679688, -0.11379432678222656, -0.10721588134765625, -0.10063743591308594, -0.09405899047851562, -0.08748054504394531, -0.080902099609375, -0.07432365417480469, -0.06774520874023438, -0.06116676330566406, -0.05458831787109375, -0.04800987243652344, -0.041431427001953125, -0.03485298156738281, -0.0282745361328125, -0.021696090698242188, -0.015117645263671875, -0.008539199829101562, -0.00196075439453125, 0.0046176910400390625, 0.011196136474609375, 0.017774581909179688, 0.02435302734375, 0.030931472778320312, 0.037509918212890625, 0.04408836364746094, 0.05066680908203125, 0.05724525451660156, 0.06382369995117188, 0.07040214538574219, 0.0769805908203125, 0.08355903625488281, 0.09013748168945312, 0.09671592712402344, 0.10329437255859375, 0.10987281799316406, 0.11645126342773438, 0.12302970886230469, 0.129608154296875, 0.1361865997314453, 0.14276504516601562, 0.14934349060058594, 0.15592193603515625, 0.16250038146972656, 0.16907882690429688, 0.1756572723388672, 0.1822357177734375, 0.1888141632080078, 0.19539260864257812, 0.20197105407714844, 0.20854949951171875, 0.21512794494628906, 0.22170639038085938, 0.2282848358154297, 0.23486328125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 8.0, 8.0, 5.0, 10.0, 15.0, 14.0, 19.0, 19.0, 21.0, 28.0, 29.0, 26.0, 32.0, 30.0, 32.0, 41.0, 34.0, 34.0, 40.0, 35.0, 47.0, 50.0, 40.0, 35.0, 38.0, 38.0, 34.0, 32.0, 25.0, 23.0, 21.0, 22.0, 18.0, 14.0, 14.0, 12.0, 10.0, 12.0, 5.0, 8.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.11334228515625, -0.10999774932861328, -0.10665321350097656, -0.10330867767333984, -0.09996414184570312, -0.0966196060180664, -0.09327507019042969, -0.08993053436279297, -0.08658599853515625, -0.08324146270751953, -0.07989692687988281, -0.0765523910522461, -0.07320785522460938, -0.06986331939697266, -0.06651878356933594, -0.06317424774169922, -0.0598297119140625, -0.05648517608642578, -0.05314064025878906, -0.049796104431152344, -0.046451568603515625, -0.043107032775878906, -0.03976249694824219, -0.03641796112060547, -0.03307342529296875, -0.02972888946533203, -0.026384353637695312, -0.023039817810058594, -0.019695281982421875, -0.016350746154785156, -0.013006210327148438, -0.009661674499511719, -0.006317138671875, -0.0029726028442382812, 0.0003719329833984375, 0.0037164688110351562, 0.007061004638671875, 0.010405540466308594, 0.013750076293945312, 0.01709461212158203, 0.02043914794921875, 0.02378368377685547, 0.027128219604492188, 0.030472755432128906, 0.033817291259765625, 0.037161827087402344, 0.04050636291503906, 0.04385089874267578, 0.0471954345703125, 0.05053997039794922, 0.05388450622558594, 0.057229042053222656, 0.060573577880859375, 0.0639181137084961, 0.06726264953613281, 0.07060718536376953, 0.07395172119140625, 0.07729625701904297, 0.08064079284667969, 0.0839853286743164, 0.08732986450195312, 0.09067440032958984, 0.09401893615722656, 0.09736347198486328, 0.1007080078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 1.0, 8.0, 6.0, 10.0, 5.0, 9.0, 18.0, 19.0, 22.0, 38.0, 56.0, 68.0, 115.0, 183.0, 367.0, 714.0, 1416.0, 2800.0, 5973.0, 13690.0, 34569.0, 100199.0, 289230.0, 363839.0, 150874.0, 49814.0, 18970.0, 8077.0, 3691.0, 1737.0, 891.0, 407.0, 252.0, 153.0, 103.0, 61.0, 32.0, 40.0, 23.0, 20.0, 11.0, 10.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0], "bins": [-0.221923828125, -0.21543121337890625, -0.2089385986328125, -0.20244598388671875, -0.195953369140625, -0.18946075439453125, -0.1829681396484375, -0.17647552490234375, -0.16998291015625, -0.16349029541015625, -0.1569976806640625, -0.15050506591796875, -0.144012451171875, -0.13751983642578125, -0.1310272216796875, -0.12453460693359375, -0.1180419921875, -0.11154937744140625, -0.1050567626953125, -0.09856414794921875, -0.092071533203125, -0.08557891845703125, -0.0790863037109375, -0.07259368896484375, -0.06610107421875, -0.05960845947265625, -0.0531158447265625, -0.04662322998046875, -0.040130615234375, -0.03363800048828125, -0.0271453857421875, -0.02065277099609375, -0.01416015625, -0.00766754150390625, -0.0011749267578125, 0.00531768798828125, 0.011810302734375, 0.01830291748046875, 0.0247955322265625, 0.03128814697265625, 0.03778076171875, 0.04427337646484375, 0.0507659912109375, 0.05725860595703125, 0.063751220703125, 0.07024383544921875, 0.0767364501953125, 0.08322906494140625, 0.0897216796875, 0.09621429443359375, 0.1027069091796875, 0.10919952392578125, 0.115692138671875, 0.12218475341796875, 0.1286773681640625, 0.13516998291015625, 0.14166259765625, 0.14815521240234375, 0.1546478271484375, 0.16114044189453125, 0.167633056640625, 0.17412567138671875, 0.1806182861328125, 0.18711090087890625, 0.193603515625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 5.0, 6.0, 9.0, 11.0, 17.0, 19.0, 20.0, 14.0, 18.0, 28.0, 17.0, 35.0, 24.0, 38.0, 31.0, 39.0, 41.0, 39.0, 48.0, 48.0, 47.0, 45.0, 45.0, 36.0, 29.0, 33.0, 37.0, 38.0, 24.0, 26.0, 19.0, 15.0, 17.0, 15.0, 11.0, 10.0, 11.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.332275390625, -0.3213462829589844, -0.31041717529296875, -0.2994880676269531, -0.2885589599609375, -0.2776298522949219, -0.26670074462890625, -0.2557716369628906, -0.244842529296875, -0.23391342163085938, -0.22298431396484375, -0.21205520629882812, -0.2011260986328125, -0.19019699096679688, -0.17926788330078125, -0.16833877563476562, -0.15740966796875, -0.14648056030273438, -0.13555145263671875, -0.12462234497070312, -0.1136932373046875, -0.10276412963867188, -0.09183502197265625, -0.08090591430664062, -0.069976806640625, -0.059047698974609375, -0.04811859130859375, -0.037189483642578125, -0.0262603759765625, -0.015331268310546875, -0.00440216064453125, 0.006526947021484375, 0.0174560546875, 0.028385162353515625, 0.03931427001953125, 0.050243377685546875, 0.0611724853515625, 0.07210159301757812, 0.08303070068359375, 0.09395980834960938, 0.104888916015625, 0.11581802368164062, 0.12674713134765625, 0.13767623901367188, 0.1486053466796875, 0.15953445434570312, 0.17046356201171875, 0.18139266967773438, 0.19232177734375, 0.20325088500976562, 0.21417999267578125, 0.22510910034179688, 0.2360382080078125, 0.24696731567382812, 0.25789642333984375, 0.2688255310058594, 0.279754638671875, 0.2906837463378906, 0.30161285400390625, 0.3125419616699219, 0.3234710693359375, 0.3344001770019531, 0.34532928466796875, 0.3562583923339844, 0.3671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 4.0, 6.0, 10.0, 17.0, 31.0, 28.0, 49.0, 69.0, 112.0, 153.0, 251.0, 380.0, 609.0, 990.0, 1691.0, 2913.0, 5156.0, 9698.0, 19747.0, 42533.0, 105821.0, 248836.0, 313098.0, 169740.0, 66946.0, 29011.0, 13939.0, 7123.0, 3859.0, 2269.0, 1288.0, 770.0, 482.0, 340.0, 182.0, 133.0, 85.0, 61.0, 42.0, 27.0, 20.0, 15.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08721923828125, -0.08423805236816406, -0.08125686645507812, -0.07827568054199219, -0.07529449462890625, -0.07231330871582031, -0.06933212280273438, -0.06635093688964844, -0.0633697509765625, -0.06038856506347656, -0.057407379150390625, -0.05442619323730469, -0.05144500732421875, -0.04846382141113281, -0.045482635498046875, -0.04250144958496094, -0.039520263671875, -0.03653907775878906, -0.033557891845703125, -0.030576705932617188, -0.02759552001953125, -0.024614334106445312, -0.021633148193359375, -0.018651962280273438, -0.0156707763671875, -0.012689590454101562, -0.009708404541015625, -0.0067272186279296875, -0.00374603271484375, -0.0007648468017578125, 0.002216339111328125, 0.0051975250244140625, 0.0081787109375, 0.011159896850585938, 0.014141082763671875, 0.017122268676757812, 0.02010345458984375, 0.023084640502929688, 0.026065826416015625, 0.029047012329101562, 0.0320281982421875, 0.03500938415527344, 0.037990570068359375, 0.04097175598144531, 0.04395294189453125, 0.04693412780761719, 0.049915313720703125, 0.05289649963378906, 0.055877685546875, 0.05885887145996094, 0.061840057373046875, 0.06482124328613281, 0.06780242919921875, 0.07078361511230469, 0.07376480102539062, 0.07674598693847656, 0.0797271728515625, 0.08270835876464844, 0.08568954467773438, 0.08867073059082031, 0.09165191650390625, 0.09463310241699219, 0.09761428833007812, 0.10059547424316406, 0.10357666015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 5.0, 8.0, 7.0, 8.0, 12.0, 14.0, 15.0, 23.0, 26.0, 32.0, 45.0, 67.0, 79.0, 101.0, 95.0, 80.0, 92.0, 66.0, 55.0, 47.0, 29.0, 18.0, 16.0, 16.0, 14.0, 10.0, 3.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2007694244384766e-05, -3.097113221883774e-05, -2.993457019329071e-05, -2.8898008167743683e-05, -2.7861446142196655e-05, -2.6824884116649628e-05, -2.57883220911026e-05, -2.4751760065555573e-05, -2.3715198040008545e-05, -2.2678636014461517e-05, -2.164207398891449e-05, -2.0605511963367462e-05, -1.9568949937820435e-05, -1.8532387912273407e-05, -1.749582588672638e-05, -1.6459263861179352e-05, -1.5422701835632324e-05, -1.4386139810085297e-05, -1.3349577784538269e-05, -1.2313015758991241e-05, -1.1276453733444214e-05, -1.0239891707897186e-05, -9.203329682350159e-06, -8.166767656803131e-06, -7.1302056312561035e-06, -6.093643605709076e-06, -5.057081580162048e-06, -4.020519554615021e-06, -2.983957529067993e-06, -1.9473955035209656e-06, -9.10833477973938e-07, 1.257285475730896e-07, 1.1622905731201172e-06, 2.1988525986671448e-06, 3.2354146242141724e-06, 4.2719766497612e-06, 5.3085386753082275e-06, 6.345100700855255e-06, 7.381662726402283e-06, 8.41822475194931e-06, 9.454786777496338e-06, 1.0491348803043365e-05, 1.1527910828590393e-05, 1.256447285413742e-05, 1.3601034879684448e-05, 1.4637596905231476e-05, 1.5674158930778503e-05, 1.671072095632553e-05, 1.774728298187256e-05, 1.8783845007419586e-05, 1.9820407032966614e-05, 2.085696905851364e-05, 2.189353108406067e-05, 2.2930093109607697e-05, 2.3966655135154724e-05, 2.5003217160701752e-05, 2.603977918624878e-05, 2.7076341211795807e-05, 2.8112903237342834e-05, 2.9149465262889862e-05, 3.018602728843689e-05, 3.122258931398392e-05, 3.2259151339530945e-05, 3.329571336507797e-05, 3.4332275390625e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 10.0, 3.0, 7.0, 15.0, 12.0, 22.0, 46.0, 45.0, 90.0, 145.0, 221.0, 463.0, 957.0, 2070.0, 5231.0, 15889.0, 62432.0, 272084.0, 473282.0, 161614.0, 36565.0, 10544.0, 3721.0, 1533.0, 699.0, 350.0, 175.0, 96.0, 73.0, 45.0, 32.0, 23.0, 15.0, 15.0, 9.0, 6.0, 1.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1636962890625, -0.158782958984375, -0.15386962890625, -0.148956298828125, -0.14404296875, -0.139129638671875, -0.13421630859375, -0.129302978515625, -0.1243896484375, -0.119476318359375, -0.11456298828125, -0.109649658203125, -0.104736328125, -0.099822998046875, -0.09490966796875, -0.089996337890625, -0.0850830078125, -0.080169677734375, -0.07525634765625, -0.070343017578125, -0.0654296875, -0.060516357421875, -0.05560302734375, -0.050689697265625, -0.0457763671875, -0.040863037109375, -0.03594970703125, -0.031036376953125, -0.026123046875, -0.021209716796875, -0.01629638671875, -0.011383056640625, -0.0064697265625, -0.001556396484375, 0.00335693359375, 0.008270263671875, 0.01318359375, 0.018096923828125, 0.02301025390625, 0.027923583984375, 0.0328369140625, 0.037750244140625, 0.04266357421875, 0.047576904296875, 0.052490234375, 0.057403564453125, 0.06231689453125, 0.067230224609375, 0.0721435546875, 0.077056884765625, 0.08197021484375, 0.086883544921875, 0.091796875, 0.096710205078125, 0.10162353515625, 0.106536865234375, 0.1114501953125, 0.116363525390625, 0.12127685546875, 0.126190185546875, 0.131103515625, 0.136016845703125, 0.14093017578125, 0.145843505859375, 0.1507568359375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 11.0, 15.0, 24.0, 27.0, 30.0, 58.0, 66.0, 73.0, 79.0, 83.0, 98.0, 76.0, 84.0, 57.0, 45.0, 42.0, 35.0, 24.0, 21.0, 13.0, 12.0, 9.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10736083984375, -0.10355472564697266, -0.09974861145019531, -0.09594249725341797, -0.09213638305664062, -0.08833026885986328, -0.08452415466308594, -0.0807180404663086, -0.07691192626953125, -0.0731058120727539, -0.06929969787597656, -0.06549358367919922, -0.061687469482421875, -0.05788135528564453, -0.05407524108886719, -0.050269126892089844, -0.0464630126953125, -0.042656898498535156, -0.03885078430175781, -0.03504467010498047, -0.031238555908203125, -0.02743244171142578, -0.023626327514648438, -0.019820213317871094, -0.01601409912109375, -0.012207984924316406, -0.008401870727539062, -0.004595756530761719, -0.000789642333984375, 0.0030164718627929688, 0.0068225860595703125, 0.010628700256347656, 0.014434814453125, 0.018240928649902344, 0.022047042846679688, 0.02585315704345703, 0.029659271240234375, 0.03346538543701172, 0.03727149963378906, 0.041077613830566406, 0.04488372802734375, 0.048689842224121094, 0.05249595642089844, 0.05630207061767578, 0.060108184814453125, 0.06391429901123047, 0.06772041320800781, 0.07152652740478516, 0.0753326416015625, 0.07913875579833984, 0.08294486999511719, 0.08675098419189453, 0.09055709838867188, 0.09436321258544922, 0.09816932678222656, 0.1019754409790039, 0.10578155517578125, 0.1095876693725586, 0.11339378356933594, 0.11719989776611328, 0.12100601196289062, 0.12481212615966797, 0.1286182403564453, 0.13242435455322266, 0.13623046875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 7.0, 5.0, 46.0, 83.0, 219.0, 294.0, 217.0, 90.0, 31.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54978084564209, -2.4504687786102295, -2.351156711578369, -2.251844644546509, -2.1525325775146484, -2.053220510482788, -1.9539085626602173, -1.854596495628357, -1.7552844285964966, -1.6559723615646362, -1.5566602945327759, -1.457348346710205, -1.3580362796783447, -1.2587242126464844, -1.159412145614624, -1.0601000785827637, -0.9607880115509033, -0.861475944519043, -0.7621638774871826, -0.662851870059967, -0.5635398030281067, -0.46422773599624634, -0.36491572856903076, -0.2656036615371704, -0.16629159450531006, -0.0669795423746109, 0.03233250975608826, 0.13164454698562622, 0.23095661401748657, 0.3302686810493469, 0.4295806884765625, 0.5288927555084229, 0.6282048225402832, 0.7275168895721436, 0.8268289566040039, 0.9261409640312195, 1.0254530906677246, 1.124765157699585, 1.2240771055221558, 1.3233891725540161, 1.4227012395858765, 1.5220133066177368, 1.6213253736495972, 1.720637321472168, 1.8199493885040283, 1.9192614555358887, 2.018573522567749, 2.1178855895996094, 2.2171976566314697, 2.31650972366333, 2.4158217906951904, 2.515133857727051, 2.614445924758911, 2.7137579917907715, 2.8130698204040527, 2.912382125854492, 3.0116939544677734, 3.111006021499634, 3.210318088531494, 3.3096301555633545, 3.408942222595215, 3.508254289627075, 3.6075663566589355, 3.706878185272217, 3.8061904907226562]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 10.0, 11.0, 4.0, 9.0, 10.0, 11.0, 12.0, 9.0, 14.0, 25.0, 23.0, 30.0, 37.0, 31.0, 22.0, 27.0, 38.0, 44.0, 46.0, 48.0, 33.0, 47.0, 35.0, 39.0, 38.0, 39.0, 47.0, 31.0, 47.0, 27.0, 26.0, 22.0, 18.0, 17.0, 19.0, 12.0, 17.0, 7.0, 4.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0447423458099365, -1.011633038520813, -0.9785237312316895, -0.9454144239425659, -0.9123051166534424, -0.8791958093643188, -0.8460865020751953, -0.8129771947860718, -0.7798678874969482, -0.7467585802078247, -0.7136492729187012, -0.6805399656295776, -0.6474306583404541, -0.6143213510513306, -0.581212043762207, -0.5481027364730835, -0.5149933695793152, -0.48188406229019165, -0.4487747550010681, -0.4156654477119446, -0.38255614042282104, -0.3494468331336975, -0.3163374960422516, -0.28322818875312805, -0.2501188814640045, -0.21700957417488098, -0.18390026688575745, -0.15079094469547272, -0.11768163740634918, -0.08457233011722565, -0.05146300792694092, -0.018353700637817383, 0.014755606651306152, 0.047864917665719986, 0.08097422868013382, 0.11408354341983795, 0.1471928507089615, 0.18030215799808502, 0.21341148018836975, 0.2465207874774933, 0.2796300947666168, 0.31273940205574036, 0.3458487093448639, 0.3789580464363098, 0.41206735372543335, 0.4451766610145569, 0.4782859683036804, 0.511395275592804, 0.5445045828819275, 0.577613890171051, 0.6107231974601746, 0.6438325047492981, 0.6769418120384216, 0.7100511193275452, 0.7431604862213135, 0.776269793510437, 0.8093791007995605, 0.8424884080886841, 0.8755977153778076, 0.9087070226669312, 0.9418163299560547, 0.9749256372451782, 1.0080349445343018, 1.0411442518234253, 1.0742535591125488]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 7.0, 7.0, 6.0, 19.0, 26.0, 37.0, 57.0, 75.0, 126.0, 155.0, 243.0, 414.0, 632.0, 1102.0, 1906.0, 3405.0, 6059.0, 12171.0, 25611.0, 59881.0, 168293.0, 561408.0, 1645175.0, 1171028.0, 342896.0, 110917.0, 42948.0, 18865.0, 9161.0, 4734.0, 2697.0, 1614.0, 935.0, 554.0, 376.0, 253.0, 141.0, 120.0, 80.0, 44.0, 29.0, 26.0, 13.0, 15.0, 7.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.151123046875, -0.14637184143066406, -0.14162063598632812, -0.1368694305419922, -0.13211822509765625, -0.1273670196533203, -0.12261581420898438, -0.11786460876464844, -0.1131134033203125, -0.10836219787597656, -0.10361099243164062, -0.09885978698730469, -0.09410858154296875, -0.08935737609863281, -0.08460617065429688, -0.07985496520996094, -0.075103759765625, -0.07035255432128906, -0.06560134887695312, -0.06085014343261719, -0.05609893798828125, -0.05134773254394531, -0.046596527099609375, -0.04184532165527344, -0.0370941162109375, -0.03234291076660156, -0.027591705322265625, -0.022840499877929688, -0.01808929443359375, -0.013338088989257812, -0.008586883544921875, -0.0038356781005859375, 0.00091552734375, 0.0056667327880859375, 0.010417938232421875, 0.015169143676757812, 0.01992034912109375, 0.024671554565429688, 0.029422760009765625, 0.03417396545410156, 0.0389251708984375, 0.04367637634277344, 0.048427581787109375, 0.05317878723144531, 0.05792999267578125, 0.06268119812011719, 0.06743240356445312, 0.07218360900878906, 0.076934814453125, 0.08168601989746094, 0.08643722534179688, 0.09118843078613281, 0.09593963623046875, 0.10069084167480469, 0.10544204711914062, 0.11019325256347656, 0.1149444580078125, 0.11969566345214844, 0.12444686889648438, 0.1291980743408203, 0.13394927978515625, 0.1387004852294922, 0.14345169067382812, 0.14820289611816406, 0.1529541015625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 0.0, 2.0, 5.0, 6.0, 7.0, 10.0, 5.0, 16.0, 11.0, 19.0, 14.0, 21.0, 28.0, 30.0, 21.0, 36.0, 33.0, 40.0, 48.0, 25.0, 36.0, 29.0, 25.0, 25.0, 48.0, 39.0, 34.0, 40.0, 27.0, 29.0, 33.0, 33.0, 24.0, 29.0, 27.0, 26.0, 14.0, 15.0, 15.0, 13.0, 6.0, 11.0, 14.0, 7.0, 4.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.10687255859375, -0.10349082946777344, -0.10010910034179688, -0.09672737121582031, -0.09334564208984375, -0.08996391296386719, -0.08658218383789062, -0.08320045471191406, -0.0798187255859375, -0.07643699645996094, -0.07305526733398438, -0.06967353820800781, -0.06629180908203125, -0.06291007995605469, -0.059528350830078125, -0.05614662170410156, -0.052764892578125, -0.04938316345214844, -0.046001434326171875, -0.04261970520019531, -0.03923797607421875, -0.03585624694824219, -0.032474517822265625, -0.029092788696289062, -0.0257110595703125, -0.022329330444335938, -0.018947601318359375, -0.015565872192382812, -0.01218414306640625, -0.008802413940429688, -0.005420684814453125, -0.0020389556884765625, 0.0013427734375, 0.0047245025634765625, 0.008106231689453125, 0.011487960815429688, 0.01486968994140625, 0.018251419067382812, 0.021633148193359375, 0.025014877319335938, 0.0283966064453125, 0.03177833557128906, 0.035160064697265625, 0.03854179382324219, 0.04192352294921875, 0.04530525207519531, 0.048686981201171875, 0.05206871032714844, 0.055450439453125, 0.05883216857910156, 0.062213897705078125, 0.06559562683105469, 0.06897735595703125, 0.07235908508300781, 0.07574081420898438, 0.07912254333496094, 0.0825042724609375, 0.08588600158691406, 0.08926773071289062, 0.09264945983886719, 0.09603118896484375, 0.09941291809082031, 0.10279464721679688, 0.10617637634277344, 0.10955810546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 10.0, 12.0, 9.0, 14.0, 32.0, 41.0, 51.0, 58.0, 125.0, 193.0, 326.0, 510.0, 906.0, 1588.0, 3143.0, 6737.0, 15735.0, 42463.0, 127954.0, 498093.0, 2350521.0, 859084.0, 188616.0, 59205.0, 21441.0, 8840.0, 3929.0, 2014.0, 1056.0, 589.0, 373.0, 225.0, 122.0, 84.0, 59.0, 39.0, 22.0, 15.0, 11.0, 12.0, 9.0, 3.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.255615234375, -0.24802017211914062, -0.24042510986328125, -0.23283004760742188, -0.2252349853515625, -0.21763992309570312, -0.21004486083984375, -0.20244979858398438, -0.194854736328125, -0.18725967407226562, -0.17966461181640625, -0.17206954956054688, -0.1644744873046875, -0.15687942504882812, -0.14928436279296875, -0.14168930053710938, -0.13409423828125, -0.12649917602539062, -0.11890411376953125, -0.11130905151367188, -0.1037139892578125, -0.09611892700195312, -0.08852386474609375, -0.08092880249023438, -0.073333740234375, -0.06573867797851562, -0.05814361572265625, -0.050548553466796875, -0.0429534912109375, -0.035358428955078125, -0.02776336669921875, -0.020168304443359375, -0.0125732421875, -0.004978179931640625, 0.00261688232421875, 0.010211944580078125, 0.0178070068359375, 0.025402069091796875, 0.03299713134765625, 0.040592193603515625, 0.048187255859375, 0.055782318115234375, 0.06337738037109375, 0.07097244262695312, 0.0785675048828125, 0.08616256713867188, 0.09375762939453125, 0.10135269165039062, 0.10894775390625, 0.11654281616210938, 0.12413787841796875, 0.13173294067382812, 0.1393280029296875, 0.14692306518554688, 0.15451812744140625, 0.16211318969726562, 0.169708251953125, 0.17730331420898438, 0.18489837646484375, 0.19249343872070312, 0.2000885009765625, 0.20768356323242188, 0.21527862548828125, 0.22287368774414062, 0.23046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 8.0, 4.0, 7.0, 6.0, 5.0, 11.0, 16.0, 20.0, 28.0, 33.0, 50.0, 63.0, 88.0, 144.0, 144.0, 218.0, 349.0, 574.0, 638.0, 519.0, 336.0, 218.0, 125.0, 117.0, 75.0, 78.0, 42.0, 35.0, 21.0, 22.0, 23.0, 13.0, 12.0, 6.0, 9.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2122802734375, -0.2048015594482422, -0.19732284545898438, -0.18984413146972656, -0.18236541748046875, -0.17488670349121094, -0.16740798950195312, -0.1599292755126953, -0.1524505615234375, -0.1449718475341797, -0.13749313354492188, -0.13001441955566406, -0.12253570556640625, -0.11505699157714844, -0.10757827758789062, -0.10009956359863281, -0.092620849609375, -0.08514213562011719, -0.07766342163085938, -0.07018470764160156, -0.06270599365234375, -0.05522727966308594, -0.047748565673828125, -0.04026985168457031, -0.0327911376953125, -0.025312423706054688, -0.017833709716796875, -0.010354995727539062, -0.00287628173828125, 0.0046024322509765625, 0.012081146240234375, 0.019559860229492188, 0.02703857421875, 0.03451728820800781, 0.041996002197265625, 0.04947471618652344, 0.05695343017578125, 0.06443214416503906, 0.07191085815429688, 0.07938957214355469, 0.0868682861328125, 0.09434700012207031, 0.10182571411132812, 0.10930442810058594, 0.11678314208984375, 0.12426185607910156, 0.13174057006835938, 0.1392192840576172, 0.146697998046875, 0.1541767120361328, 0.16165542602539062, 0.16913414001464844, 0.17661285400390625, 0.18409156799316406, 0.19157028198242188, 0.1990489959716797, 0.2065277099609375, 0.2140064239501953, 0.22148513793945312, 0.22896385192871094, 0.23644256591796875, 0.24392127990722656, 0.2513999938964844, 0.2588787078857422, 0.266357421875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 15.0, 40.0, 77.0, 136.0, 216.0, 220.0, 145.0, 86.0, 27.0, 17.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9351539611816406, -1.843516230583191, -1.7518786191940308, -1.660240888595581, -1.568603277206421, -1.4769655466079712, -1.3853278160095215, -1.2936902046203613, -1.2020524740219116, -1.110414743423462, -1.0187771320343018, -0.927139401435852, -0.8355017304420471, -0.7438640594482422, -0.6522263288497925, -0.5605886578559875, -0.4689509868621826, -0.3773133158683777, -0.28567561507225037, -0.19403791427612305, -0.10240024328231812, -0.010762572288513184, 0.08087515830993652, 0.17251282930374146, 0.2641505002975464, 0.3557881712913513, 0.44742587208747864, 0.539063572883606, 0.6307012438774109, 0.7223389148712158, 0.8139766454696655, 0.9056143164634705, 0.9972517490386963, 1.088889479637146, 1.1805270910263062, 1.2721648216247559, 1.363802433013916, 1.4554401636123657, 1.5470778942108154, 1.6387155055999756, 1.7303532361984253, 1.821990966796875, 1.9136285781860352, 2.0052661895751953, 2.0969040393829346, 2.1885416507720947, 2.280179500579834, 2.371817111968994, 2.4634547233581543, 2.5550923347473145, 2.6467301845550537, 2.738367795944214, 2.830005407333374, 2.9216432571411133, 3.0132808685302734, 3.1049184799194336, 3.1965560913085938, 3.288193702697754, 3.379831552505493, 3.4714691638946533, 3.5631067752838135, 3.6547446250915527, 3.746382236480713, 3.838019847869873, 3.9296576976776123]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 5.0, 10.0, 18.0, 13.0, 13.0, 17.0, 13.0, 20.0, 28.0, 26.0, 24.0, 38.0, 29.0, 36.0, 36.0, 38.0, 40.0, 46.0, 35.0, 36.0, 51.0, 33.0, 43.0, 31.0, 40.0, 45.0, 27.0, 26.0, 18.0, 19.0, 30.0, 23.0, 19.0, 13.0, 16.0, 10.0, 6.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7087762355804443, -0.6855018138885498, -0.6622273325920105, -0.638952910900116, -0.6156784296035767, -0.5924040079116821, -0.5691295862197876, -0.5458551645278931, -0.5225806832313538, -0.49930623173713684, -0.4760317802429199, -0.4527573585510254, -0.42948290705680847, -0.40620845556259155, -0.382934033870697, -0.3596595823764801, -0.3363851308822632, -0.31311067938804626, -0.28983622789382935, -0.2665618062019348, -0.2432873547077179, -0.22001290321350098, -0.19673846662044525, -0.17346403002738953, -0.1501895785331726, -0.1269151270389557, -0.10364069044589996, -0.08036624640226364, -0.05709180235862732, -0.033817358314991, -0.010542914271354675, 0.01273152232170105, 0.036006033420562744, 0.059280477464199066, 0.08255492150783539, 0.10582936555147171, 0.12910380959510803, 0.15237826108932495, 0.17565269768238068, 0.1989271342754364, 0.22220158576965332, 0.24547603726387024, 0.26875048875808716, 0.2920249104499817, 0.3152993619441986, 0.3385738134384155, 0.36184823513031006, 0.385122686624527, 0.4083971381187439, 0.4316715896129608, 0.45494604110717773, 0.47822046279907227, 0.5014948844909668, 0.5247693657875061, 0.5480437874794006, 0.5713182687759399, 0.5945926904678345, 0.617867112159729, 0.6411415934562683, 0.6644160151481628, 0.6876904964447021, 0.7109649181365967, 0.7342393398284912, 0.7575137615203857, 0.780788242816925]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [6.0, 4.0, 6.0, 8.0, 7.0, 15.0, 17.0, 22.0, 29.0, 37.0, 49.0, 74.0, 121.0, 150.0, 242.0, 392.0, 626.0, 998.0, 1516.0, 2644.0, 4042.0, 6486.0, 11175.0, 20089.0, 41241.0, 98000.0, 235214.0, 316420.0, 170772.0, 68274.0, 30710.0, 15573.0, 9018.0, 5472.0, 3365.0, 2059.0, 1305.0, 841.0, 526.0, 336.0, 238.0, 142.0, 101.0, 82.0, 37.0, 24.0, 19.0, 13.0, 7.0, 8.0, 3.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.173828125, -0.16746139526367188, -0.16109466552734375, -0.15472793579101562, -0.1483612060546875, -0.14199447631835938, -0.13562774658203125, -0.12926101684570312, -0.122894287109375, -0.11652755737304688, -0.11016082763671875, -0.10379409790039062, -0.0974273681640625, -0.09106063842773438, -0.08469390869140625, -0.07832717895507812, -0.07196044921875, -0.06559371948242188, -0.05922698974609375, -0.052860260009765625, -0.0464935302734375, -0.040126800537109375, -0.03376007080078125, -0.027393341064453125, -0.021026611328125, -0.014659881591796875, -0.00829315185546875, -0.001926422119140625, 0.0044403076171875, 0.010807037353515625, 0.01717376708984375, 0.023540496826171875, 0.0299072265625, 0.036273956298828125, 0.04264068603515625, 0.049007415771484375, 0.0553741455078125, 0.061740875244140625, 0.06810760498046875, 0.07447433471679688, 0.080841064453125, 0.08720779418945312, 0.09357452392578125, 0.09994125366210938, 0.1063079833984375, 0.11267471313476562, 0.11904144287109375, 0.12540817260742188, 0.13177490234375, 0.13814163208007812, 0.14450836181640625, 0.15087509155273438, 0.1572418212890625, 0.16360855102539062, 0.16997528076171875, 0.17634201049804688, 0.182708740234375, 0.18907546997070312, 0.19544219970703125, 0.20180892944335938, 0.2081756591796875, 0.21454238891601562, 0.22090911865234375, 0.22727584838867188, 0.233642578125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 7.0, 9.0, 8.0, 7.0, 11.0, 9.0, 7.0, 19.0, 12.0, 22.0, 25.0, 38.0, 24.0, 36.0, 43.0, 41.0, 31.0, 44.0, 50.0, 45.0, 30.0, 39.0, 42.0, 41.0, 34.0, 38.0, 31.0, 26.0, 25.0, 28.0, 31.0, 20.0, 19.0, 15.0, 20.0, 17.0, 13.0, 9.0, 5.0, 6.0, 6.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10803604125976562, -0.10425567626953125, -0.10047531127929688, -0.0966949462890625, -0.09291458129882812, -0.08913421630859375, -0.08535385131835938, -0.081573486328125, -0.07779312133789062, -0.07401275634765625, -0.07023239135742188, -0.0664520263671875, -0.06267166137695312, -0.05889129638671875, -0.055110931396484375, -0.05133056640625, -0.047550201416015625, -0.04376983642578125, -0.039989471435546875, -0.0362091064453125, -0.032428741455078125, -0.02864837646484375, -0.024868011474609375, -0.021087646484375, -0.017307281494140625, -0.01352691650390625, -0.009746551513671875, -0.0059661865234375, -0.002185821533203125, 0.00159454345703125, 0.005374908447265625, 0.0091552734375, 0.012935638427734375, 0.01671600341796875, 0.020496368408203125, 0.0242767333984375, 0.028057098388671875, 0.03183746337890625, 0.035617828369140625, 0.039398193359375, 0.043178558349609375, 0.04695892333984375, 0.050739288330078125, 0.0545196533203125, 0.058300018310546875, 0.06208038330078125, 0.06586074829101562, 0.06964111328125, 0.07342147827148438, 0.07720184326171875, 0.08098220825195312, 0.0847625732421875, 0.08854293823242188, 0.09232330322265625, 0.09610366821289062, 0.099884033203125, 0.10366439819335938, 0.10744476318359375, 0.11122512817382812, 0.1150054931640625, 0.11878585815429688, 0.12256622314453125, 0.12634658813476562, 0.130126953125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 9.0, 6.0, 8.0, 18.0, 20.0, 32.0, 34.0, 85.0, 100.0, 169.0, 315.0, 505.0, 873.0, 1472.0, 2646.0, 4759.0, 8584.0, 16537.0, 35460.0, 91169.0, 256810.0, 365545.0, 156814.0, 55834.0, 24133.0, 11838.0, 6406.0, 3486.0, 2001.0, 1166.0, 742.0, 390.0, 216.0, 139.0, 76.0, 67.0, 35.0, 22.0, 18.0, 9.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2064208984375, -0.19936561584472656, -0.19231033325195312, -0.1852550506591797, -0.17819976806640625, -0.1711444854736328, -0.16408920288085938, -0.15703392028808594, -0.1499786376953125, -0.14292335510253906, -0.13586807250976562, -0.1288127899169922, -0.12175750732421875, -0.11470222473144531, -0.10764694213867188, -0.10059165954589844, -0.093536376953125, -0.08648109436035156, -0.07942581176757812, -0.07237052917480469, -0.06531524658203125, -0.05825996398925781, -0.051204681396484375, -0.04414939880371094, -0.0370941162109375, -0.030038833618164062, -0.022983551025390625, -0.015928268432617188, -0.00887298583984375, -0.0018177032470703125, 0.005237579345703125, 0.012292861938476562, 0.01934814453125, 0.026403427124023438, 0.033458709716796875, 0.04051399230957031, 0.04756927490234375, 0.05462455749511719, 0.061679840087890625, 0.06873512268066406, 0.0757904052734375, 0.08284568786621094, 0.08990097045898438, 0.09695625305175781, 0.10401153564453125, 0.11106681823730469, 0.11812210083007812, 0.12517738342285156, 0.132232666015625, 0.13928794860839844, 0.14634323120117188, 0.1533985137939453, 0.16045379638671875, 0.1675090789794922, 0.17456436157226562, 0.18161964416503906, 0.1886749267578125, 0.19573020935058594, 0.20278549194335938, 0.2098407745361328, 0.21689605712890625, 0.2239513397216797, 0.23100662231445312, 0.23806190490722656, 0.2451171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 7.0, 11.0, 5.0, 11.0, 10.0, 16.0, 15.0, 15.0, 11.0, 31.0, 29.0, 25.0, 24.0, 34.0, 37.0, 43.0, 44.0, 30.0, 32.0, 48.0, 37.0, 31.0, 41.0, 36.0, 45.0, 35.0, 23.0, 33.0, 24.0, 38.0, 21.0, 20.0, 28.0, 25.0, 16.0, 13.0, 11.0, 7.0, 6.0, 6.0, 10.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3681640625, -0.3568687438964844, -0.34557342529296875, -0.3342781066894531, -0.3229827880859375, -0.3116874694824219, -0.30039215087890625, -0.2890968322753906, -0.277801513671875, -0.2665061950683594, -0.25521087646484375, -0.24391555786132812, -0.2326202392578125, -0.22132492065429688, -0.21002960205078125, -0.19873428344726562, -0.18743896484375, -0.17614364624023438, -0.16484832763671875, -0.15355300903320312, -0.1422576904296875, -0.13096237182617188, -0.11966705322265625, -0.10837173461914062, -0.097076416015625, -0.08578109741210938, -0.07448577880859375, -0.06319046020507812, -0.0518951416015625, -0.040599822998046875, -0.02930450439453125, -0.018009185791015625, -0.0067138671875, 0.004581451416015625, 0.01587677001953125, 0.027172088623046875, 0.0384674072265625, 0.049762725830078125, 0.06105804443359375, 0.07235336303710938, 0.083648681640625, 0.09494400024414062, 0.10623931884765625, 0.11753463745117188, 0.1288299560546875, 0.14012527465820312, 0.15142059326171875, 0.16271591186523438, 0.17401123046875, 0.18530654907226562, 0.19660186767578125, 0.20789718627929688, 0.2191925048828125, 0.23048782348632812, 0.24178314208984375, 0.2530784606933594, 0.264373779296875, 0.2756690979003906, 0.28696441650390625, 0.2982597351074219, 0.3095550537109375, 0.3208503723144531, 0.33214569091796875, 0.3434410095214844, 0.354736328125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 9.0, 20.0, 21.0, 35.0, 50.0, 76.0, 121.0, 204.0, 310.0, 518.0, 770.0, 1280.0, 2088.0, 3292.0, 5203.0, 8742.0, 15240.0, 27687.0, 53368.0, 111598.0, 239228.0, 286354.0, 145021.0, 67845.0, 34086.0, 18446.0, 10596.0, 6211.0, 3813.0, 2391.0, 1435.0, 916.0, 519.0, 387.0, 241.0, 143.0, 97.0, 60.0, 46.0, 21.0, 29.0, 6.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07891845703125, -0.07630252838134766, -0.07368659973144531, -0.07107067108154297, -0.06845474243164062, -0.06583881378173828, -0.06322288513183594, -0.060606956481933594, -0.05799102783203125, -0.055375099182128906, -0.05275917053222656, -0.05014324188232422, -0.047527313232421875, -0.04491138458251953, -0.04229545593261719, -0.039679527282714844, -0.0370635986328125, -0.034447669982910156, -0.03183174133300781, -0.02921581268310547, -0.026599884033203125, -0.02398395538330078, -0.021368026733398438, -0.018752098083496094, -0.01613616943359375, -0.013520240783691406, -0.010904312133789062, -0.008288383483886719, -0.005672454833984375, -0.0030565261840820312, -0.0004405975341796875, 0.0021753311157226562, 0.004791259765625, 0.007407188415527344, 0.010023117065429688, 0.012639045715332031, 0.015254974365234375, 0.01787090301513672, 0.020486831665039062, 0.023102760314941406, 0.02571868896484375, 0.028334617614746094, 0.030950546264648438, 0.03356647491455078, 0.036182403564453125, 0.03879833221435547, 0.04141426086425781, 0.044030189514160156, 0.0466461181640625, 0.049262046813964844, 0.05187797546386719, 0.05449390411376953, 0.057109832763671875, 0.05972576141357422, 0.06234169006347656, 0.0649576187133789, 0.06757354736328125, 0.0701894760131836, 0.07280540466308594, 0.07542133331298828, 0.07803726196289062, 0.08065319061279297, 0.08326911926269531, 0.08588504791259766, 0.0885009765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 8.0, 8.0, 9.0, 17.0, 22.0, 31.0, 39.0, 73.0, 96.0, 140.0, 173.0, 113.0, 88.0, 52.0, 44.0, 19.0, 16.0, 10.0, 7.0, 5.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9485435485839844e-05, -5.7931989431381226e-05, -5.637854337692261e-05, -5.482509732246399e-05, -5.327165126800537e-05, -5.171820521354675e-05, -5.0164759159088135e-05, -4.8611313104629517e-05, -4.70578670501709e-05, -4.550442099571228e-05, -4.395097494125366e-05, -4.2397528886795044e-05, -4.0844082832336426e-05, -3.929063677787781e-05, -3.773719072341919e-05, -3.618374466896057e-05, -3.463029861450195e-05, -3.3076852560043335e-05, -3.152340650558472e-05, -2.99699604511261e-05, -2.841651439666748e-05, -2.6863068342208862e-05, -2.5309622287750244e-05, -2.3756176233291626e-05, -2.2202730178833008e-05, -2.064928412437439e-05, -1.909583806991577e-05, -1.7542392015457153e-05, -1.5988945960998535e-05, -1.4435499906539917e-05, -1.2882053852081299e-05, -1.132860779762268e-05, -9.775161743164062e-06, -8.221715688705444e-06, -6.668269634246826e-06, -5.114823579788208e-06, -3.56137752532959e-06, -2.0079314708709717e-06, -4.544854164123535e-07, 1.0989606380462646e-06, 2.652406692504883e-06, 4.205852746963501e-06, 5.759298801422119e-06, 7.312744855880737e-06, 8.866190910339355e-06, 1.0419636964797974e-05, 1.1973083019256592e-05, 1.352652907371521e-05, 1.5079975128173828e-05, 1.6633421182632446e-05, 1.8186867237091064e-05, 1.9740313291549683e-05, 2.12937593460083e-05, 2.284720540046692e-05, 2.4400651454925537e-05, 2.5954097509384155e-05, 2.7507543563842773e-05, 2.906098961830139e-05, 3.061443567276001e-05, 3.216788172721863e-05, 3.3721327781677246e-05, 3.5274773836135864e-05, 3.682821989059448e-05, 3.83816659450531e-05, 3.993511199951172e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 4.0, 9.0, 7.0, 7.0, 20.0, 26.0, 43.0, 90.0, 114.0, 214.0, 420.0, 692.0, 1209.0, 2325.0, 4537.0, 8966.0, 17981.0, 37808.0, 84291.0, 189541.0, 313722.0, 210119.0, 94044.0, 41927.0, 20141.0, 9893.0, 4932.0, 2384.0, 1323.0, 723.0, 419.0, 251.0, 137.0, 96.0, 54.0, 36.0, 20.0, 12.0, 8.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09173583984375, -0.08882999420166016, -0.08592414855957031, -0.08301830291748047, -0.08011245727539062, -0.07720661163330078, -0.07430076599121094, -0.0713949203491211, -0.06848907470703125, -0.0655832290649414, -0.06267738342285156, -0.05977153778076172, -0.056865692138671875, -0.05395984649658203, -0.05105400085449219, -0.048148155212402344, -0.0452423095703125, -0.042336463928222656, -0.03943061828613281, -0.03652477264404297, -0.033618927001953125, -0.03071308135986328, -0.027807235717773438, -0.024901390075683594, -0.02199554443359375, -0.019089698791503906, -0.016183853149414062, -0.013278007507324219, -0.010372161865234375, -0.007466316223144531, -0.0045604705810546875, -0.0016546249389648438, 0.001251220703125, 0.004157066345214844, 0.0070629119873046875, 0.009968757629394531, 0.012874603271484375, 0.01578044891357422, 0.018686294555664062, 0.021592140197753906, 0.02449798583984375, 0.027403831481933594, 0.030309677124023438, 0.03321552276611328, 0.036121368408203125, 0.03902721405029297, 0.04193305969238281, 0.044838905334472656, 0.0477447509765625, 0.050650596618652344, 0.05355644226074219, 0.05646228790283203, 0.059368133544921875, 0.06227397918701172, 0.06517982482910156, 0.0680856704711914, 0.07099151611328125, 0.0738973617553711, 0.07680320739746094, 0.07970905303955078, 0.08261489868164062, 0.08552074432373047, 0.08842658996582031, 0.09133243560791016, 0.09423828125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 9.0, 7.0, 7.0, 13.0, 21.0, 22.0, 21.0, 25.0, 52.0, 43.0, 57.0, 65.0, 72.0, 59.0, 84.0, 77.0, 69.0, 51.0, 43.0, 46.0, 24.0, 14.0, 23.0, 16.0, 11.0, 11.0, 10.0, 8.0, 6.0, 2.0, 6.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0947265625, -0.09180831909179688, -0.08889007568359375, -0.08597183227539062, -0.0830535888671875, -0.08013534545898438, -0.07721710205078125, -0.07429885864257812, -0.071380615234375, -0.06846237182617188, -0.06554412841796875, -0.06262588500976562, -0.0597076416015625, -0.056789398193359375, -0.05387115478515625, -0.050952911376953125, -0.04803466796875, -0.045116424560546875, -0.04219818115234375, -0.039279937744140625, -0.0363616943359375, -0.033443450927734375, -0.03052520751953125, -0.027606964111328125, -0.024688720703125, -0.021770477294921875, -0.01885223388671875, -0.015933990478515625, -0.0130157470703125, -0.010097503662109375, -0.00717926025390625, -0.004261016845703125, -0.0013427734375, 0.001575469970703125, 0.00449371337890625, 0.007411956787109375, 0.0103302001953125, 0.013248443603515625, 0.01616668701171875, 0.019084930419921875, 0.022003173828125, 0.024921417236328125, 0.02783966064453125, 0.030757904052734375, 0.0336761474609375, 0.036594390869140625, 0.03951263427734375, 0.042430877685546875, 0.04534912109375, 0.048267364501953125, 0.05118560791015625, 0.054103851318359375, 0.0570220947265625, 0.059940338134765625, 0.06285858154296875, 0.06577682495117188, 0.068695068359375, 0.07161331176757812, 0.07453155517578125, 0.07744979858398438, 0.0803680419921875, 0.08328628540039062, 0.08620452880859375, 0.08912277221679688, 0.092041015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 10.0, 21.0, 56.0, 109.0, 196.0, 232.0, 182.0, 104.0, 47.0, 22.0, 14.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9997341632843018, -1.9105379581451416, -1.821341633796692, -1.7321454286575317, -1.6429492235183716, -1.5537528991699219, -1.4645566940307617, -1.3753604888916016, -1.2861642837524414, -1.1969680786132812, -1.1077717542648315, -1.0185755491256714, -0.9293793439865112, -0.8401830792427063, -0.7509868144989014, -0.6617906093597412, -0.5725942850112915, -0.48339805006980896, -0.3942018151283264, -0.3050055503845215, -0.21580931544303894, -0.1266130805015564, -0.037416815757751465, 0.05177938938140869, 0.14097565412521362, 0.23017188906669617, 0.3193681240081787, 0.40856438875198364, 0.4977606236934662, 0.5869568586349487, 0.6761531233787537, 0.7653493285179138, 0.8545455932617188, 0.9437418580055237, 1.0329381227493286, 1.1221343278884888, 1.211330533027649, 1.3005268573760986, 1.3897230625152588, 1.478919267654419, 1.568115472793579, 1.6573116779327393, 1.746508002281189, 1.8357042074203491, 1.9249004125595093, 2.014096736907959, 2.103292942047119, 2.1924891471862793, 2.2816853523254395, 2.3708815574645996, 2.4600777626037598, 2.54927396774292, 2.638470411300659, 2.7276666164398193, 2.8168628215789795, 2.9060590267181396, 2.995255470275879, 3.084451675415039, 3.173647880554199, 3.2628440856933594, 3.3520405292510986, 3.441236734390259, 3.530432939529419, 3.619629144668579, 3.7088253498077393]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 3.0, 5.0, 3.0, 15.0, 14.0, 13.0, 17.0, 17.0, 15.0, 23.0, 18.0, 19.0, 16.0, 36.0, 38.0, 39.0, 40.0, 38.0, 49.0, 43.0, 41.0, 43.0, 39.0, 42.0, 29.0, 34.0, 23.0, 37.0, 34.0, 29.0, 26.0, 19.0, 21.0, 15.0, 20.0, 12.0, 11.0, 8.0, 9.0, 10.0, 9.0, 6.0, 4.0, 1.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8899648785591125, -0.8600038886070251, -0.8300428986549377, -0.8000819683074951, -0.7701209783554077, -0.7401599884033203, -0.7101989984512329, -0.6802380084991455, -0.6502770185470581, -0.6203160285949707, -0.5903550386428833, -0.5603940486907959, -0.5304331183433533, -0.5004721283912659, -0.47051113843917847, -0.44055014848709106, -0.41058921813964844, -0.38062822818756104, -0.350667268037796, -0.3207062780857086, -0.2907453179359436, -0.2607843279838562, -0.2308233380317688, -0.2008623629808426, -0.17090138792991638, -0.14094041287899017, -0.11097943037748337, -0.08101844787597656, -0.051057472825050354, -0.021096497774124146, 0.008864492177963257, 0.038825467228889465, 0.0687863826751709, 0.0987473577260971, 0.12870833277702332, 0.15866932272911072, 0.18863029778003693, 0.21859127283096313, 0.24855226278305054, 0.27851325273513794, 0.30847421288490295, 0.33843520283699036, 0.36839616298675537, 0.3983571529388428, 0.4283181428909302, 0.4582791030406952, 0.4882400929927826, 0.5182010531425476, 0.548162043094635, 0.5781230330467224, 0.6080840229988098, 0.6380449533462524, 0.6680059432983398, 0.6979669332504272, 0.7279279232025146, 0.757888913154602, 0.7878499031066895, 0.8178108930587769, 0.8477718830108643, 0.8777328729629517, 0.9076938033103943, 0.9376547932624817, 0.9676157832145691, 0.9975767731666565, 1.0275377035140991]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 10.0, 13.0, 31.0, 39.0, 67.0, 75.0, 149.0, 208.0, 297.0, 505.0, 896.0, 1621.0, 2754.0, 5177.0, 10201.0, 21413.0, 50204.0, 141039.0, 448517.0, 1302496.0, 1429389.0, 517370.0, 158095.0, 56176.0, 23698.0, 11018.0, 5659.0, 2943.0, 1693.0, 1015.0, 554.0, 320.0, 224.0, 135.0, 84.0, 62.0, 44.0, 22.0, 16.0, 16.0, 12.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17919921875, -0.1740875244140625, -0.168975830078125, -0.1638641357421875, -0.15875244140625, -0.1536407470703125, -0.148529052734375, -0.1434173583984375, -0.1383056640625, -0.1331939697265625, -0.128082275390625, -0.1229705810546875, -0.11785888671875, -0.1127471923828125, -0.107635498046875, -0.1025238037109375, -0.097412109375, -0.0923004150390625, -0.087188720703125, -0.0820770263671875, -0.07696533203125, -0.0718536376953125, -0.066741943359375, -0.0616302490234375, -0.0565185546875, -0.0514068603515625, -0.046295166015625, -0.0411834716796875, -0.03607177734375, -0.0309600830078125, -0.025848388671875, -0.0207366943359375, -0.015625, -0.0105133056640625, -0.005401611328125, -0.0002899169921875, 0.00482177734375, 0.0099334716796875, 0.015045166015625, 0.0201568603515625, 0.0252685546875, 0.0303802490234375, 0.035491943359375, 0.0406036376953125, 0.04571533203125, 0.0508270263671875, 0.055938720703125, 0.0610504150390625, 0.066162109375, 0.0712738037109375, 0.076385498046875, 0.0814971923828125, 0.08660888671875, 0.0917205810546875, 0.096832275390625, 0.1019439697265625, 0.1070556640625, 0.1121673583984375, 0.117279052734375, 0.1223907470703125, 0.12750244140625, 0.1326141357421875, 0.137725830078125, 0.1428375244140625, 0.14794921875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 7.0, 10.0, 4.0, 10.0, 8.0, 18.0, 15.0, 23.0, 21.0, 14.0, 30.0, 27.0, 33.0, 31.0, 24.0, 30.0, 33.0, 38.0, 43.0, 34.0, 34.0, 38.0, 52.0, 33.0, 39.0, 38.0, 36.0, 28.0, 19.0, 28.0, 18.0, 26.0, 16.0, 23.0, 16.0, 12.0, 16.0, 10.0, 11.0, 9.0, 7.0, 3.0, 4.0, 7.0, 6.0, 2.0, 2.0, 2.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.10467529296875, -0.1010751724243164, -0.09747505187988281, -0.09387493133544922, -0.09027481079101562, -0.08667469024658203, -0.08307456970214844, -0.07947444915771484, -0.07587432861328125, -0.07227420806884766, -0.06867408752441406, -0.06507396697998047, -0.061473846435546875, -0.05787372589111328, -0.05427360534667969, -0.050673484802246094, -0.0470733642578125, -0.043473243713378906, -0.03987312316894531, -0.03627300262451172, -0.032672882080078125, -0.02907276153564453, -0.025472640991210938, -0.021872520446777344, -0.01827239990234375, -0.014672279357910156, -0.011072158813476562, -0.007472038269042969, -0.003871917724609375, -0.00027179718017578125, 0.0033283233642578125, 0.006928443908691406, 0.010528564453125, 0.014128684997558594, 0.017728805541992188, 0.02132892608642578, 0.024929046630859375, 0.02852916717529297, 0.03212928771972656, 0.035729408264160156, 0.03932952880859375, 0.042929649353027344, 0.04652976989746094, 0.05012989044189453, 0.053730010986328125, 0.05733013153076172, 0.06093025207519531, 0.0645303726196289, 0.0681304931640625, 0.0717306137084961, 0.07533073425292969, 0.07893085479736328, 0.08253097534179688, 0.08613109588623047, 0.08973121643066406, 0.09333133697509766, 0.09693145751953125, 0.10053157806396484, 0.10413169860839844, 0.10773181915283203, 0.11133193969726562, 0.11493206024169922, 0.11853218078613281, 0.1221323013305664, 0.125732421875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 5.0, 12.0, 15.0, 18.0, 32.0, 48.0, 76.0, 126.0, 184.0, 326.0, 531.0, 959.0, 1851.0, 3554.0, 7400.0, 16528.0, 41195.0, 117068.0, 403512.0, 1752621.0, 1378506.0, 313233.0, 94668.0, 34321.0, 14238.0, 6543.0, 3002.0, 1592.0, 872.0, 449.0, 271.0, 217.0, 99.0, 70.0, 40.0, 33.0, 21.0, 13.0, 6.0, 3.0, 7.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.26318359375, -0.25585365295410156, -0.24852371215820312, -0.2411937713623047, -0.23386383056640625, -0.2265338897705078, -0.21920394897460938, -0.21187400817871094, -0.2045440673828125, -0.19721412658691406, -0.18988418579101562, -0.1825542449951172, -0.17522430419921875, -0.1678943634033203, -0.16056442260742188, -0.15323448181152344, -0.145904541015625, -0.13857460021972656, -0.13124465942382812, -0.12391471862792969, -0.11658477783203125, -0.10925483703613281, -0.10192489624023438, -0.09459495544433594, -0.0872650146484375, -0.07993507385253906, -0.07260513305664062, -0.06527519226074219, -0.05794525146484375, -0.05061531066894531, -0.043285369873046875, -0.03595542907714844, -0.02862548828125, -0.021295547485351562, -0.013965606689453125, -0.0066356658935546875, 0.00069427490234375, 0.008024215698242188, 0.015354156494140625, 0.022684097290039062, 0.0300140380859375, 0.03734397888183594, 0.044673919677734375, 0.05200386047363281, 0.05933380126953125, 0.06666374206542969, 0.07399368286132812, 0.08132362365722656, 0.088653564453125, 0.09598350524902344, 0.10331344604492188, 0.11064338684082031, 0.11797332763671875, 0.1253032684326172, 0.13263320922851562, 0.13996315002441406, 0.1472930908203125, 0.15462303161621094, 0.16195297241210938, 0.1692829132080078, 0.17661285400390625, 0.1839427947998047, 0.19127273559570312, 0.19860267639160156, 0.2059326171875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 12.0, 8.0, 14.0, 14.0, 17.0, 29.0, 37.0, 47.0, 80.0, 73.0, 101.0, 142.0, 241.0, 345.0, 425.0, 569.0, 524.0, 392.0, 252.0, 180.0, 155.0, 98.0, 93.0, 54.0, 40.0, 27.0, 22.0, 19.0, 12.0, 12.0, 7.0, 11.0, 7.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27197265625, -0.2639045715332031, -0.25583648681640625, -0.24776840209960938, -0.2397003173828125, -0.23163223266601562, -0.22356414794921875, -0.21549606323242188, -0.207427978515625, -0.19935989379882812, -0.19129180908203125, -0.18322372436523438, -0.1751556396484375, -0.16708755493164062, -0.15901947021484375, -0.15095138549804688, -0.14288330078125, -0.13481521606445312, -0.12674713134765625, -0.11867904663085938, -0.1106109619140625, -0.10254287719726562, -0.09447479248046875, -0.08640670776367188, -0.078338623046875, -0.07027053833007812, -0.06220245361328125, -0.054134368896484375, -0.0460662841796875, -0.037998199462890625, -0.02993011474609375, -0.021862030029296875, -0.0137939453125, -0.005725860595703125, 0.00234222412109375, 0.010410308837890625, 0.0184783935546875, 0.026546478271484375, 0.03461456298828125, 0.042682647705078125, 0.050750732421875, 0.058818817138671875, 0.06688690185546875, 0.07495498657226562, 0.0830230712890625, 0.09109115600585938, 0.09915924072265625, 0.10722732543945312, 0.11529541015625, 0.12336349487304688, 0.13143157958984375, 0.13949966430664062, 0.1475677490234375, 0.15563583374023438, 0.16370391845703125, 0.17177200317382812, 0.179840087890625, 0.18790817260742188, 0.19597625732421875, 0.20404434204101562, 0.2121124267578125, 0.22018051147460938, 0.22824859619140625, 0.23631668090820312, 0.244384765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 10.0, 31.0, 41.0, 56.0, 113.0, 133.0, 141.0, 142.0, 113.0, 88.0, 50.0, 29.0, 22.0, 8.0, 7.0, 5.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4277150630950928, -1.3595829010009766, -1.2914507389068604, -1.2233184576034546, -1.1551862955093384, -1.0870541334152222, -1.0189218521118164, -0.9507896900177002, -0.882657527923584, -0.8145253658294678, -0.7463931441307068, -0.6782609224319458, -0.6101287603378296, -0.5419965982437134, -0.4738643765449524, -0.4057321846485138, -0.3375999927520752, -0.2694678008556366, -0.201335608959198, -0.1332034170627594, -0.0650712251663208, 0.003060966730117798, 0.0711931586265564, 0.139325350522995, 0.2074575424194336, 0.2755897343158722, 0.3437219262123108, 0.4118541181087494, 0.479986310005188, 0.5481184720993042, 0.6162506937980652, 0.6843829154968262, 0.7525148391723633, 0.8206470012664795, 0.8887792229652405, 0.9569114446640015, 1.0250436067581177, 1.0931757688522339, 1.1613080501556396, 1.2294402122497559, 1.297572374343872, 1.3657045364379883, 1.4338366985321045, 1.5019689798355103, 1.5701011419296265, 1.6382333040237427, 1.7063655853271484, 1.7744977474212646, 1.8426299095153809, 1.910762071609497, 1.9788942337036133, 2.0470263957977295, 2.1151585578918457, 2.183290958404541, 2.2514231204986572, 2.3195552825927734, 2.3876874446868896, 2.455819606781006, 2.523951768875122, 2.5920839309692383, 2.6602163314819336, 2.72834849357605, 2.796480655670166, 2.8646128177642822, 2.9327449798583984]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 5.0, 10.0, 16.0, 10.0, 18.0, 14.0, 19.0, 29.0, 23.0, 42.0, 33.0, 44.0, 46.0, 38.0, 37.0, 59.0, 55.0, 35.0, 61.0, 49.0, 53.0, 45.0, 32.0, 33.0, 30.0, 30.0, 28.0, 14.0, 16.0, 21.0, 12.0, 7.0, 13.0, 6.0, 6.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9705355167388916, -0.9403336048126221, -0.9101316928863525, -0.879929780960083, -0.8497278690338135, -0.819525957107544, -0.7893240451812744, -0.7591221332550049, -0.7289202213287354, -0.6987183094024658, -0.6685163974761963, -0.6383144855499268, -0.6081125736236572, -0.5779106616973877, -0.5477087497711182, -0.5175068378448486, -0.4873049855232239, -0.45710307359695435, -0.4269011616706848, -0.3966992497444153, -0.36649733781814575, -0.3362954258918762, -0.3060935437679291, -0.27589163184165955, -0.24568971991539001, -0.21548780798912048, -0.18528589606285095, -0.15508399903774261, -0.12488208711147308, -0.09468017518520355, -0.06447827816009521, -0.034276366233825684, -0.004074513912200928, 0.026127394288778305, 0.05632930248975754, 0.08653120696544647, 0.116733118891716, 0.14693503081798553, 0.17713692784309387, 0.2073388397693634, 0.23754075169563293, 0.26774266362190247, 0.297944575548172, 0.32814645767211914, 0.35834836959838867, 0.3885502815246582, 0.41875219345092773, 0.44895410537719727, 0.4791560173034668, 0.5093579292297363, 0.5395598411560059, 0.5697617530822754, 0.5999636650085449, 0.6301655769348145, 0.660367488861084, 0.6905694007873535, 0.720771312713623, 0.7509732246398926, 0.7811751365661621, 0.8113770484924316, 0.8415789604187012, 0.8717808723449707, 0.9019827842712402, 0.9321846961975098, 0.9623865485191345]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 11.0, 8.0, 18.0, 38.0, 52.0, 72.0, 107.0, 155.0, 250.0, 398.0, 594.0, 890.0, 1422.0, 2120.0, 3183.0, 5032.0, 7715.0, 12612.0, 21934.0, 44803.0, 105271.0, 227525.0, 286036.0, 174180.0, 74869.0, 33019.0, 17464.0, 10076.0, 6435.0, 4364.0, 2657.0, 1860.0, 1202.0, 754.0, 469.0, 321.0, 203.0, 142.0, 95.0, 70.0, 48.0, 31.0, 19.0, 10.0, 7.0, 6.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.249267578125, -0.242401123046875, -0.23553466796875, -0.228668212890625, -0.2218017578125, -0.214935302734375, -0.20806884765625, -0.201202392578125, -0.1943359375, -0.187469482421875, -0.18060302734375, -0.173736572265625, -0.1668701171875, -0.160003662109375, -0.15313720703125, -0.146270751953125, -0.139404296875, -0.132537841796875, -0.12567138671875, -0.118804931640625, -0.1119384765625, -0.105072021484375, -0.09820556640625, -0.091339111328125, -0.08447265625, -0.077606201171875, -0.07073974609375, -0.063873291015625, -0.0570068359375, -0.050140380859375, -0.04327392578125, -0.036407470703125, -0.029541015625, -0.022674560546875, -0.01580810546875, -0.008941650390625, -0.0020751953125, 0.004791259765625, 0.01165771484375, 0.018524169921875, 0.025390625, 0.032257080078125, 0.03912353515625, 0.045989990234375, 0.0528564453125, 0.059722900390625, 0.06658935546875, 0.073455810546875, 0.080322265625, 0.087188720703125, 0.09405517578125, 0.100921630859375, 0.1077880859375, 0.114654541015625, 0.12152099609375, 0.128387451171875, 0.13525390625, 0.142120361328125, 0.14898681640625, 0.155853271484375, 0.1627197265625, 0.169586181640625, 0.17645263671875, 0.183319091796875, 0.190185546875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 14.0, 8.0, 18.0, 13.0, 23.0, 25.0, 31.0, 27.0, 32.0, 33.0, 36.0, 33.0, 39.0, 40.0, 39.0, 23.0, 49.0, 39.0, 42.0, 34.0, 48.0, 35.0, 41.0, 36.0, 32.0, 37.0, 27.0, 19.0, 20.0, 12.0, 16.0, 20.0, 8.0, 3.0, 10.0, 9.0, 1.0, 1.0, 7.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.1435546875, -0.13928604125976562, -0.13501739501953125, -0.13074874877929688, -0.1264801025390625, -0.12221145629882812, -0.11794281005859375, -0.11367416381835938, -0.109405517578125, -0.10513687133789062, -0.10086822509765625, -0.09659957885742188, -0.0923309326171875, -0.08806228637695312, -0.08379364013671875, -0.07952499389648438, -0.07525634765625, -0.07098770141601562, -0.06671905517578125, -0.062450408935546875, -0.0581817626953125, -0.053913116455078125, -0.04964447021484375, -0.045375823974609375, -0.041107177734375, -0.036838531494140625, -0.03256988525390625, -0.028301239013671875, -0.0240325927734375, -0.019763946533203125, -0.01549530029296875, -0.011226654052734375, -0.0069580078125, -0.002689361572265625, 0.00157928466796875, 0.005847930908203125, 0.0101165771484375, 0.014385223388671875, 0.01865386962890625, 0.022922515869140625, 0.027191162109375, 0.031459808349609375, 0.03572845458984375, 0.039997100830078125, 0.0442657470703125, 0.048534393310546875, 0.05280303955078125, 0.057071685791015625, 0.06134033203125, 0.06560897827148438, 0.06987762451171875, 0.07414627075195312, 0.0784149169921875, 0.08268356323242188, 0.08695220947265625, 0.09122085571289062, 0.095489501953125, 0.09975814819335938, 0.10402679443359375, 0.10829544067382812, 0.1125640869140625, 0.11683273315429688, 0.12110137939453125, 0.12537002563476562, 0.129638671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 12.0, 8.0, 14.0, 19.0, 18.0, 36.0, 54.0, 65.0, 127.0, 188.0, 336.0, 571.0, 1068.0, 2012.0, 4037.0, 8185.0, 17782.0, 44981.0, 152980.0, 432599.0, 263194.0, 72080.0, 25589.0, 11310.0, 5393.0, 2696.0, 1404.0, 731.0, 392.0, 228.0, 135.0, 98.0, 62.0, 47.0, 35.0, 18.0, 10.0, 13.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33203125, -0.3218803405761719, -0.31172943115234375, -0.3015785217285156, -0.2914276123046875, -0.2812767028808594, -0.27112579345703125, -0.2609748840332031, -0.250823974609375, -0.24067306518554688, -0.23052215576171875, -0.22037124633789062, -0.2102203369140625, -0.20006942749023438, -0.18991851806640625, -0.17976760864257812, -0.16961669921875, -0.15946578979492188, -0.14931488037109375, -0.13916397094726562, -0.1290130615234375, -0.11886215209960938, -0.10871124267578125, -0.09856033325195312, -0.088409423828125, -0.07825851440429688, -0.06810760498046875, -0.057956695556640625, -0.0478057861328125, -0.037654876708984375, -0.02750396728515625, -0.017353057861328125, -0.0072021484375, 0.002948760986328125, 0.01309967041015625, 0.023250579833984375, 0.0334014892578125, 0.043552398681640625, 0.05370330810546875, 0.06385421752929688, 0.074005126953125, 0.08415603637695312, 0.09430694580078125, 0.10445785522460938, 0.1146087646484375, 0.12475967407226562, 0.13491058349609375, 0.14506149291992188, 0.15521240234375, 0.16536331176757812, 0.17551422119140625, 0.18566513061523438, 0.1958160400390625, 0.20596694946289062, 0.21611785888671875, 0.22626876831054688, 0.236419677734375, 0.24657058715820312, 0.25672149658203125, 0.2668724060058594, 0.2770233154296875, 0.2871742248535156, 0.29732513427734375, 0.3074760437011719, 0.317626953125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 8.0, 7.0, 5.0, 8.0, 17.0, 23.0, 26.0, 14.0, 25.0, 18.0, 26.0, 33.0, 25.0, 37.0, 36.0, 50.0, 37.0, 40.0, 44.0, 51.0, 39.0, 42.0, 43.0, 47.0, 28.0, 46.0, 38.0, 34.0, 24.0, 26.0, 14.0, 10.0, 14.0, 13.0, 15.0, 12.0, 9.0, 3.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.372802734375, -0.3598594665527344, -0.34691619873046875, -0.3339729309082031, -0.3210296630859375, -0.3080863952636719, -0.29514312744140625, -0.2821998596191406, -0.269256591796875, -0.2563133239746094, -0.24337005615234375, -0.23042678833007812, -0.2174835205078125, -0.20454025268554688, -0.19159698486328125, -0.17865371704101562, -0.16571044921875, -0.15276718139648438, -0.13982391357421875, -0.12688064575195312, -0.1139373779296875, -0.10099411010742188, -0.08805084228515625, -0.07510757446289062, -0.062164306640625, -0.049221038818359375, -0.03627777099609375, -0.023334503173828125, -0.0103912353515625, 0.002552032470703125, 0.01549530029296875, 0.028438568115234375, 0.0413818359375, 0.054325103759765625, 0.06726837158203125, 0.08021163940429688, 0.0931549072265625, 0.10609817504882812, 0.11904144287109375, 0.13198471069335938, 0.144927978515625, 0.15787124633789062, 0.17081451416015625, 0.18375778198242188, 0.1967010498046875, 0.20964431762695312, 0.22258758544921875, 0.23553085327148438, 0.24847412109375, 0.2614173889160156, 0.27436065673828125, 0.2873039245605469, 0.3002471923828125, 0.3131904602050781, 0.32613372802734375, 0.3390769958496094, 0.352020263671875, 0.3649635314941406, 0.37790679931640625, 0.3908500671386719, 0.4037933349609375, 0.4167366027832031, 0.42967987060546875, 0.4426231384277344, 0.45556640625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 6.0, 10.0, 16.0, 27.0, 41.0, 56.0, 86.0, 112.0, 188.0, 312.0, 458.0, 715.0, 1085.0, 1794.0, 3108.0, 4847.0, 8308.0, 13968.0, 25165.0, 50383.0, 114535.0, 255049.0, 290354.0, 145635.0, 61611.0, 29986.0, 16544.0, 9225.0, 5677.0, 3508.0, 2113.0, 1305.0, 869.0, 510.0, 341.0, 202.0, 143.0, 77.0, 69.0, 44.0, 27.0, 14.0, 13.0, 11.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08489990234375, -0.08188247680664062, -0.07886505126953125, -0.07584762573242188, -0.0728302001953125, -0.06981277465820312, -0.06679534912109375, -0.06377792358398438, -0.060760498046875, -0.057743072509765625, -0.05472564697265625, -0.051708221435546875, -0.0486907958984375, -0.045673370361328125, -0.04265594482421875, -0.039638519287109375, -0.03662109375, -0.033603668212890625, -0.03058624267578125, -0.027568817138671875, -0.0245513916015625, -0.021533966064453125, -0.01851654052734375, -0.015499114990234375, -0.012481689453125, -0.009464263916015625, -0.00644683837890625, -0.003429412841796875, -0.0004119873046875, 0.002605438232421875, 0.00562286376953125, 0.008640289306640625, 0.01165771484375, 0.014675140380859375, 0.01769256591796875, 0.020709991455078125, 0.0237274169921875, 0.026744842529296875, 0.02976226806640625, 0.032779693603515625, 0.035797119140625, 0.038814544677734375, 0.04183197021484375, 0.044849395751953125, 0.0478668212890625, 0.050884246826171875, 0.05390167236328125, 0.056919097900390625, 0.0599365234375, 0.06295394897460938, 0.06597137451171875, 0.06898880004882812, 0.0720062255859375, 0.07502365112304688, 0.07804107666015625, 0.08105850219726562, 0.084075927734375, 0.08709335327148438, 0.09011077880859375, 0.09312820434570312, 0.0961456298828125, 0.09916305541992188, 0.10218048095703125, 0.10519790649414062, 0.10821533203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 6.0, 5.0, 11.0, 6.0, 12.0, 7.0, 17.0, 22.0, 22.0, 32.0, 58.0, 88.0, 98.0, 114.0, 116.0, 112.0, 89.0, 47.0, 33.0, 27.0, 14.0, 11.0, 11.0, 9.0, 1.0, 1.0, 3.0, 8.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.363059997558594e-05, -4.22624871134758e-05, -4.089437425136566e-05, -3.9526261389255524e-05, -3.8158148527145386e-05, -3.679003566503525e-05, -3.542192280292511e-05, -3.405380994081497e-05, -3.2685697078704834e-05, -3.1317584216594696e-05, -2.9949471354484558e-05, -2.858135849237442e-05, -2.7213245630264282e-05, -2.5845132768154144e-05, -2.4477019906044006e-05, -2.310890704393387e-05, -2.174079418182373e-05, -2.0372681319713593e-05, -1.9004568457603455e-05, -1.7636455595493317e-05, -1.626834273338318e-05, -1.490022987127304e-05, -1.3532117009162903e-05, -1.2164004147052765e-05, -1.0795891284942627e-05, -9.427778422832489e-06, -8.059665560722351e-06, -6.691552698612213e-06, -5.323439836502075e-06, -3.955326974391937e-06, -2.5872141122817993e-06, -1.2191012501716614e-06, 1.4901161193847656e-07, 1.5171244740486145e-06, 2.8852373361587524e-06, 4.25335019826889e-06, 5.621463060379028e-06, 6.989575922489166e-06, 8.357688784599304e-06, 9.725801646709442e-06, 1.109391450881958e-05, 1.2462027370929718e-05, 1.3830140233039856e-05, 1.5198253095149994e-05, 1.6566365957260132e-05, 1.793447881937027e-05, 1.9302591681480408e-05, 2.0670704543590546e-05, 2.2038817405700684e-05, 2.340693026781082e-05, 2.477504312992096e-05, 2.6143155992031097e-05, 2.7511268854141235e-05, 2.8879381716251373e-05, 3.024749457836151e-05, 3.161560744047165e-05, 3.298372030258179e-05, 3.4351833164691925e-05, 3.571994602680206e-05, 3.70880588889122e-05, 3.845617175102234e-05, 3.982428461313248e-05, 4.1192397475242615e-05, 4.256051033735275e-05, 4.392862319946289e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 19.0, 15.0, 25.0, 37.0, 62.0, 96.0, 162.0, 219.0, 390.0, 638.0, 1159.0, 2158.0, 3989.0, 7767.0, 15436.0, 33418.0, 77897.0, 181751.0, 300047.0, 232286.0, 105623.0, 44380.0, 20271.0, 9765.0, 4917.0, 2647.0, 1380.0, 769.0, 459.0, 234.0, 177.0, 104.0, 82.0, 62.0, 34.0, 17.0, 15.0, 16.0, 11.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.088134765625, -0.08506107330322266, -0.08198738098144531, -0.07891368865966797, -0.07583999633789062, -0.07276630401611328, -0.06969261169433594, -0.0666189193725586, -0.06354522705078125, -0.060471534729003906, -0.05739784240722656, -0.05432415008544922, -0.051250457763671875, -0.04817676544189453, -0.04510307312011719, -0.042029380798339844, -0.0389556884765625, -0.035881996154785156, -0.03280830383300781, -0.02973461151123047, -0.026660919189453125, -0.02358722686767578, -0.020513534545898438, -0.017439842224121094, -0.01436614990234375, -0.011292457580566406, -0.008218765258789062, -0.005145072937011719, -0.002071380615234375, 0.0010023117065429688, 0.0040760040283203125, 0.007149696350097656, 0.010223388671875, 0.013297080993652344, 0.016370773315429688, 0.01944446563720703, 0.022518157958984375, 0.02559185028076172, 0.028665542602539062, 0.031739234924316406, 0.03481292724609375, 0.037886619567871094, 0.04096031188964844, 0.04403400421142578, 0.047107696533203125, 0.05018138885498047, 0.05325508117675781, 0.056328773498535156, 0.0594024658203125, 0.062476158142089844, 0.06554985046386719, 0.06862354278564453, 0.07169723510742188, 0.07477092742919922, 0.07784461975097656, 0.0809183120727539, 0.08399200439453125, 0.0870656967163086, 0.09013938903808594, 0.09321308135986328, 0.09628677368164062, 0.09936046600341797, 0.10243415832519531, 0.10550785064697266, 0.10858154296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 11.0, 4.0, 4.0, 5.0, 6.0, 5.0, 12.0, 10.0, 27.0, 24.0, 38.0, 61.0, 76.0, 72.0, 81.0, 82.0, 88.0, 79.0, 73.0, 43.0, 51.0, 39.0, 28.0, 22.0, 22.0, 9.0, 8.0, 8.0, 3.0, 1.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1160888671875, -0.11194229125976562, -0.10779571533203125, -0.10364913940429688, -0.0995025634765625, -0.09535598754882812, -0.09120941162109375, -0.08706283569335938, -0.082916259765625, -0.07876968383789062, -0.07462310791015625, -0.07047653198242188, -0.0663299560546875, -0.062183380126953125, -0.05803680419921875, -0.053890228271484375, -0.04974365234375, -0.045597076416015625, -0.04145050048828125, -0.037303924560546875, -0.0331573486328125, -0.029010772705078125, -0.02486419677734375, -0.020717620849609375, -0.016571044921875, -0.012424468994140625, -0.00827789306640625, -0.004131317138671875, 1.52587890625e-05, 0.004161834716796875, 0.00830841064453125, 0.012454986572265625, 0.0166015625, 0.020748138427734375, 0.02489471435546875, 0.029041290283203125, 0.0331878662109375, 0.037334442138671875, 0.04148101806640625, 0.045627593994140625, 0.049774169921875, 0.053920745849609375, 0.05806732177734375, 0.062213897705078125, 0.0663604736328125, 0.07050704956054688, 0.07465362548828125, 0.07880020141601562, 0.08294677734375, 0.08709335327148438, 0.09123992919921875, 0.09538650512695312, 0.0995330810546875, 0.10367965698242188, 0.10782623291015625, 0.11197280883789062, 0.116119384765625, 0.12026596069335938, 0.12441253662109375, 0.12855911254882812, 0.1327056884765625, 0.13685226440429688, 0.14099884033203125, 0.14514541625976562, 0.1492919921875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 10.0, 21.0, 60.0, 95.0, 140.0, 178.0, 158.0, 127.0, 94.0, 50.0, 26.0, 12.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564347267150879, -2.4867753982543945, -2.4092037677764893, -2.331631898880005, -2.2540602684020996, -2.1764883995056152, -2.09891676902771, -2.0213449001312256, -1.9437732696533203, -1.8662015199661255, -1.7886297702789307, -1.7110580205917358, -1.633486270904541, -1.5559145212173462, -1.4783427715301514, -1.400770902633667, -1.3231991529464722, -1.2456274032592773, -1.1680556535720825, -1.0904839038848877, -1.0129121541976929, -0.935340404510498, -0.8577685952186584, -0.7801968455314636, -0.7026250958442688, -0.625053346157074, -0.5474815964698792, -0.46990981698036194, -0.3923380672931671, -0.3147663176059723, -0.23719453811645508, -0.15962278842926025, -0.08205103874206543, -0.0044792816042900085, 0.07309247553348541, 0.15066424012184143, 0.22823598980903625, 0.3058077394962311, 0.3833795189857483, 0.4609512686729431, 0.5385230183601379, 0.6160947680473328, 0.6936665177345276, 0.7712383270263672, 0.848810076713562, 0.9263818264007568, 1.0039535760879517, 1.0815253257751465, 1.1590970754623413, 1.2366688251495361, 1.314240574836731, 1.3918123245239258, 1.4693840742111206, 1.5469558238983154, 1.6245276927947998, 1.702099323272705, 1.7796711921691895, 1.8572429418563843, 1.934814691543579, 2.0123865604400635, 2.0899581909179688, 2.167530059814453, 2.2451016902923584, 2.3226735591888428, 2.400245189666748]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 5.0, 4.0, 7.0, 4.0, 10.0, 12.0, 7.0, 15.0, 15.0, 22.0, 18.0, 20.0, 22.0, 22.0, 36.0, 26.0, 37.0, 40.0, 42.0, 42.0, 38.0, 36.0, 44.0, 42.0, 42.0, 38.0, 51.0, 43.0, 29.0, 29.0, 24.0, 23.0, 18.0, 17.0, 18.0, 19.0, 18.0, 10.0, 16.0, 6.0, 10.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.9375360012054443, -0.9086465239524841, -0.8797570466995239, -0.8508675694465637, -0.8219780921936035, -0.7930886149406433, -0.7641991376876831, -0.7353096604347229, -0.7064201831817627, -0.6775307059288025, -0.6486412286758423, -0.6197517514228821, -0.5908622741699219, -0.5619727969169617, -0.5330833196640015, -0.5041938424110413, -0.47530439496040344, -0.44641491770744324, -0.41752544045448303, -0.3886359632015228, -0.3597464859485626, -0.3308570384979248, -0.3019675612449646, -0.2730780839920044, -0.244188591837883, -0.2152991145849228, -0.18640963733196259, -0.15752017498016357, -0.12863069772720337, -0.09974122047424316, -0.07085174322128296, -0.041962265968322754, -0.013072788715362549, 0.015816686674952507, 0.04470616206526756, 0.07359563559293747, 0.10248511284589767, 0.13137458264827728, 0.1602640599012375, 0.1891535371541977, 0.2180430144071579, 0.2469324916601181, 0.2758219540119171, 0.3047114312648773, 0.3336009085178375, 0.36249038577079773, 0.39137986302375793, 0.42026934027671814, 0.44915881752967834, 0.47804829478263855, 0.5069377422332764, 0.5358272194862366, 0.5647166967391968, 0.593606173992157, 0.6224956512451172, 0.6513851284980774, 0.6802746057510376, 0.7091640830039978, 0.738053560256958, 0.7669430375099182, 0.7958325147628784, 0.8247219920158386, 0.8536114692687988, 0.882500946521759, 0.9113904237747192]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 14.0, 20.0, 18.0, 41.0, 70.0, 109.0, 160.0, 273.0, 402.0, 690.0, 1205.0, 2125.0, 4196.0, 7872.0, 16487.0, 38407.0, 101424.0, 308674.0, 922567.0, 1552585.0, 817554.0, 266972.0, 88309.0, 33670.0, 14746.0, 7095.0, 3649.0, 2035.0, 1121.0, 686.0, 405.0, 237.0, 176.0, 118.0, 59.0, 39.0, 22.0, 15.0, 10.0, 7.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1773681640625, -0.17189788818359375, -0.1664276123046875, -0.16095733642578125, -0.155487060546875, -0.15001678466796875, -0.1445465087890625, -0.13907623291015625, -0.13360595703125, -0.12813568115234375, -0.1226654052734375, -0.11719512939453125, -0.111724853515625, -0.10625457763671875, -0.1007843017578125, -0.09531402587890625, -0.08984375, -0.08437347412109375, -0.0789031982421875, -0.07343292236328125, -0.067962646484375, -0.06249237060546875, -0.0570220947265625, -0.05155181884765625, -0.04608154296875, -0.04061126708984375, -0.0351409912109375, -0.02967071533203125, -0.024200439453125, -0.01873016357421875, -0.0132598876953125, -0.00778961181640625, -0.0023193359375, 0.00315093994140625, 0.0086212158203125, 0.01409149169921875, 0.019561767578125, 0.02503204345703125, 0.0305023193359375, 0.03597259521484375, 0.04144287109375, 0.04691314697265625, 0.0523834228515625, 0.05785369873046875, 0.063323974609375, 0.06879425048828125, 0.0742645263671875, 0.07973480224609375, 0.085205078125, 0.09067535400390625, 0.0961456298828125, 0.10161590576171875, 0.107086181640625, 0.11255645751953125, 0.1180267333984375, 0.12349700927734375, 0.12896728515625, 0.13443756103515625, 0.1399078369140625, 0.14537811279296875, 0.150848388671875, 0.15631866455078125, 0.1617889404296875, 0.16725921630859375, 0.1727294921875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 7.0, 11.0, 20.0, 24.0, 14.0, 30.0, 23.0, 31.0, 35.0, 31.0, 36.0, 37.0, 38.0, 44.0, 47.0, 56.0, 41.0, 40.0, 50.0, 34.0, 39.0, 55.0, 37.0, 33.0, 24.0, 28.0, 25.0, 21.0, 17.0, 14.0, 9.0, 10.0, 10.0, 8.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16064453125, -0.1556987762451172, -0.15075302124023438, -0.14580726623535156, -0.14086151123046875, -0.13591575622558594, -0.13097000122070312, -0.1260242462158203, -0.1210784912109375, -0.11613273620605469, -0.11118698120117188, -0.10624122619628906, -0.10129547119140625, -0.09634971618652344, -0.09140396118164062, -0.08645820617675781, -0.081512451171875, -0.07656669616699219, -0.07162094116210938, -0.06667518615722656, -0.06172943115234375, -0.05678367614746094, -0.051837921142578125, -0.04689216613769531, -0.0419464111328125, -0.03700065612792969, -0.032054901123046875, -0.027109146118164062, -0.02216339111328125, -0.017217636108398438, -0.012271881103515625, -0.0073261260986328125, -0.00238037109375, 0.0025653839111328125, 0.007511138916015625, 0.012456893920898438, 0.01740264892578125, 0.022348403930664062, 0.027294158935546875, 0.03223991394042969, 0.0371856689453125, 0.04213142395019531, 0.047077178955078125, 0.05202293395996094, 0.05696868896484375, 0.06191444396972656, 0.06686019897460938, 0.07180595397949219, 0.076751708984375, 0.08169746398925781, 0.08664321899414062, 0.09158897399902344, 0.09653472900390625, 0.10148048400878906, 0.10642623901367188, 0.11137199401855469, 0.1163177490234375, 0.12126350402832031, 0.12620925903320312, 0.13115501403808594, 0.13610076904296875, 0.14104652404785156, 0.14599227905273438, 0.1509380340576172, 0.1558837890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 9.0, 13.0, 15.0, 26.0, 31.0, 45.0, 85.0, 125.0, 136.0, 214.0, 365.0, 592.0, 1066.0, 1730.0, 3070.0, 5774.0, 11148.0, 23266.0, 50718.0, 124187.0, 354849.0, 1246666.0, 1608895.0, 482625.0, 158908.0, 62736.0, 28079.0, 13247.0, 6831.0, 3664.0, 2032.0, 1160.0, 702.0, 409.0, 303.0, 179.0, 116.0, 79.0, 57.0, 39.0, 25.0, 18.0, 10.0, 12.0, 8.0, 3.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 4.0], "bins": [-0.21337890625, -0.2069377899169922, -0.20049667358398438, -0.19405555725097656, -0.18761444091796875, -0.18117332458496094, -0.17473220825195312, -0.1682910919189453, -0.1618499755859375, -0.1554088592529297, -0.14896774291992188, -0.14252662658691406, -0.13608551025390625, -0.12964439392089844, -0.12320327758789062, -0.11676216125488281, -0.110321044921875, -0.10387992858886719, -0.09743881225585938, -0.09099769592285156, -0.08455657958984375, -0.07811546325683594, -0.07167434692382812, -0.06523323059082031, -0.0587921142578125, -0.05235099792480469, -0.045909881591796875, -0.03946876525878906, -0.03302764892578125, -0.026586532592773438, -0.020145416259765625, -0.013704299926757812, -0.00726318359375, -0.0008220672607421875, 0.005619049072265625, 0.012060165405273438, 0.01850128173828125, 0.024942398071289062, 0.031383514404296875, 0.03782463073730469, 0.0442657470703125, 0.05070686340332031, 0.057147979736328125, 0.06358909606933594, 0.07003021240234375, 0.07647132873535156, 0.08291244506835938, 0.08935356140136719, 0.095794677734375, 0.10223579406738281, 0.10867691040039062, 0.11511802673339844, 0.12155914306640625, 0.12800025939941406, 0.13444137573242188, 0.1408824920654297, 0.1473236083984375, 0.1537647247314453, 0.16020584106445312, 0.16664695739746094, 0.17308807373046875, 0.17952919006347656, 0.18597030639648438, 0.1924114227294922, 0.1988525390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 6.0, 5.0, 5.0, 12.0, 9.0, 18.0, 18.0, 24.0, 28.0, 32.0, 47.0, 65.0, 76.0, 98.0, 138.0, 173.0, 246.0, 327.0, 452.0, 464.0, 465.0, 328.0, 250.0, 192.0, 133.0, 111.0, 74.0, 63.0, 52.0, 35.0, 27.0, 15.0, 20.0, 13.0, 15.0, 14.0, 3.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.260009765625, -0.25225067138671875, -0.2444915771484375, -0.23673248291015625, -0.228973388671875, -0.22121429443359375, -0.2134552001953125, -0.20569610595703125, -0.19793701171875, -0.19017791748046875, -0.1824188232421875, -0.17465972900390625, -0.166900634765625, -0.15914154052734375, -0.1513824462890625, -0.14362335205078125, -0.1358642578125, -0.12810516357421875, -0.1203460693359375, -0.11258697509765625, -0.104827880859375, -0.09706878662109375, -0.0893096923828125, -0.08155059814453125, -0.07379150390625, -0.06603240966796875, -0.0582733154296875, -0.05051422119140625, -0.042755126953125, -0.03499603271484375, -0.0272369384765625, -0.01947784423828125, -0.01171875, -0.00395965576171875, 0.0037994384765625, 0.01155853271484375, 0.019317626953125, 0.02707672119140625, 0.0348358154296875, 0.04259490966796875, 0.05035400390625, 0.05811309814453125, 0.0658721923828125, 0.07363128662109375, 0.081390380859375, 0.08914947509765625, 0.0969085693359375, 0.10466766357421875, 0.1124267578125, 0.12018585205078125, 0.1279449462890625, 0.13570404052734375, 0.143463134765625, 0.15122222900390625, 0.1589813232421875, 0.16674041748046875, 0.17449951171875, 0.18225860595703125, 0.1900177001953125, 0.19777679443359375, 0.205535888671875, 0.21329498291015625, 0.2210540771484375, 0.22881317138671875, 0.236572265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 10.0, 7.0, 13.0, 31.0, 27.0, 44.0, 57.0, 72.0, 83.0, 110.0, 109.0, 92.0, 70.0, 76.0, 58.0, 36.0, 45.0, 20.0, 12.0, 9.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8973208665847778, -1.8465251922607422, -1.795729637145996, -1.7449339628219604, -1.6941382884979248, -1.6433427333831787, -1.592547059059143, -1.5417513847351074, -1.4909558296203613, -1.4401601552963257, -1.3893646001815796, -1.338568925857544, -1.2877733707427979, -1.2369776964187622, -1.1861820220947266, -1.1353864669799805, -1.0845907926559448, -1.0337951183319092, -0.9829995632171631, -0.9322038888931274, -0.8814082741737366, -0.8306126594543457, -0.7798169851303101, -0.7290213704109192, -0.6782257556915283, -0.6274301409721375, -0.5766345262527466, -0.5258388519287109, -0.47504323720932007, -0.4242476224899292, -0.37345197796821594, -0.3226563334465027, -0.2718607187271118, -0.22106508910655975, -0.1702694594860077, -0.11947382986545563, -0.06867820024490356, -0.017882585525512695, 0.03291305899620056, 0.08370870351791382, 0.1345043182373047, 0.18529994785785675, 0.2360955774784088, 0.28689122200012207, 0.33768683671951294, 0.3884824514389038, 0.43927809596061707, 0.4900737404823303, 0.5408693552017212, 0.5916649699211121, 0.6424605846405029, 0.6932562589645386, 0.7440518736839294, 0.7948474884033203, 0.845643162727356, 0.8964387774467468, 0.9472343921661377, 0.9980300068855286, 1.0488256216049194, 1.099621295928955, 1.1504168510437012, 1.2012125253677368, 1.2520081996917725, 1.3028037548065186, 1.3535994291305542]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 6.0, 4.0, 10.0, 7.0, 11.0, 7.0, 9.0, 18.0, 21.0, 29.0, 23.0, 26.0, 34.0, 30.0, 31.0, 30.0, 37.0, 34.0, 49.0, 41.0, 46.0, 44.0, 32.0, 45.0, 36.0, 25.0, 28.0, 23.0, 38.0, 20.0, 27.0, 29.0, 23.0, 21.0, 17.0, 10.0, 11.0, 10.0, 8.0, 8.0, 10.0, 5.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.7454402446746826, -0.7218136191368103, -0.6981869339942932, -0.6745603084564209, -0.6509336233139038, -0.6273069977760315, -0.6036803126335144, -0.5800536870956421, -0.556427001953125, -0.5328003764152527, -0.5091736912727356, -0.4855470359325409, -0.4619203805923462, -0.4382937252521515, -0.4146670699119568, -0.3910404443740845, -0.36741378903388977, -0.34378713369369507, -0.32016047835350037, -0.29653382301330566, -0.27290716767311096, -0.24928051233291626, -0.22565387189388275, -0.20202721655368805, -0.17840056121349335, -0.15477390587329865, -0.13114725053310394, -0.10752060264348984, -0.08389394730329514, -0.06026729196310043, -0.03664064407348633, -0.013013988733291626, 0.010612666606903076, 0.03423932194709778, 0.05786597356200218, 0.08149262517690659, 0.10511928051710129, 0.1287459433078766, 0.1523725837469101, 0.1759992390871048, 0.1996258944272995, 0.2232525497674942, 0.2468792051076889, 0.2705058455467224, 0.2941325008869171, 0.3177591562271118, 0.3413858115673065, 0.3650124669075012, 0.3886391222476959, 0.4122657775878906, 0.4358924329280853, 0.45951908826828003, 0.48314574360847473, 0.5067723989486694, 0.5303990244865417, 0.5540257096290588, 0.5776523351669312, 0.6012789607048035, 0.6249056458473206, 0.6485322713851929, 0.67215895652771, 0.6957855820655823, 0.7194122672080994, 0.7430388927459717, 0.7666655778884888]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 11.0, 12.0, 26.0, 45.0, 55.0, 104.0, 153.0, 234.0, 325.0, 527.0, 893.0, 1441.0, 2414.0, 4184.0, 8302.0, 20392.0, 68455.0, 275560.0, 439714.0, 158614.0, 39068.0, 13503.0, 6170.0, 3302.0, 1877.0, 1237.0, 722.0, 420.0, 252.0, 167.0, 114.0, 78.0, 55.0, 30.0, 30.0, 9.0, 8.0, 13.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32861328125, -0.3181114196777344, -0.30760955810546875, -0.2971076965332031, -0.2866058349609375, -0.2761039733886719, -0.26560211181640625, -0.2551002502441406, -0.244598388671875, -0.23409652709960938, -0.22359466552734375, -0.21309280395507812, -0.2025909423828125, -0.19208908081054688, -0.18158721923828125, -0.17108535766601562, -0.16058349609375, -0.15008163452148438, -0.13957977294921875, -0.12907791137695312, -0.1185760498046875, -0.10807418823242188, -0.09757232666015625, -0.08707046508789062, -0.076568603515625, -0.06606674194335938, -0.05556488037109375, -0.045063018798828125, -0.0345611572265625, -0.024059295654296875, -0.01355743408203125, -0.003055572509765625, 0.0074462890625, 0.017948150634765625, 0.02845001220703125, 0.038951873779296875, 0.0494537353515625, 0.059955596923828125, 0.07045745849609375, 0.08095932006835938, 0.091461181640625, 0.10196304321289062, 0.11246490478515625, 0.12296676635742188, 0.1334686279296875, 0.14397048950195312, 0.15447235107421875, 0.16497421264648438, 0.17547607421875, 0.18597793579101562, 0.19647979736328125, 0.20698165893554688, 0.2174835205078125, 0.22798538208007812, 0.23848724365234375, 0.24898910522460938, 0.259490966796875, 0.2699928283691406, 0.28049468994140625, 0.2909965515136719, 0.3014984130859375, 0.3120002746582031, 0.32250213623046875, 0.3330039978027344, 0.343505859375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 11.0, 6.0, 10.0, 15.0, 12.0, 16.0, 25.0, 26.0, 18.0, 37.0, 40.0, 35.0, 36.0, 44.0, 43.0, 47.0, 38.0, 37.0, 51.0, 43.0, 47.0, 39.0, 43.0, 38.0, 35.0, 27.0, 30.0, 25.0, 26.0, 25.0, 19.0, 16.0, 14.0, 7.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.179443359375, -0.17399024963378906, -0.16853713989257812, -0.1630840301513672, -0.15763092041015625, -0.1521778106689453, -0.14672470092773438, -0.14127159118652344, -0.1358184814453125, -0.13036537170410156, -0.12491226196289062, -0.11945915222167969, -0.11400604248046875, -0.10855293273925781, -0.10309982299804688, -0.09764671325683594, -0.092193603515625, -0.08674049377441406, -0.08128738403320312, -0.07583427429199219, -0.07038116455078125, -0.06492805480957031, -0.059474945068359375, -0.05402183532714844, -0.0485687255859375, -0.04311561584472656, -0.037662506103515625, -0.03220939636230469, -0.02675628662109375, -0.021303176879882812, -0.015850067138671875, -0.010396957397460938, -0.00494384765625, 0.0005092620849609375, 0.005962371826171875, 0.011415481567382812, 0.01686859130859375, 0.022321701049804688, 0.027774810791015625, 0.03322792053222656, 0.0386810302734375, 0.04413414001464844, 0.049587249755859375, 0.05504035949707031, 0.06049346923828125, 0.06594657897949219, 0.07139968872070312, 0.07685279846191406, 0.082305908203125, 0.08775901794433594, 0.09321212768554688, 0.09866523742675781, 0.10411834716796875, 0.10957145690917969, 0.11502456665039062, 0.12047767639160156, 0.1259307861328125, 0.13138389587402344, 0.13683700561523438, 0.1422901153564453, 0.14774322509765625, 0.1531963348388672, 0.15864944458007812, 0.16410255432128906, 0.1695556640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 11.0, 16.0, 24.0, 38.0, 57.0, 89.0, 138.0, 200.0, 371.0, 614.0, 936.0, 1548.0, 2564.0, 4281.0, 7644.0, 13978.0, 29546.0, 71308.0, 186616.0, 335770.0, 228893.0, 90110.0, 35954.0, 16812.0, 8612.0, 5021.0, 2932.0, 1697.0, 1106.0, 628.0, 358.0, 249.0, 164.0, 92.0, 61.0, 37.0, 28.0, 19.0, 13.0, 5.0, 7.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1876220703125, -0.18106651306152344, -0.17451095581054688, -0.1679553985595703, -0.16139984130859375, -0.1548442840576172, -0.14828872680664062, -0.14173316955566406, -0.1351776123046875, -0.12862205505371094, -0.12206649780273438, -0.11551094055175781, -0.10895538330078125, -0.10239982604980469, -0.09584426879882812, -0.08928871154785156, -0.082733154296875, -0.07617759704589844, -0.06962203979492188, -0.06306648254394531, -0.05651092529296875, -0.04995536804199219, -0.043399810791015625, -0.03684425354003906, -0.0302886962890625, -0.023733139038085938, -0.017177581787109375, -0.010622024536132812, -0.00406646728515625, 0.0024890899658203125, 0.009044647216796875, 0.015600204467773438, 0.02215576171875, 0.028711318969726562, 0.035266876220703125, 0.04182243347167969, 0.04837799072265625, 0.05493354797363281, 0.061489105224609375, 0.06804466247558594, 0.0746002197265625, 0.08115577697753906, 0.08771133422851562, 0.09426689147949219, 0.10082244873046875, 0.10737800598144531, 0.11393356323242188, 0.12048912048339844, 0.127044677734375, 0.13360023498535156, 0.14015579223632812, 0.1467113494873047, 0.15326690673828125, 0.1598224639892578, 0.16637802124023438, 0.17293357849121094, 0.1794891357421875, 0.18604469299316406, 0.19260025024414062, 0.1991558074951172, 0.20571136474609375, 0.2122669219970703, 0.21882247924804688, 0.22537803649902344, 0.23193359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 9.0, 6.0, 0.0, 4.0, 8.0, 11.0, 10.0, 15.0, 18.0, 14.0, 20.0, 24.0, 29.0, 34.0, 32.0, 35.0, 34.0, 37.0, 54.0, 33.0, 46.0, 38.0, 39.0, 47.0, 42.0, 36.0, 40.0, 44.0, 36.0, 27.0, 26.0, 24.0, 20.0, 27.0, 19.0, 12.0, 18.0, 10.0, 2.0, 6.0, 8.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.473876953125, -0.460113525390625, -0.44635009765625, -0.432586669921875, -0.4188232421875, -0.405059814453125, -0.39129638671875, -0.377532958984375, -0.36376953125, -0.350006103515625, -0.33624267578125, -0.322479248046875, -0.3087158203125, -0.294952392578125, -0.28118896484375, -0.267425537109375, -0.253662109375, -0.239898681640625, -0.22613525390625, -0.212371826171875, -0.1986083984375, -0.184844970703125, -0.17108154296875, -0.157318115234375, -0.1435546875, -0.129791259765625, -0.11602783203125, -0.102264404296875, -0.0885009765625, -0.074737548828125, -0.06097412109375, -0.047210693359375, -0.033447265625, -0.019683837890625, -0.00592041015625, 0.007843017578125, 0.0216064453125, 0.035369873046875, 0.04913330078125, 0.062896728515625, 0.07666015625, 0.090423583984375, 0.10418701171875, 0.117950439453125, 0.1317138671875, 0.145477294921875, 0.15924072265625, 0.173004150390625, 0.186767578125, 0.200531005859375, 0.21429443359375, 0.228057861328125, 0.2418212890625, 0.255584716796875, 0.26934814453125, 0.283111572265625, 0.296875, 0.310638427734375, 0.32440185546875, 0.338165283203125, 0.3519287109375, 0.365692138671875, 0.37945556640625, 0.393218994140625, 0.406982421875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 11.0, 7.0, 18.0, 21.0, 26.0, 28.0, 61.0, 90.0, 154.0, 224.0, 454.0, 722.0, 1090.0, 1883.0, 3279.0, 5775.0, 10312.0, 19480.0, 39068.0, 85525.0, 188930.0, 291719.0, 209906.0, 98232.0, 43848.0, 21371.0, 11076.0, 6345.0, 3572.0, 2164.0, 1236.0, 749.0, 440.0, 274.0, 169.0, 129.0, 57.0, 40.0, 16.0, 21.0, 11.0, 9.0, 6.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.07489013671875, -0.0727243423461914, -0.07055854797363281, -0.06839275360107422, -0.06622695922851562, -0.06406116485595703, -0.06189537048339844, -0.059729576110839844, -0.05756378173828125, -0.055397987365722656, -0.05323219299316406, -0.05106639862060547, -0.048900604248046875, -0.04673480987548828, -0.04456901550292969, -0.042403221130371094, -0.0402374267578125, -0.038071632385253906, -0.03590583801269531, -0.03374004364013672, -0.031574249267578125, -0.02940845489501953, -0.027242660522460938, -0.025076866149902344, -0.02291107177734375, -0.020745277404785156, -0.018579483032226562, -0.01641368865966797, -0.014247894287109375, -0.012082099914550781, -0.009916305541992188, -0.007750511169433594, -0.005584716796875, -0.0034189224243164062, -0.0012531280517578125, 0.0009126663208007812, 0.003078460693359375, 0.005244255065917969, 0.0074100494384765625, 0.009575843811035156, 0.01174163818359375, 0.013907432556152344, 0.016073226928710938, 0.01823902130126953, 0.020404815673828125, 0.02257061004638672, 0.024736404418945312, 0.026902198791503906, 0.0290679931640625, 0.031233787536621094, 0.03339958190917969, 0.03556537628173828, 0.037731170654296875, 0.03989696502685547, 0.04206275939941406, 0.044228553771972656, 0.04639434814453125, 0.048560142517089844, 0.05072593688964844, 0.05289173126220703, 0.055057525634765625, 0.05722332000732422, 0.05938911437988281, 0.061554908752441406, 0.063720703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 9.0, 12.0, 19.0, 15.0, 23.0, 28.0, 63.0, 71.0, 100.0, 104.0, 122.0, 103.0, 86.0, 60.0, 44.0, 43.0, 22.0, 17.0, 15.0, 14.0, 10.0, 2.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.522634506225586e-05, -3.3991411328315735e-05, -3.275647759437561e-05, -3.1521543860435486e-05, -3.028661012649536e-05, -2.9051676392555237e-05, -2.7816742658615112e-05, -2.6581808924674988e-05, -2.5346875190734863e-05, -2.411194145679474e-05, -2.2877007722854614e-05, -2.164207398891449e-05, -2.0407140254974365e-05, -1.917220652103424e-05, -1.7937272787094116e-05, -1.6702339053153992e-05, -1.5467405319213867e-05, -1.4232471585273743e-05, -1.2997537851333618e-05, -1.1762604117393494e-05, -1.0527670383453369e-05, -9.292736649513245e-06, -8.05780291557312e-06, -6.822869181632996e-06, -5.587935447692871e-06, -4.353001713752747e-06, -3.118067979812622e-06, -1.8831342458724976e-06, -6.48200511932373e-07, 5.867332220077515e-07, 1.821666955947876e-06, 3.0566006898880005e-06, 4.291534423828125e-06, 5.5264681577682495e-06, 6.761401891708374e-06, 7.996335625648499e-06, 9.231269359588623e-06, 1.0466203093528748e-05, 1.1701136827468872e-05, 1.2936070561408997e-05, 1.4171004295349121e-05, 1.5405938029289246e-05, 1.664087176322937e-05, 1.7875805497169495e-05, 1.911073923110962e-05, 2.0345672965049744e-05, 2.1580606698989868e-05, 2.2815540432929993e-05, 2.4050474166870117e-05, 2.5285407900810242e-05, 2.6520341634750366e-05, 2.775527536869049e-05, 2.8990209102630615e-05, 3.022514283657074e-05, 3.1460076570510864e-05, 3.269501030445099e-05, 3.392994403839111e-05, 3.516487777233124e-05, 3.639981150627136e-05, 3.763474524021149e-05, 3.886967897415161e-05, 4.0104612708091736e-05, 4.133954644203186e-05, 4.2574480175971985e-05, 4.380941390991211e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 11.0, 10.0, 12.0, 25.0, 36.0, 32.0, 83.0, 94.0, 159.0, 233.0, 388.0, 626.0, 994.0, 1776.0, 3240.0, 5878.0, 11748.0, 24345.0, 52741.0, 118013.0, 236626.0, 279817.0, 166853.0, 76129.0, 34490.0, 16130.0, 8275.0, 4189.0, 2257.0, 1273.0, 767.0, 425.0, 293.0, 179.0, 130.0, 89.0, 54.0, 42.0, 20.0, 22.0, 14.0, 12.0, 9.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06787109375, -0.06554889678955078, -0.06322669982910156, -0.060904502868652344, -0.058582305908203125, -0.056260108947753906, -0.05393791198730469, -0.05161571502685547, -0.04929351806640625, -0.04697132110595703, -0.04464912414550781, -0.042326927185058594, -0.040004730224609375, -0.037682533264160156, -0.03536033630371094, -0.03303813934326172, -0.0307159423828125, -0.02839374542236328, -0.026071548461914062, -0.023749351501464844, -0.021427154541015625, -0.019104957580566406, -0.016782760620117188, -0.014460563659667969, -0.01213836669921875, -0.009816169738769531, -0.0074939727783203125, -0.005171775817871094, -0.002849578857421875, -0.0005273818969726562, 0.0017948150634765625, 0.004117012023925781, 0.006439208984375, 0.008761405944824219, 0.011083602905273438, 0.013405799865722656, 0.015727996826171875, 0.018050193786621094, 0.020372390747070312, 0.02269458770751953, 0.02501678466796875, 0.02733898162841797, 0.029661178588867188, 0.031983375549316406, 0.034305572509765625, 0.036627769470214844, 0.03894996643066406, 0.04127216339111328, 0.0435943603515625, 0.04591655731201172, 0.04823875427246094, 0.050560951232910156, 0.052883148193359375, 0.055205345153808594, 0.05752754211425781, 0.05984973907470703, 0.06217193603515625, 0.06449413299560547, 0.06681632995605469, 0.0691385269165039, 0.07146072387695312, 0.07378292083740234, 0.07610511779785156, 0.07842731475830078, 0.08074951171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 4.0, 8.0, 12.0, 24.0, 23.0, 22.0, 29.0, 45.0, 64.0, 65.0, 68.0, 99.0, 73.0, 82.0, 70.0, 65.0, 44.0, 36.0, 34.0, 22.0, 22.0, 15.0, 12.0, 3.0, 8.0, 6.0, 5.0, 3.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10406494140625, -0.10065841674804688, -0.09725189208984375, -0.09384536743164062, -0.0904388427734375, -0.08703231811523438, -0.08362579345703125, -0.08021926879882812, -0.076812744140625, -0.07340621948242188, -0.06999969482421875, -0.06659317016601562, -0.0631866455078125, -0.059780120849609375, -0.05637359619140625, -0.052967071533203125, -0.049560546875, -0.046154022216796875, -0.04274749755859375, -0.039340972900390625, -0.0359344482421875, -0.032527923583984375, -0.02912139892578125, -0.025714874267578125, -0.022308349609375, -0.018901824951171875, -0.01549530029296875, -0.012088775634765625, -0.0086822509765625, -0.005275726318359375, -0.00186920166015625, 0.001537322998046875, 0.00494384765625, 0.008350372314453125, 0.01175689697265625, 0.015163421630859375, 0.0185699462890625, 0.021976470947265625, 0.02538299560546875, 0.028789520263671875, 0.032196044921875, 0.035602569580078125, 0.03900909423828125, 0.042415618896484375, 0.0458221435546875, 0.049228668212890625, 0.05263519287109375, 0.056041717529296875, 0.0594482421875, 0.06285476684570312, 0.06626129150390625, 0.06966781616210938, 0.0730743408203125, 0.07648086547851562, 0.07988739013671875, 0.08329391479492188, 0.086700439453125, 0.09010696411132812, 0.09351348876953125, 0.09692001342773438, 0.1003265380859375, 0.10373306274414062, 0.10713958740234375, 0.11054611206054688, 0.11395263671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 13.0, 28.0, 53.0, 79.0, 125.0, 174.0, 163.0, 138.0, 98.0, 50.0, 32.0, 14.0, 12.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8534231185913086, -1.7811224460601807, -1.7088216543197632, -1.6365209817886353, -1.5642201900482178, -1.4919195175170898, -1.419618844985962, -1.3473180532455444, -1.275017261505127, -1.202716588973999, -1.1304157972335815, -1.0581151247024536, -0.9858143329620361, -0.9135136604309082, -0.8412129282951355, -0.7689121961593628, -0.6966115236282349, -0.6243107914924622, -0.5520100593566895, -0.47970935702323914, -0.40740862488746643, -0.3351078927516937, -0.2628071904182434, -0.1905064582824707, -0.118205726146698, -0.04590500146150589, 0.026395723223686218, 0.09869644045829773, 0.17099717259407043, 0.24329790472984314, 0.31559860706329346, 0.38789933919906616, 0.46020007133483887, 0.5325008034706116, 0.6048015356063843, 0.6771022081375122, 0.7494029998779297, 0.8217036724090576, 0.8940044045448303, 0.966305136680603, 1.0386059284210205, 1.1109066009521484, 1.183207392692566, 1.2555080652236938, 1.3278088569641113, 1.4001095294952393, 1.4724102020263672, 1.5447109937667847, 1.6170116662979126, 1.6893123388290405, 1.761613130569458, 1.833913803100586, 1.9062145948410034, 1.9785152673721313, 2.050816059112549, 2.1231167316436768, 2.1954174041748047, 2.2677180767059326, 2.3400187492370605, 2.4123196601867676, 2.4846203327178955, 2.5569210052490234, 2.6292216777801514, 2.7015223503112793, 2.7738232612609863]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 5.0, 5.0, 7.0, 12.0, 14.0, 15.0, 14.0, 23.0, 20.0, 22.0, 24.0, 18.0, 21.0, 39.0, 30.0, 34.0, 33.0, 41.0, 47.0, 48.0, 54.0, 43.0, 43.0, 48.0, 35.0, 35.0, 37.0, 37.0, 31.0, 31.0, 28.0, 18.0, 14.0, 9.0, 17.0, 10.0, 6.0, 9.0, 6.0, 7.0, 2.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.172210931777954, -1.1371248960494995, -1.1020389795303345, -1.0669529438018799, -1.0318669080734253, -0.9967809915542603, -0.9616949558258057, -0.9266089797019958, -0.891523003578186, -0.8564370274543762, -0.8213509917259216, -0.7862650156021118, -0.751179039478302, -0.7160930633544922, -0.6810070276260376, -0.6459210515022278, -0.6108350157737732, -0.5757490396499634, -0.5406630039215088, -0.505577027797699, -0.47049105167388916, -0.43540504574775696, -0.40031903982162476, -0.36523306369781494, -0.33014705777168274, -0.29506105184555054, -0.2599750757217407, -0.22488906979560852, -0.1898030787706375, -0.1547170877456665, -0.1196310818195343, -0.0845450907945633, -0.049459099769592285, -0.014373105019330978, 0.02071288973093033, 0.055798888206481934, 0.09088487923145294, 0.12597087025642395, 0.16105687618255615, 0.19614286720752716, 0.23122885823249817, 0.26631486415863037, 0.3014008402824402, 0.3364868462085724, 0.3715728521347046, 0.4066588282585144, 0.4417448341846466, 0.4768308401107788, 0.5119168162345886, 0.5470027923583984, 0.582088828086853, 0.6171748042106628, 0.6522607803344727, 0.6873468160629272, 0.7224327921867371, 0.7575187683105469, 0.7926048040390015, 0.8276907801628113, 0.8627768158912659, 0.8978627920150757, 0.9329487681388855, 0.9680347442626953, 1.00312077999115, 1.0382068157196045, 1.0732927322387695]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 15.0, 9.0, 18.0, 24.0, 46.0, 88.0, 153.0, 246.0, 545.0, 1157.0, 2312.0, 5682.0, 13987.0, 40792.0, 156064.0, 708404.0, 1983365.0, 979478.0, 217295.0, 54369.0, 17379.0, 6992.0, 2919.0, 1424.0, 669.0, 360.0, 199.0, 117.0, 53.0, 47.0, 23.0, 17.0, 10.0, 7.0, 2.0, 5.0, 0.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2344970703125, -0.2273082733154297, -0.22011947631835938, -0.21293067932128906, -0.20574188232421875, -0.19855308532714844, -0.19136428833007812, -0.1841754913330078, -0.1769866943359375, -0.1697978973388672, -0.16260910034179688, -0.15542030334472656, -0.14823150634765625, -0.14104270935058594, -0.13385391235351562, -0.1266651153564453, -0.119476318359375, -0.11228752136230469, -0.10509872436523438, -0.09790992736816406, -0.09072113037109375, -0.08353233337402344, -0.07634353637695312, -0.06915473937988281, -0.0619659423828125, -0.05477714538574219, -0.047588348388671875, -0.04039955139160156, -0.03321075439453125, -0.026021957397460938, -0.018833160400390625, -0.011644363403320312, -0.00445556640625, 0.0027332305908203125, 0.009922027587890625, 0.017110824584960938, 0.02429962158203125, 0.03148841857910156, 0.038677215576171875, 0.04586601257324219, 0.0530548095703125, 0.06024360656738281, 0.06743240356445312, 0.07462120056152344, 0.08180999755859375, 0.08899879455566406, 0.09618759155273438, 0.10337638854980469, 0.110565185546875, 0.11775398254394531, 0.12494277954101562, 0.13213157653808594, 0.13932037353515625, 0.14650917053222656, 0.15369796752929688, 0.1608867645263672, 0.1680755615234375, 0.1752643585205078, 0.18245315551757812, 0.18964195251464844, 0.19683074951171875, 0.20401954650878906, 0.21120834350585938, 0.2183971405029297, 0.2255859375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 11.0, 16.0, 10.0, 10.0, 25.0, 20.0, 31.0, 35.0, 39.0, 55.0, 53.0, 50.0, 43.0, 46.0, 51.0, 52.0, 57.0, 52.0, 37.0, 39.0, 46.0, 36.0, 33.0, 34.0, 19.0, 20.0, 18.0, 16.0, 13.0, 9.0, 8.0, 4.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1641845703125, -0.1586742401123047, -0.15316390991210938, -0.14765357971191406, -0.14214324951171875, -0.13663291931152344, -0.13112258911132812, -0.1256122589111328, -0.1201019287109375, -0.11459159851074219, -0.10908126831054688, -0.10357093811035156, -0.09806060791015625, -0.09255027770996094, -0.08703994750976562, -0.08152961730957031, -0.076019287109375, -0.07050895690917969, -0.06499862670898438, -0.05948829650878906, -0.05397796630859375, -0.04846763610839844, -0.042957305908203125, -0.03744697570800781, -0.0319366455078125, -0.026426315307617188, -0.020915985107421875, -0.015405654907226562, -0.00989532470703125, -0.0043849945068359375, 0.001125335693359375, 0.0066356658935546875, 0.01214599609375, 0.017656326293945312, 0.023166656494140625, 0.028676986694335938, 0.03418731689453125, 0.03969764709472656, 0.045207977294921875, 0.05071830749511719, 0.0562286376953125, 0.06173896789550781, 0.06724929809570312, 0.07275962829589844, 0.07826995849609375, 0.08378028869628906, 0.08929061889648438, 0.09480094909667969, 0.100311279296875, 0.10582160949707031, 0.11133193969726562, 0.11684226989746094, 0.12235260009765625, 0.12786293029785156, 0.13337326049804688, 0.1388835906982422, 0.1443939208984375, 0.1499042510986328, 0.15541458129882812, 0.16092491149902344, 0.16643524169921875, 0.17194557189941406, 0.17745590209960938, 0.1829662322998047, 0.1884765625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 12.0, 15.0, 15.0, 16.0, 34.0, 65.0, 87.0, 137.0, 252.0, 387.0, 695.0, 1160.0, 2042.0, 3727.0, 7250.0, 14872.0, 33577.0, 84712.0, 256180.0, 1067177.0, 1975919.0, 506165.0, 143483.0, 52200.0, 21968.0, 10346.0, 5145.0, 2792.0, 1531.0, 895.0, 506.0, 338.0, 189.0, 144.0, 84.0, 59.0, 35.0, 31.0, 17.0, 11.0, 7.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1854248046875, -0.1786212921142578, -0.17181777954101562, -0.16501426696777344, -0.15821075439453125, -0.15140724182128906, -0.14460372924804688, -0.1378002166748047, -0.1309967041015625, -0.12419319152832031, -0.11738967895507812, -0.11058616638183594, -0.10378265380859375, -0.09697914123535156, -0.09017562866210938, -0.08337211608886719, -0.076568603515625, -0.06976509094238281, -0.06296157836914062, -0.05615806579589844, -0.04935455322265625, -0.04255104064941406, -0.035747528076171875, -0.028944015502929688, -0.0221405029296875, -0.015336990356445312, -0.008533477783203125, -0.0017299652099609375, 0.00507354736328125, 0.011877059936523438, 0.018680572509765625, 0.025484085083007812, 0.03228759765625, 0.03909111022949219, 0.045894622802734375, 0.05269813537597656, 0.05950164794921875, 0.06630516052246094, 0.07310867309570312, 0.07991218566894531, 0.0867156982421875, 0.09351921081542969, 0.10032272338867188, 0.10712623596191406, 0.11392974853515625, 0.12073326110839844, 0.12753677368164062, 0.1343402862548828, 0.141143798828125, 0.1479473114013672, 0.15475082397460938, 0.16155433654785156, 0.16835784912109375, 0.17516136169433594, 0.18196487426757812, 0.1887683868408203, 0.1955718994140625, 0.2023754119873047, 0.20917892456054688, 0.21598243713378906, 0.22278594970703125, 0.22958946228027344, 0.23639297485351562, 0.2431964874267578, 0.25]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 6.0, 7.0, 8.0, 6.0, 13.0, 14.0, 22.0, 25.0, 28.0, 40.0, 47.0, 61.0, 92.0, 111.0, 137.0, 183.0, 248.0, 389.0, 481.0, 506.0, 423.0, 316.0, 223.0, 157.0, 121.0, 93.0, 57.0, 50.0, 47.0, 23.0, 27.0, 24.0, 20.0, 16.0, 13.0, 7.0, 6.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.222412109375, -0.2150402069091797, -0.20766830444335938, -0.20029640197753906, -0.19292449951171875, -0.18555259704589844, -0.17818069458007812, -0.1708087921142578, -0.1634368896484375, -0.1560649871826172, -0.14869308471679688, -0.14132118225097656, -0.13394927978515625, -0.12657737731933594, -0.11920547485351562, -0.11183357238769531, -0.104461669921875, -0.09708976745605469, -0.08971786499023438, -0.08234596252441406, -0.07497406005859375, -0.06760215759277344, -0.060230255126953125, -0.05285835266113281, -0.0454864501953125, -0.03811454772949219, -0.030742645263671875, -0.023370742797851562, -0.01599884033203125, -0.008626937866210938, -0.001255035400390625, 0.0061168670654296875, 0.01348876953125, 0.020860671997070312, 0.028232574462890625, 0.03560447692871094, 0.04297637939453125, 0.05034828186035156, 0.057720184326171875, 0.06509208679199219, 0.0724639892578125, 0.07983589172363281, 0.08720779418945312, 0.09457969665527344, 0.10195159912109375, 0.10932350158691406, 0.11669540405273438, 0.12406730651855469, 0.131439208984375, 0.1388111114501953, 0.14618301391601562, 0.15355491638183594, 0.16092681884765625, 0.16829872131347656, 0.17567062377929688, 0.1830425262451172, 0.1904144287109375, 0.1977863311767578, 0.20515823364257812, 0.21253013610839844, 0.21990203857421875, 0.22727394104003906, 0.23464584350585938, 0.2420177459716797, 0.2493896484375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 14.0, 20.0, 30.0, 55.0, 78.0, 110.0, 127.0, 150.0, 130.0, 104.0, 64.0, 58.0, 20.0, 11.0, 11.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.002749443054199, -1.9293506145477295, -1.8559517860412598, -1.78255295753479, -1.7091541290283203, -1.6357553005218506, -1.5623564720153809, -1.4889576435089111, -1.4155588150024414, -1.3421599864959717, -1.268761157989502, -1.1953623294830322, -1.1219635009765625, -1.0485646724700928, -0.975165843963623, -0.9017670154571533, -0.8283681869506836, -0.7549693584442139, -0.6815705299377441, -0.6081717014312744, -0.5347728729248047, -0.46137404441833496, -0.38797521591186523, -0.3145763874053955, -0.24117755889892578, -0.16777873039245605, -0.09437990188598633, -0.0209810733795166, 0.052417755126953125, 0.12581658363342285, 0.19921541213989258, 0.2726142406463623, 0.34601330757141113, 0.41941213607788086, 0.4928109645843506, 0.5662097930908203, 0.63960862159729, 0.7130074501037598, 0.7864062786102295, 0.8598051071166992, 0.933203935623169, 1.0066027641296387, 1.0800015926361084, 1.1534004211425781, 1.2267992496490479, 1.3001980781555176, 1.3735969066619873, 1.446995735168457, 1.5203945636749268, 1.5937933921813965, 1.6671922206878662, 1.740591049194336, 1.8139898777008057, 1.8873887062072754, 1.9607875347137451, 2.034186363220215, 2.1075851917266846, 2.1809840202331543, 2.254382848739624, 2.3277816772460938, 2.4011805057525635, 2.474579334259033, 2.547978162765503, 2.6213769912719727, 2.6947758197784424]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 5.0, 7.0, 12.0, 12.0, 10.0, 15.0, 19.0, 25.0, 30.0, 36.0, 27.0, 37.0, 38.0, 53.0, 41.0, 54.0, 47.0, 52.0, 61.0, 45.0, 53.0, 47.0, 35.0, 41.0, 33.0, 34.0, 29.0, 21.0, 16.0, 7.0, 8.0, 15.0, 6.0, 6.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1127369403839111, -1.0802067518234253, -1.0476765632629395, -1.0151463747024536, -0.9826161861419678, -0.9500859975814819, -0.9175558090209961, -0.8850256204605103, -0.8524954319000244, -0.8199652433395386, -0.7874350547790527, -0.7549048662185669, -0.722374677658081, -0.6898444890975952, -0.6573143005371094, -0.6247841119766235, -0.5922539234161377, -0.5597237348556519, -0.527193546295166, -0.4946633577346802, -0.46213316917419434, -0.4296029806137085, -0.39707279205322266, -0.3645426034927368, -0.332012414932251, -0.29948222637176514, -0.2669520378112793, -0.23442184925079346, -0.20189166069030762, -0.16936147212982178, -0.13683128356933594, -0.1043010950088501, -0.07177096605300903, -0.03924077749252319, -0.0067105889320373535, 0.025819599628448486, 0.058349788188934326, 0.09087997674942017, 0.123410165309906, 0.15594035387039185, 0.18847054243087769, 0.22100073099136353, 0.25353091955184937, 0.2860611081123352, 0.31859129667282104, 0.3511214852333069, 0.3836516737937927, 0.41618186235427856, 0.4487120509147644, 0.48124223947525024, 0.5137724280357361, 0.5463026165962219, 0.5788328051567078, 0.6113629937171936, 0.6438931822776794, 0.6764233708381653, 0.7089535593986511, 0.741483747959137, 0.7740139365196228, 0.8065441250801086, 0.8390743136405945, 0.8716045022010803, 0.9041346907615662, 0.936664879322052, 0.9691950678825378]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 12.0, 17.0, 25.0, 39.0, 47.0, 53.0, 95.0, 133.0, 197.0, 281.0, 441.0, 656.0, 1050.0, 1595.0, 2583.0, 4052.0, 6892.0, 11633.0, 20316.0, 36193.0, 65768.0, 116768.0, 182548.0, 212743.0, 161067.0, 97096.0, 54344.0, 30035.0, 16767.0, 9800.0, 5645.0, 3522.0, 2184.0, 1370.0, 832.0, 586.0, 379.0, 246.0, 169.0, 121.0, 66.0, 80.0, 37.0, 23.0, 17.0, 12.0, 9.0, 3.0, 5.0, 5.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.1319580078125, -0.12799930572509766, -0.12404060363769531, -0.12008190155029297, -0.11612319946289062, -0.11216449737548828, -0.10820579528808594, -0.1042470932006836, -0.10028839111328125, -0.0963296890258789, -0.09237098693847656, -0.08841228485107422, -0.08445358276367188, -0.08049488067626953, -0.07653617858886719, -0.07257747650146484, -0.0686187744140625, -0.06466007232666016, -0.06070137023925781, -0.05674266815185547, -0.052783966064453125, -0.04882526397705078, -0.04486656188964844, -0.040907859802246094, -0.03694915771484375, -0.032990455627441406, -0.029031753540039062, -0.02507305145263672, -0.021114349365234375, -0.01715564727783203, -0.013196945190429688, -0.009238243103027344, -0.005279541015625, -0.0013208389282226562, 0.0026378631591796875, 0.006596565246582031, 0.010555267333984375, 0.014513969421386719, 0.018472671508789062, 0.022431373596191406, 0.02639007568359375, 0.030348777770996094, 0.03430747985839844, 0.03826618194580078, 0.042224884033203125, 0.04618358612060547, 0.05014228820800781, 0.054100990295410156, 0.0580596923828125, 0.062018394470214844, 0.06597709655761719, 0.06993579864501953, 0.07389450073242188, 0.07785320281982422, 0.08181190490722656, 0.0857706069946289, 0.08972930908203125, 0.0936880111694336, 0.09764671325683594, 0.10160541534423828, 0.10556411743164062, 0.10952281951904297, 0.11348152160644531, 0.11744022369384766, 0.12139892578125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 5.0, 8.0, 0.0, 6.0, 5.0, 9.0, 4.0, 18.0, 22.0, 16.0, 19.0, 28.0, 28.0, 24.0, 22.0, 25.0, 33.0, 37.0, 47.0, 42.0, 49.0, 42.0, 43.0, 38.0, 34.0, 35.0, 41.0, 43.0, 35.0, 33.0, 23.0, 16.0, 20.0, 28.0, 23.0, 25.0, 12.0, 12.0, 12.0, 14.0, 8.0, 7.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1817626953125, -0.1766338348388672, -0.17150497436523438, -0.16637611389160156, -0.16124725341796875, -0.15611839294433594, -0.15098953247070312, -0.1458606719970703, -0.1407318115234375, -0.1356029510498047, -0.13047409057617188, -0.12534523010253906, -0.12021636962890625, -0.11508750915527344, -0.10995864868164062, -0.10482978820800781, -0.099700927734375, -0.09457206726074219, -0.08944320678710938, -0.08431434631347656, -0.07918548583984375, -0.07405662536621094, -0.06892776489257812, -0.06379890441894531, -0.0586700439453125, -0.05354118347167969, -0.048412322998046875, -0.04328346252441406, -0.03815460205078125, -0.03302574157714844, -0.027896881103515625, -0.022768020629882812, -0.01763916015625, -0.012510299682617188, -0.007381439208984375, -0.0022525787353515625, 0.00287628173828125, 0.008005142211914062, 0.013134002685546875, 0.018262863159179688, 0.0233917236328125, 0.028520584106445312, 0.033649444580078125, 0.03877830505371094, 0.04390716552734375, 0.04903602600097656, 0.054164886474609375, 0.05929374694824219, 0.064422607421875, 0.06955146789550781, 0.07468032836914062, 0.07980918884277344, 0.08493804931640625, 0.09006690979003906, 0.09519577026367188, 0.10032463073730469, 0.1054534912109375, 0.11058235168457031, 0.11571121215820312, 0.12084007263183594, 0.12596893310546875, 0.13109779357910156, 0.13622665405273438, 0.1413555145263672, 0.146484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 13.0, 6.0, 13.0, 13.0, 32.0, 39.0, 66.0, 102.0, 133.0, 224.0, 345.0, 613.0, 1034.0, 1675.0, 2876.0, 5320.0, 10158.0, 20088.0, 42779.0, 93162.0, 195943.0, 314964.0, 187898.0, 88593.0, 40912.0, 19350.0, 9847.0, 5295.0, 2794.0, 1675.0, 1004.0, 563.0, 391.0, 218.0, 138.0, 80.0, 55.0, 50.0, 31.0, 20.0, 14.0, 10.0, 6.0, 5.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.158935546875, -0.1538848876953125, -0.148834228515625, -0.1437835693359375, -0.13873291015625, -0.1336822509765625, -0.128631591796875, -0.1235809326171875, -0.1185302734375, -0.1134796142578125, -0.108428955078125, -0.1033782958984375, -0.09832763671875, -0.0932769775390625, -0.088226318359375, -0.0831756591796875, -0.078125, -0.0730743408203125, -0.068023681640625, -0.0629730224609375, -0.05792236328125, -0.0528717041015625, -0.047821044921875, -0.0427703857421875, -0.0377197265625, -0.0326690673828125, -0.027618408203125, -0.0225677490234375, -0.01751708984375, -0.0124664306640625, -0.007415771484375, -0.0023651123046875, 0.002685546875, 0.0077362060546875, 0.012786865234375, 0.0178375244140625, 0.02288818359375, 0.0279388427734375, 0.032989501953125, 0.0380401611328125, 0.0430908203125, 0.0481414794921875, 0.053192138671875, 0.0582427978515625, 0.06329345703125, 0.0683441162109375, 0.073394775390625, 0.0784454345703125, 0.08349609375, 0.0885467529296875, 0.093597412109375, 0.0986480712890625, 0.10369873046875, 0.1087493896484375, 0.113800048828125, 0.1188507080078125, 0.1239013671875, 0.1289520263671875, 0.134002685546875, 0.1390533447265625, 0.14410400390625, 0.1491546630859375, 0.154205322265625, 0.1592559814453125, 0.164306640625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 8.0, 7.0, 9.0, 6.0, 14.0, 28.0, 23.0, 30.0, 33.0, 32.0, 44.0, 42.0, 61.0, 64.0, 75.0, 54.0, 53.0, 59.0, 68.0, 58.0, 45.0, 27.0, 31.0, 32.0, 26.0, 20.0, 18.0, 14.0, 8.0, 7.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6484375, -0.6283721923828125, -0.608306884765625, -0.5882415771484375, -0.56817626953125, -0.5481109619140625, -0.528045654296875, -0.5079803466796875, -0.4879150390625, -0.4678497314453125, -0.447784423828125, -0.4277191162109375, -0.40765380859375, -0.3875885009765625, -0.367523193359375, -0.3474578857421875, -0.327392578125, -0.3073272705078125, -0.287261962890625, -0.2671966552734375, -0.24713134765625, -0.2270660400390625, -0.207000732421875, -0.1869354248046875, -0.1668701171875, -0.1468048095703125, -0.126739501953125, -0.1066741943359375, -0.08660888671875, -0.0665435791015625, -0.046478271484375, -0.0264129638671875, -0.00634765625, 0.0137176513671875, 0.033782958984375, 0.0538482666015625, 0.07391357421875, 0.0939788818359375, 0.114044189453125, 0.1341094970703125, 0.1541748046875, 0.1742401123046875, 0.194305419921875, 0.2143707275390625, 0.23443603515625, 0.2545013427734375, 0.274566650390625, 0.2946319580078125, 0.314697265625, 0.3347625732421875, 0.354827880859375, 0.3748931884765625, 0.39495849609375, 0.4150238037109375, 0.435089111328125, 0.4551544189453125, 0.4752197265625, 0.4952850341796875, 0.515350341796875, 0.5354156494140625, 0.55548095703125, 0.5755462646484375, 0.595611572265625, 0.6156768798828125, 0.6357421875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 4.0, 10.0, 14.0, 13.0, 21.0, 35.0, 44.0, 56.0, 80.0, 132.0, 198.0, 283.0, 429.0, 698.0, 1019.0, 1675.0, 2772.0, 4424.0, 7482.0, 12600.0, 21763.0, 37610.0, 66059.0, 112651.0, 175954.0, 233868.0, 149692.0, 91962.0, 53271.0, 30109.0, 17527.0, 10162.0, 6122.0, 3626.0, 2271.0, 1444.0, 819.0, 552.0, 366.0, 253.0, 149.0, 112.0, 75.0, 49.0, 36.0, 18.0, 14.0, 13.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.03179931640625, -0.030844449996948242, -0.029889583587646484, -0.028934717178344727, -0.02797985076904297, -0.02702498435974121, -0.026070117950439453, -0.025115251541137695, -0.024160385131835938, -0.02320551872253418, -0.022250652313232422, -0.021295785903930664, -0.020340919494628906, -0.01938605308532715, -0.01843118667602539, -0.017476320266723633, -0.016521453857421875, -0.015566587448120117, -0.01461172103881836, -0.013656854629516602, -0.012701988220214844, -0.011747121810913086, -0.010792255401611328, -0.00983738899230957, -0.008882522583007812, -0.007927656173706055, -0.006972789764404297, -0.006017923355102539, -0.005063056945800781, -0.0041081905364990234, -0.0031533241271972656, -0.002198457717895508, -0.00124359130859375, -0.0002887248992919922, 0.0006661415100097656, 0.0016210079193115234, 0.0025758743286132812, 0.003530740737915039, 0.004485607147216797, 0.005440473556518555, 0.0063953399658203125, 0.00735020637512207, 0.008305072784423828, 0.009259939193725586, 0.010214805603027344, 0.011169672012329102, 0.01212453842163086, 0.013079404830932617, 0.014034271240234375, 0.014989137649536133, 0.01594400405883789, 0.01689887046813965, 0.017853736877441406, 0.018808603286743164, 0.019763469696044922, 0.02071833610534668, 0.021673202514648438, 0.022628068923950195, 0.023582935333251953, 0.02453780174255371, 0.02549266815185547, 0.026447534561157227, 0.027402400970458984, 0.028357267379760742, 0.0293121337890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 2.0, 11.0, 10.0, 11.0, 11.0, 20.0, 21.0, 24.0, 29.0, 41.0, 48.0, 50.0, 50.0, 81.0, 66.0, 63.0, 61.0, 67.0, 42.0, 51.0, 56.0, 35.0, 30.0, 27.0, 21.0, 12.0, 12.0, 7.0, 7.0, 8.0, 10.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.8715858459472656e-05, -1.8184073269367218e-05, -1.765228807926178e-05, -1.712050288915634e-05, -1.6588717699050903e-05, -1.6056932508945465e-05, -1.5525147318840027e-05, -1.4993362128734589e-05, -1.446157693862915e-05, -1.3929791748523712e-05, -1.3398006558418274e-05, -1.2866221368312836e-05, -1.2334436178207397e-05, -1.180265098810196e-05, -1.1270865797996521e-05, -1.0739080607891083e-05, -1.0207295417785645e-05, -9.675510227680206e-06, -9.143725037574768e-06, -8.61193984746933e-06, -8.080154657363892e-06, -7.548369467258453e-06, -7.016584277153015e-06, -6.484799087047577e-06, -5.953013896942139e-06, -5.4212287068367004e-06, -4.889443516731262e-06, -4.357658326625824e-06, -3.825873136520386e-06, -3.2940879464149475e-06, -2.7623027563095093e-06, -2.230517566204071e-06, -1.6987323760986328e-06, -1.1669471859931946e-06, -6.351619958877563e-07, -1.0337680578231812e-07, 4.284083843231201e-07, 9.601935744285583e-07, 1.4919787645339966e-06, 2.023763954639435e-06, 2.555549144744873e-06, 3.0873343348503113e-06, 3.6191195249557495e-06, 4.150904715061188e-06, 4.682689905166626e-06, 5.214475095272064e-06, 5.7462602853775024e-06, 6.278045475482941e-06, 6.809830665588379e-06, 7.341615855693817e-06, 7.873401045799255e-06, 8.405186235904694e-06, 8.936971426010132e-06, 9.46875661611557e-06, 1.0000541806221008e-05, 1.0532326996326447e-05, 1.1064112186431885e-05, 1.1595897376537323e-05, 1.2127682566642761e-05, 1.26594677567482e-05, 1.3191252946853638e-05, 1.3723038136959076e-05, 1.4254823327064514e-05, 1.4786608517169952e-05, 1.531839370727539e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 10.0, 13.0, 9.0, 14.0, 22.0, 21.0, 30.0, 63.0, 81.0, 125.0, 182.0, 271.0, 402.0, 625.0, 1027.0, 1661.0, 2969.0, 5272.0, 9826.0, 18802.0, 36084.0, 70259.0, 134065.0, 234421.0, 246755.0, 135457.0, 71544.0, 36573.0, 18769.0, 9947.0, 5449.0, 3060.0, 1717.0, 1065.0, 667.0, 434.0, 261.0, 202.0, 121.0, 88.0, 64.0, 29.0, 29.0, 26.0, 16.0, 8.0, 10.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.04437255859375, -0.04306793212890625, -0.0417633056640625, -0.04045867919921875, -0.039154052734375, -0.03784942626953125, -0.0365447998046875, -0.03524017333984375, -0.033935546875, -0.03263092041015625, -0.0313262939453125, -0.03002166748046875, -0.028717041015625, -0.02741241455078125, -0.0261077880859375, -0.02480316162109375, -0.02349853515625, -0.02219390869140625, -0.0208892822265625, -0.01958465576171875, -0.018280029296875, -0.01697540283203125, -0.0156707763671875, -0.01436614990234375, -0.0130615234375, -0.01175689697265625, -0.0104522705078125, -0.00914764404296875, -0.007843017578125, -0.00653839111328125, -0.0052337646484375, -0.00392913818359375, -0.00262451171875, -0.00131988525390625, -1.52587890625e-05, 0.00128936767578125, 0.002593994140625, 0.00389862060546875, 0.0052032470703125, 0.00650787353515625, 0.0078125, 0.00911712646484375, 0.0104217529296875, 0.01172637939453125, 0.013031005859375, 0.01433563232421875, 0.0156402587890625, 0.01694488525390625, 0.01824951171875, 0.01955413818359375, 0.0208587646484375, 0.02216339111328125, 0.023468017578125, 0.02477264404296875, 0.0260772705078125, 0.02738189697265625, 0.0286865234375, 0.02999114990234375, 0.0312957763671875, 0.03260040283203125, 0.033905029296875, 0.03520965576171875, 0.0365142822265625, 0.03781890869140625, 0.03912353515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 5.0, 7.0, 8.0, 13.0, 15.0, 14.0, 15.0, 27.0, 25.0, 41.0, 35.0, 44.0, 50.0, 46.0, 54.0, 68.0, 61.0, 65.0, 52.0, 57.0, 38.0, 35.0, 35.0, 26.0, 35.0, 25.0, 22.0, 17.0, 11.0, 6.0, 9.0, 7.0, 6.0, 6.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06982421875, -0.0679326057434082, -0.0660409927368164, -0.06414937973022461, -0.06225776672363281, -0.060366153717041016, -0.05847454071044922, -0.05658292770385742, -0.054691314697265625, -0.05279970169067383, -0.05090808868408203, -0.049016475677490234, -0.04712486267089844, -0.04523324966430664, -0.043341636657714844, -0.04145002365112305, -0.03955841064453125, -0.03766679763793945, -0.035775184631347656, -0.03388357162475586, -0.03199195861816406, -0.030100345611572266, -0.02820873260498047, -0.026317119598388672, -0.024425506591796875, -0.022533893585205078, -0.02064228057861328, -0.018750667572021484, -0.016859054565429688, -0.01496744155883789, -0.013075828552246094, -0.011184215545654297, -0.0092926025390625, -0.007400989532470703, -0.005509376525878906, -0.0036177635192871094, -0.0017261505126953125, 0.00016546249389648438, 0.0020570755004882812, 0.003948688507080078, 0.005840301513671875, 0.007731914520263672, 0.009623527526855469, 0.011515140533447266, 0.013406753540039062, 0.01529836654663086, 0.017189979553222656, 0.019081592559814453, 0.02097320556640625, 0.022864818572998047, 0.024756431579589844, 0.02664804458618164, 0.028539657592773438, 0.030431270599365234, 0.03232288360595703, 0.03421449661254883, 0.036106109619140625, 0.03799772262573242, 0.03988933563232422, 0.041780948638916016, 0.04367256164550781, 0.04556417465209961, 0.047455787658691406, 0.0493474006652832, 0.051239013671875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 12.0, 19.0, 25.0, 28.0, 54.0, 85.0, 106.0, 129.0, 150.0, 102.0, 101.0, 78.0, 41.0, 30.0, 12.0, 12.0, 4.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3113667964935303, -1.2613438367843628, -1.2113208770751953, -1.1612979173660278, -1.1112749576568604, -1.0612521171569824, -1.011229157447815, -0.9612061977386475, -0.91118323802948, -0.8611602783203125, -0.811137318611145, -0.7611144185066223, -0.7110914587974548, -0.6610684990882874, -0.6110455989837646, -0.5610226392745972, -0.5109996795654297, -0.4609767198562622, -0.4109537899494171, -0.360930860042572, -0.31090790033340454, -0.26088494062423706, -0.21086201071739197, -0.16083908081054688, -0.1108161211013794, -0.06079317629337311, -0.010770231485366821, 0.039252713322639465, 0.08927565813064575, 0.13929861783981323, 0.18932154774665833, 0.23934447765350342, 0.2893674373626709, 0.3393903970718384, 0.38941332697868347, 0.43943625688552856, 0.48945921659469604, 0.5394821763038635, 0.5895050764083862, 0.6395280361175537, 0.6895509958267212, 0.7395739555358887, 0.7895969152450562, 0.8396198153495789, 0.8896427750587463, 0.9396657347679138, 0.9896886348724365, 1.039711594581604, 1.0897345542907715, 1.139757513999939, 1.1897804737091064, 1.239803433418274, 1.2898263931274414, 1.3398492336273193, 1.3898721933364868, 1.4398951530456543, 1.4899181127548218, 1.5399410724639893, 1.5899640321731567, 1.6399869918823242, 1.6900098323822021, 1.7400329113006592, 1.790055751800537, 1.8400787115097046, 1.890101671218872]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 7.0, 8.0, 8.0, 3.0, 6.0, 11.0, 17.0, 17.0, 27.0, 21.0, 32.0, 26.0, 35.0, 36.0, 46.0, 46.0, 40.0, 49.0, 50.0, 43.0, 39.0, 47.0, 42.0, 38.0, 34.0, 36.0, 35.0, 28.0, 25.0, 25.0, 22.0, 22.0, 18.0, 11.0, 8.0, 9.0, 9.0, 3.0, 5.0, 7.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1847440004348755, -1.1457836627960205, -1.1068233251571655, -1.0678629875183105, -1.028902530670166, -0.9899422526359558, -0.950981855392456, -0.9120215177536011, -0.8730611801147461, -0.8341008424758911, -0.7951405048370361, -0.7561801075935364, -0.7172197699546814, -0.6782594323158264, -0.6392990350723267, -0.6003386974334717, -0.5613783597946167, -0.5224180221557617, -0.48345765471458435, -0.444497287273407, -0.405536949634552, -0.366576611995697, -0.32761624455451965, -0.2886558771133423, -0.2496955394744873, -0.21073518693447113, -0.17177483439445496, -0.13281448185443878, -0.09385412931442261, -0.05489377677440643, -0.01593342423439026, 0.02302694320678711, 0.06198740005493164, 0.10094775259494781, 0.139908105134964, 0.17886845767498016, 0.21782881021499634, 0.2567891478538513, 0.2957495152950287, 0.33470988273620605, 0.37367022037506104, 0.412630558013916, 0.4515909254550934, 0.49055129289627075, 0.5295116305351257, 0.5684719681739807, 0.6074323654174805, 0.6463927030563354, 0.6853530406951904, 0.7243133783340454, 0.7632737159729004, 0.8022341132164001, 0.8411944508552551, 0.8801547884941101, 0.9191151857376099, 0.9580755233764648, 0.9970358610153198, 1.0359961986541748, 1.0749565362930298, 1.1139168739318848, 1.1528773307800293, 1.1918376684188843, 1.2307980060577393, 1.2697583436965942, 1.3087186813354492]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 12.0, 18.0, 20.0, 20.0, 32.0, 51.0, 64.0, 101.0, 188.0, 262.0, 429.0, 696.0, 1323.0, 2505.0, 5435.0, 12994.0, 38885.0, 153610.0, 564590.0, 1290797.0, 1299236.0, 591550.0, 163985.0, 42183.0, 13846.0, 5427.0, 2567.0, 1325.0, 760.0, 493.0, 291.0, 159.0, 122.0, 83.0, 68.0, 43.0, 36.0, 17.0, 11.0, 12.0, 5.0, 14.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.20556640625, -0.19871902465820312, -0.19187164306640625, -0.18502426147460938, -0.1781768798828125, -0.17132949829101562, -0.16448211669921875, -0.15763473510742188, -0.150787353515625, -0.14393997192382812, -0.13709259033203125, -0.13024520874023438, -0.1233978271484375, -0.11655044555664062, -0.10970306396484375, -0.10285568237304688, -0.09600830078125, -0.08916091918945312, -0.08231353759765625, -0.07546615600585938, -0.0686187744140625, -0.061771392822265625, -0.05492401123046875, -0.048076629638671875, -0.041229248046875, -0.034381866455078125, -0.02753448486328125, -0.020687103271484375, -0.0138397216796875, -0.006992340087890625, -0.00014495849609375, 0.006702423095703125, 0.0135498046875, 0.020397186279296875, 0.02724456787109375, 0.034091949462890625, 0.0409393310546875, 0.047786712646484375, 0.05463409423828125, 0.061481475830078125, 0.068328857421875, 0.07517623901367188, 0.08202362060546875, 0.08887100219726562, 0.0957183837890625, 0.10256576538085938, 0.10941314697265625, 0.11626052856445312, 0.12310791015625, 0.12995529174804688, 0.13680267333984375, 0.14365005493164062, 0.1504974365234375, 0.15734481811523438, 0.16419219970703125, 0.17103958129882812, 0.177886962890625, 0.18473434448242188, 0.19158172607421875, 0.19842910766601562, 0.2052764892578125, 0.21212387084960938, 0.21897125244140625, 0.22581863403320312, 0.232666015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 3.0, 2.0, 6.0, 9.0, 12.0, 11.0, 12.0, 14.0, 25.0, 17.0, 28.0, 28.0, 27.0, 33.0, 39.0, 33.0, 37.0, 41.0, 47.0, 52.0, 58.0, 48.0, 43.0, 56.0, 43.0, 39.0, 29.0, 38.0, 31.0, 21.0, 16.0, 18.0, 13.0, 14.0, 20.0, 13.0, 9.0, 3.0, 5.0, 4.0, 4.0, 0.0, 4.0, 3.0, 2.0, 1.0], "bins": [-0.2109375, -0.20542335510253906, -0.19990921020507812, -0.1943950653076172, -0.18888092041015625, -0.1833667755126953, -0.17785263061523438, -0.17233848571777344, -0.1668243408203125, -0.16131019592285156, -0.15579605102539062, -0.1502819061279297, -0.14476776123046875, -0.1392536163330078, -0.13373947143554688, -0.12822532653808594, -0.122711181640625, -0.11719703674316406, -0.11168289184570312, -0.10616874694824219, -0.10065460205078125, -0.09514045715332031, -0.08962631225585938, -0.08411216735839844, -0.0785980224609375, -0.07308387756347656, -0.06756973266601562, -0.06205558776855469, -0.05654144287109375, -0.05102729797363281, -0.045513153076171875, -0.03999900817871094, -0.03448486328125, -0.028970718383789062, -0.023456573486328125, -0.017942428588867188, -0.01242828369140625, -0.0069141387939453125, -0.001399993896484375, 0.0041141510009765625, 0.0096282958984375, 0.015142440795898438, 0.020656585693359375, 0.026170730590820312, 0.03168487548828125, 0.03719902038574219, 0.042713165283203125, 0.04822731018066406, 0.053741455078125, 0.05925559997558594, 0.06476974487304688, 0.07028388977050781, 0.07579803466796875, 0.08131217956542969, 0.08682632446289062, 0.09234046936035156, 0.0978546142578125, 0.10336875915527344, 0.10888290405273438, 0.11439704895019531, 0.11991119384765625, 0.1254253387451172, 0.13093948364257812, 0.13645362854003906, 0.1419677734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 10.0, 11.0, 14.0, 19.0, 26.0, 28.0, 48.0, 68.0, 92.0, 140.0, 221.0, 339.0, 573.0, 967.0, 1839.0, 3673.0, 8538.0, 22906.0, 76288.0, 339903.0, 1945198.0, 1456522.0, 245573.0, 58360.0, 18535.0, 7230.0, 3225.0, 1673.0, 879.0, 507.0, 288.0, 170.0, 131.0, 80.0, 47.0, 36.0, 27.0, 17.0, 15.0, 12.0, 12.0, 4.0, 5.0, 11.0, 2.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.25927734375, -0.2506065368652344, -0.24193572998046875, -0.23326492309570312, -0.2245941162109375, -0.21592330932617188, -0.20725250244140625, -0.19858169555664062, -0.189910888671875, -0.18124008178710938, -0.17256927490234375, -0.16389846801757812, -0.1552276611328125, -0.14655685424804688, -0.13788604736328125, -0.12921524047851562, -0.12054443359375, -0.11187362670898438, -0.10320281982421875, -0.09453201293945312, -0.0858612060546875, -0.07719039916992188, -0.06851959228515625, -0.059848785400390625, -0.051177978515625, -0.042507171630859375, -0.03383636474609375, -0.025165557861328125, -0.0164947509765625, -0.007823944091796875, 0.00084686279296875, 0.009517669677734375, 0.0181884765625, 0.026859283447265625, 0.03553009033203125, 0.044200897216796875, 0.0528717041015625, 0.061542510986328125, 0.07021331787109375, 0.07888412475585938, 0.087554931640625, 0.09622573852539062, 0.10489654541015625, 0.11356735229492188, 0.1222381591796875, 0.13090896606445312, 0.13957977294921875, 0.14825057983398438, 0.15692138671875, 0.16559219360351562, 0.17426300048828125, 0.18293380737304688, 0.1916046142578125, 0.20027542114257812, 0.20894622802734375, 0.21761703491210938, 0.226287841796875, 0.23495864868164062, 0.24362945556640625, 0.2523002624511719, 0.2609710693359375, 0.2696418762207031, 0.27831268310546875, 0.2869834899902344, 0.295654296875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 11.0, 29.0, 27.0, 33.0, 57.0, 66.0, 109.0, 132.0, 186.0, 253.0, 299.0, 398.0, 489.0, 431.0, 424.0, 305.0, 225.0, 157.0, 113.0, 87.0, 50.0, 43.0, 43.0, 15.0, 14.0, 14.0, 5.0, 9.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.37744140625, -0.36594390869140625, -0.3544464111328125, -0.34294891357421875, -0.331451416015625, -0.31995391845703125, -0.3084564208984375, -0.29695892333984375, -0.28546142578125, -0.27396392822265625, -0.2624664306640625, -0.25096893310546875, -0.239471435546875, -0.22797393798828125, -0.2164764404296875, -0.20497894287109375, -0.1934814453125, -0.18198394775390625, -0.1704864501953125, -0.15898895263671875, -0.147491455078125, -0.13599395751953125, -0.1244964599609375, -0.11299896240234375, -0.10150146484375, -0.09000396728515625, -0.0785064697265625, -0.06700897216796875, -0.055511474609375, -0.04401397705078125, -0.0325164794921875, -0.02101898193359375, -0.009521484375, 0.00197601318359375, 0.0134735107421875, 0.02497100830078125, 0.036468505859375, 0.04796600341796875, 0.0594635009765625, 0.07096099853515625, 0.08245849609375, 0.09395599365234375, 0.1054534912109375, 0.11695098876953125, 0.128448486328125, 0.13994598388671875, 0.1514434814453125, 0.16294097900390625, 0.1744384765625, 0.18593597412109375, 0.1974334716796875, 0.20893096923828125, 0.220428466796875, 0.23192596435546875, 0.2434234619140625, 0.25492095947265625, 0.26641845703125, 0.27791595458984375, 0.2894134521484375, 0.30091094970703125, 0.312408447265625, 0.32390594482421875, 0.3354034423828125, 0.34690093994140625, 0.3583984375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 11.0, 6.0, 11.0, 8.0, 14.0, 23.0, 35.0, 51.0, 59.0, 77.0, 93.0, 98.0, 118.0, 74.0, 88.0, 63.0, 37.0, 33.0, 27.0, 16.0, 15.0, 8.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3598837852478027, -2.264758586883545, -2.169633388519287, -2.0745081901550293, -1.9793829917907715, -1.8842577934265137, -1.7891327142715454, -1.6940075159072876, -1.5988823175430298, -1.503757119178772, -1.4086319208145142, -1.313506841659546, -1.218381643295288, -1.1232564449310303, -1.0281312465667725, -0.9330060482025146, -0.8378808498382568, -0.742755651473999, -0.6476304531097412, -0.5525053143501282, -0.45738011598587036, -0.36225491762161255, -0.2671297788619995, -0.1720045804977417, -0.07687938213348389, 0.018245801329612732, 0.11337098479270935, 0.20849615335464478, 0.3036213517189026, 0.3987465500831604, 0.49387168884277344, 0.5889968872070312, 0.68412184715271, 0.7792470455169678, 0.8743722438812256, 0.9694973826408386, 1.0646226406097412, 1.159747838973999, 1.2548729181289673, 1.349998116493225, 1.445123314857483, 1.5402485132217407, 1.6353737115859985, 1.7304987907409668, 1.8256239891052246, 1.9207491874694824, 2.0158743858337402, 2.110999584197998, 2.206124782562256, 2.3012499809265137, 2.3963751792907715, 2.4915003776550293, 2.586625576019287, 2.681750774383545, 2.7768759727478027, 2.8720011711120605, 2.9671263694763184, 3.062251567840576, 3.157376766204834, 3.252501964569092, 3.3476271629333496, 3.4427523612976074, 3.5378775596618652, 3.633002758026123, 3.7281277179718018]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 3.0, 8.0, 4.0, 11.0, 10.0, 18.0, 7.0, 12.0, 27.0, 24.0, 29.0, 26.0, 35.0, 42.0, 42.0, 38.0, 47.0, 45.0, 51.0, 53.0, 48.0, 50.0, 57.0, 41.0, 51.0, 33.0, 36.0, 22.0, 27.0, 25.0, 14.0, 17.0, 11.0, 9.0, 12.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5655415058135986, -1.5129655599594116, -1.4603896141052246, -1.407813549041748, -1.355237603187561, -1.302661657333374, -1.250085711479187, -1.197509765625, -1.1449337005615234, -1.0923577547073364, -1.0397818088531494, -0.9872058033943176, -0.9346297979354858, -0.8820538520812988, -0.8294779062271118, -0.7769019603729248, -0.7243260145187378, -0.6717500686645508, -0.619174063205719, -0.566598117351532, -0.5140221118927002, -0.4614461660385132, -0.40887022018432617, -0.3562942445278168, -0.3037182688713074, -0.251142293214798, -0.19856633245944977, -0.14599037170410156, -0.09341439604759216, -0.040838420391082764, 0.011737525463104248, 0.06431350111961365, 0.11688947677612305, 0.16946545243263245, 0.22204141318798065, 0.27461737394332886, 0.32719334959983826, 0.37976932525634766, 0.43234527111053467, 0.48492124676704407, 0.5374972224235535, 0.5900731682777405, 0.6426491737365723, 0.6952251195907593, 0.7478010654449463, 0.8003770709037781, 0.8529530167579651, 0.9055290222167969, 0.9581049680709839, 1.010680913925171, 1.063256859779358, 1.115832805633545, 1.1684088706970215, 1.2209848165512085, 1.2735607624053955, 1.3261367082595825, 1.3787126541137695, 1.4312885999679565, 1.4838645458221436, 1.5364406108856201, 1.5890165567398071, 1.6415925025939941, 1.6941684484481812, 1.7467443943023682, 1.7993204593658447]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 7.0, 4.0, 5.0, 13.0, 18.0, 10.0, 21.0, 36.0, 35.0, 72.0, 89.0, 150.0, 246.0, 365.0, 693.0, 1128.0, 2159.0, 4287.0, 9098.0, 21746.0, 62326.0, 215610.0, 451638.0, 187239.0, 54972.0, 19466.0, 8263.0, 4023.0, 2075.0, 1092.0, 593.0, 392.0, 243.0, 126.0, 99.0, 59.0, 52.0, 25.0, 17.0, 23.0, 7.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.1917724609375, -0.1862049102783203, -0.18063735961914062, -0.17506980895996094, -0.16950225830078125, -0.16393470764160156, -0.15836715698242188, -0.1527996063232422, -0.1472320556640625, -0.1416645050048828, -0.13609695434570312, -0.13052940368652344, -0.12496185302734375, -0.11939430236816406, -0.11382675170898438, -0.10825920104980469, -0.102691650390625, -0.09712409973144531, -0.09155654907226562, -0.08598899841308594, -0.08042144775390625, -0.07485389709472656, -0.06928634643554688, -0.06371879577636719, -0.0581512451171875, -0.05258369445800781, -0.047016143798828125, -0.04144859313964844, -0.03588104248046875, -0.030313491821289062, -0.024745941162109375, -0.019178390502929688, -0.01361083984375, -0.008043289184570312, -0.002475738525390625, 0.0030918121337890625, 0.00865936279296875, 0.014226913452148438, 0.019794464111328125, 0.025362014770507812, 0.0309295654296875, 0.03649711608886719, 0.042064666748046875, 0.04763221740722656, 0.05319976806640625, 0.05876731872558594, 0.06433486938476562, 0.06990242004394531, 0.075469970703125, 0.08103752136230469, 0.08660507202148438, 0.09217262268066406, 0.09774017333984375, 0.10330772399902344, 0.10887527465820312, 0.11444282531738281, 0.1200103759765625, 0.1255779266357422, 0.13114547729492188, 0.13671302795410156, 0.14228057861328125, 0.14784812927246094, 0.15341567993164062, 0.1589832305908203, 0.16455078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0, 5.0, 2.0, 7.0, 6.0, 4.0, 14.0, 9.0, 10.0, 12.0, 15.0, 22.0, 28.0, 26.0, 28.0, 29.0, 47.0, 43.0, 36.0, 44.0, 46.0, 52.0, 49.0, 50.0, 44.0, 36.0, 45.0, 48.0, 25.0, 31.0, 41.0, 21.0, 21.0, 23.0, 20.0, 16.0, 13.0, 6.0, 6.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.236083984375, -0.2289867401123047, -0.22188949584960938, -0.21479225158691406, -0.20769500732421875, -0.20059776306152344, -0.19350051879882812, -0.1864032745361328, -0.1793060302734375, -0.1722087860107422, -0.16511154174804688, -0.15801429748535156, -0.15091705322265625, -0.14381980895996094, -0.13672256469726562, -0.1296253204345703, -0.122528076171875, -0.11543083190917969, -0.10833358764648438, -0.10123634338378906, -0.09413909912109375, -0.08704185485839844, -0.07994461059570312, -0.07284736633300781, -0.0657501220703125, -0.05865287780761719, -0.051555633544921875, -0.04445838928222656, -0.03736114501953125, -0.030263900756835938, -0.023166656494140625, -0.016069412231445312, -0.00897216796875, -0.0018749237060546875, 0.005222320556640625, 0.012319564819335938, 0.01941680908203125, 0.026514053344726562, 0.033611297607421875, 0.04070854187011719, 0.0478057861328125, 0.05490303039550781, 0.062000274658203125, 0.06909751892089844, 0.07619476318359375, 0.08329200744628906, 0.09038925170898438, 0.09748649597167969, 0.104583740234375, 0.11168098449707031, 0.11877822875976562, 0.12587547302246094, 0.13297271728515625, 0.14006996154785156, 0.14716720581054688, 0.1542644500732422, 0.1613616943359375, 0.1684589385986328, 0.17555618286132812, 0.18265342712402344, 0.18975067138671875, 0.19684791564941406, 0.20394515991210938, 0.2110424041748047, 0.2181396484375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 11.0, 29.0, 40.0, 77.0, 111.0, 179.0, 323.0, 524.0, 1100.0, 2047.0, 4397.0, 10465.0, 28117.0, 94501.0, 495870.0, 302655.0, 69636.0, 22236.0, 8556.0, 3731.0, 1927.0, 820.0, 490.0, 280.0, 175.0, 90.0, 47.0, 37.0, 24.0, 23.0, 8.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1502685546875, -0.1448802947998047, -0.13949203491210938, -0.13410377502441406, -0.12871551513671875, -0.12332725524902344, -0.11793899536132812, -0.11255073547363281, -0.1071624755859375, -0.10177421569824219, -0.09638595581054688, -0.09099769592285156, -0.08560943603515625, -0.08022117614746094, -0.07483291625976562, -0.06944465637207031, -0.064056396484375, -0.05866813659667969, -0.053279876708984375, -0.04789161682128906, -0.04250335693359375, -0.03711509704589844, -0.031726837158203125, -0.026338577270507812, -0.0209503173828125, -0.015562057495117188, -0.010173797607421875, -0.0047855377197265625, 0.00060272216796875, 0.0059909820556640625, 0.011379241943359375, 0.016767501831054688, 0.02215576171875, 0.027544021606445312, 0.032932281494140625, 0.03832054138183594, 0.04370880126953125, 0.04909706115722656, 0.054485321044921875, 0.05987358093261719, 0.0652618408203125, 0.07065010070800781, 0.07603836059570312, 0.08142662048339844, 0.08681488037109375, 0.09220314025878906, 0.09759140014648438, 0.10297966003417969, 0.108367919921875, 0.11375617980957031, 0.11914443969726562, 0.12453269958496094, 0.12992095947265625, 0.13530921936035156, 0.14069747924804688, 0.1460857391357422, 0.1514739990234375, 0.1568622589111328, 0.16225051879882812, 0.16763877868652344, 0.17302703857421875, 0.17841529846191406, 0.18380355834960938, 0.1891918182373047, 0.194580078125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 6.0, 7.0, 6.0, 4.0, 13.0, 20.0, 21.0, 14.0, 20.0, 28.0, 33.0, 36.0, 49.0, 37.0, 57.0, 63.0, 61.0, 56.0, 56.0, 61.0, 61.0, 52.0, 36.0, 39.0, 36.0, 20.0, 14.0, 23.0, 20.0, 10.0, 10.0, 7.0, 8.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.591796875, -0.5739669799804688, -0.5561370849609375, -0.5383071899414062, -0.520477294921875, -0.5026473999023438, -0.4848175048828125, -0.46698760986328125, -0.44915771484375, -0.43132781982421875, -0.4134979248046875, -0.39566802978515625, -0.377838134765625, -0.36000823974609375, -0.3421783447265625, -0.32434844970703125, -0.3065185546875, -0.28868865966796875, -0.2708587646484375, -0.25302886962890625, -0.235198974609375, -0.21736907958984375, -0.1995391845703125, -0.18170928955078125, -0.16387939453125, -0.14604949951171875, -0.1282196044921875, -0.11038970947265625, -0.092559814453125, -0.07472991943359375, -0.0569000244140625, -0.03907012939453125, -0.021240234375, -0.00341033935546875, 0.0144195556640625, 0.03224945068359375, 0.050079345703125, 0.06790924072265625, 0.0857391357421875, 0.10356903076171875, 0.12139892578125, 0.13922882080078125, 0.1570587158203125, 0.17488861083984375, 0.192718505859375, 0.21054840087890625, 0.2283782958984375, 0.24620819091796875, 0.2640380859375, 0.28186798095703125, 0.2996978759765625, 0.31752777099609375, 0.335357666015625, 0.35318756103515625, 0.3710174560546875, 0.38884735107421875, 0.40667724609375, 0.42450714111328125, 0.4423370361328125, 0.46016693115234375, 0.477996826171875, 0.49582672119140625, 0.5136566162109375, 0.5314865112304688, 0.54931640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 6.0, 6.0, 9.0, 7.0, 9.0, 21.0, 39.0, 56.0, 88.0, 138.0, 198.0, 273.0, 467.0, 1003.0, 2062.0, 6354.0, 32073.0, 320239.0, 621347.0, 50305.0, 8706.0, 2514.0, 1015.0, 576.0, 344.0, 213.0, 141.0, 98.0, 59.0, 66.0, 35.0, 31.0, 15.0, 11.0, 10.0, 5.0, 2.0, 1.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0], "bins": [-0.0882568359375, -0.08566951751708984, -0.08308219909667969, -0.08049488067626953, -0.07790756225585938, -0.07532024383544922, -0.07273292541503906, -0.0701456069946289, -0.06755828857421875, -0.0649709701538086, -0.06238365173339844, -0.05979633331298828, -0.057209014892578125, -0.05462169647216797, -0.05203437805175781, -0.049447059631347656, -0.0468597412109375, -0.044272422790527344, -0.04168510437011719, -0.03909778594970703, -0.036510467529296875, -0.03392314910888672, -0.03133583068847656, -0.028748512268066406, -0.02616119384765625, -0.023573875427246094, -0.020986557006835938, -0.01839923858642578, -0.015811920166015625, -0.013224601745605469, -0.010637283325195312, -0.008049964904785156, -0.005462646484375, -0.0028753280639648438, -0.0002880096435546875, 0.0022993087768554688, 0.004886627197265625, 0.007473945617675781, 0.010061264038085938, 0.012648582458496094, 0.01523590087890625, 0.017823219299316406, 0.020410537719726562, 0.02299785614013672, 0.025585174560546875, 0.02817249298095703, 0.030759811401367188, 0.033347129821777344, 0.0359344482421875, 0.038521766662597656, 0.04110908508300781, 0.04369640350341797, 0.046283721923828125, 0.04887104034423828, 0.05145835876464844, 0.054045677185058594, 0.05663299560546875, 0.059220314025878906, 0.06180763244628906, 0.06439495086669922, 0.06698226928710938, 0.06956958770751953, 0.07215690612792969, 0.07474422454833984, 0.07733154296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 7.0, 2.0, 8.0, 7.0, 18.0, 20.0, 21.0, 25.0, 35.0, 38.0, 54.0, 67.0, 86.0, 105.0, 95.0, 101.0, 61.0, 75.0, 35.0, 48.0, 23.0, 20.0, 13.0, 7.0, 3.0, 7.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.378225326538086e-05, -2.3214146494865417e-05, -2.2646039724349976e-05, -2.2077932953834534e-05, -2.1509826183319092e-05, -2.094171941280365e-05, -2.0373612642288208e-05, -1.9805505871772766e-05, -1.9237399101257324e-05, -1.8669292330741882e-05, -1.810118556022644e-05, -1.7533078789711e-05, -1.6964972019195557e-05, -1.6396865248680115e-05, -1.5828758478164673e-05, -1.526065170764923e-05, -1.4692544937133789e-05, -1.4124438166618347e-05, -1.3556331396102905e-05, -1.2988224625587463e-05, -1.2420117855072021e-05, -1.185201108455658e-05, -1.1283904314041138e-05, -1.0715797543525696e-05, -1.0147690773010254e-05, -9.579584002494812e-06, -9.01147723197937e-06, -8.443370461463928e-06, -7.875263690948486e-06, -7.3071569204330444e-06, -6.7390501499176025e-06, -6.170943379402161e-06, -5.602836608886719e-06, -5.034729838371277e-06, -4.466623067855835e-06, -3.898516297340393e-06, -3.330409526824951e-06, -2.7623027563095093e-06, -2.1941959857940674e-06, -1.6260892152786255e-06, -1.0579824447631836e-06, -4.898756742477417e-07, 7.82310962677002e-08, 6.463378667831421e-07, 1.214444637298584e-06, 1.7825514078140259e-06, 2.3506581783294678e-06, 2.9187649488449097e-06, 3.4868717193603516e-06, 4.0549784898757935e-06, 4.623085260391235e-06, 5.191192030906677e-06, 5.759298801422119e-06, 6.327405571937561e-06, 6.895512342453003e-06, 7.463619112968445e-06, 8.031725883483887e-06, 8.599832653999329e-06, 9.16793942451477e-06, 9.736046195030212e-06, 1.0304152965545654e-05, 1.0872259736061096e-05, 1.1440366506576538e-05, 1.200847327709198e-05, 1.2576580047607422e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 5.0, 9.0, 7.0, 6.0, 5.0, 7.0, 13.0, 16.0, 14.0, 47.0, 23.0, 38.0, 82.0, 129.0, 211.0, 586.0, 1487.0, 5935.0, 38013.0, 677040.0, 295976.0, 22384.0, 4304.0, 1207.0, 450.0, 184.0, 132.0, 81.0, 42.0, 39.0, 19.0, 21.0, 11.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1385498046875, -0.1346874237060547, -0.13082504272460938, -0.12696266174316406, -0.12310028076171875, -0.11923789978027344, -0.11537551879882812, -0.11151313781738281, -0.1076507568359375, -0.10378837585449219, -0.09992599487304688, -0.09606361389160156, -0.09220123291015625, -0.08833885192871094, -0.08447647094726562, -0.08061408996582031, -0.076751708984375, -0.07288932800292969, -0.06902694702148438, -0.06516456604003906, -0.06130218505859375, -0.05743980407714844, -0.053577423095703125, -0.04971504211425781, -0.0458526611328125, -0.04199028015136719, -0.038127899169921875, -0.03426551818847656, -0.03040313720703125, -0.026540756225585938, -0.022678375244140625, -0.018815994262695312, -0.01495361328125, -0.011091232299804688, -0.007228851318359375, -0.0033664703369140625, 0.00049591064453125, 0.0043582916259765625, 0.008220672607421875, 0.012083053588867188, 0.0159454345703125, 0.019807815551757812, 0.023670196533203125, 0.027532577514648438, 0.03139495849609375, 0.03525733947753906, 0.039119720458984375, 0.04298210144042969, 0.046844482421875, 0.05070686340332031, 0.054569244384765625, 0.05843162536621094, 0.06229400634765625, 0.06615638732910156, 0.07001876831054688, 0.07388114929199219, 0.0777435302734375, 0.08160591125488281, 0.08546829223632812, 0.08933067321777344, 0.09319305419921875, 0.09705543518066406, 0.10091781616210938, 0.10478019714355469, 0.108642578125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 16.0, 20.0, 39.0, 70.0, 111.0, 204.0, 217.0, 157.0, 78.0, 39.0, 24.0, 10.0, 8.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.250244140625, -0.2438678741455078, -0.23749160766601562, -0.23111534118652344, -0.22473907470703125, -0.21836280822753906, -0.21198654174804688, -0.2056102752685547, -0.1992340087890625, -0.1928577423095703, -0.18648147583007812, -0.18010520935058594, -0.17372894287109375, -0.16735267639160156, -0.16097640991210938, -0.1546001434326172, -0.148223876953125, -0.1418476104736328, -0.13547134399414062, -0.12909507751464844, -0.12271881103515625, -0.11634254455566406, -0.10996627807617188, -0.10359001159667969, -0.0972137451171875, -0.09083747863769531, -0.08446121215820312, -0.07808494567871094, -0.07170867919921875, -0.06533241271972656, -0.058956146240234375, -0.05257987976074219, -0.04620361328125, -0.03982734680175781, -0.033451080322265625, -0.027074813842773438, -0.02069854736328125, -0.014322280883789062, -0.007946014404296875, -0.0015697479248046875, 0.0048065185546875, 0.011182785034179688, 0.017559051513671875, 0.023935317993164062, 0.03031158447265625, 0.03668785095214844, 0.043064117431640625, 0.04944038391113281, 0.055816650390625, 0.06219291687011719, 0.06856918334960938, 0.07494544982910156, 0.08132171630859375, 0.08769798278808594, 0.09407424926757812, 0.10045051574707031, 0.1068267822265625, 0.11320304870605469, 0.11957931518554688, 0.12595558166503906, 0.13233184814453125, 0.13870811462402344, 0.14508438110351562, 0.1514606475830078, 0.1578369140625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 11.0, 17.0, 43.0, 79.0, 148.0, 222.0, 222.0, 124.0, 67.0, 32.0, 13.0, 5.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.477720260620117, -3.3858680725097656, -3.294015884399414, -3.2021634578704834, -3.110311269760132, -3.0184590816497803, -2.9266068935394287, -2.834754467010498, -2.7429022789001465, -2.651050090789795, -2.5591979026794434, -2.4673454761505127, -2.375493288040161, -2.2836410999298096, -2.191788911819458, -2.0999364852905273, -2.008084297180176, -1.9162321090698242, -1.824379801750183, -1.7325276136398315, -1.6406753063201904, -1.5488231182098389, -1.4569709300994873, -1.3651186227798462, -1.2732665538787842, -1.1814143657684326, -1.0895620584487915, -0.9977098703384399, -0.9058575630187988, -0.8140053749084473, -0.7221531271934509, -0.6303008794784546, -0.5384485721588135, -0.44659632444381714, -0.3547440767288208, -0.26289185881614685, -0.1710396111011505, -0.07918736338615417, 0.012664854526519775, 0.10451710224151611, 0.19636934995651245, 0.2882215976715088, 0.3800738453865051, 0.4719260632991791, 0.563778281211853, 0.6556305885314941, 0.7474827766418457, 0.839335024356842, 0.9311872720718384, 1.02303946018219, 1.114891767501831, 1.2067439556121826, 1.2985962629318237, 1.3904484510421753, 1.4823007583618164, 1.574152946472168, 1.6660051345825195, 1.757857322692871, 1.8497096300125122, 1.9415618181228638, 2.033414125442505, 2.1252663135528564, 2.217118501663208, 2.3089709281921387, 2.4008231163024902]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 6.0, 7.0, 14.0, 16.0, 24.0, 21.0, 30.0, 40.0, 45.0, 57.0, 65.0, 89.0, 88.0, 85.0, 70.0, 58.0, 54.0, 43.0, 42.0, 38.0, 36.0, 20.0, 12.0, 15.0, 8.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.714712619781494, -2.6513795852661133, -2.5880467891693115, -2.5247137546539307, -2.46138072013855, -2.398047924041748, -2.334714889526367, -2.2713818550109863, -2.2080490589141846, -2.1447160243988037, -2.081383228302002, -2.018050193786621, -1.9547172784805298, -1.8913843631744385, -1.8280513286590576, -1.7647184133529663, -1.7013853788375854, -1.6380524635314941, -1.5747194290161133, -1.511386513710022, -1.4480535984039307, -1.3847205638885498, -1.3213876485824585, -1.2580547332763672, -1.1947216987609863, -1.131388783454895, -1.0680557489395142, -1.0047228336334229, -0.9413899183273315, -0.8780569434165955, -0.8147239685058594, -0.7513910531997681, -0.6880581378936768, -0.6247251629829407, -0.5613922476768494, -0.4980592727661133, -0.4347263276576996, -0.3713933825492859, -0.3080604076385498, -0.2447274625301361, -0.1813945174217224, -0.11806156486272812, -0.054728612303733826, 0.008604347705841064, 0.07193729281425476, 0.13527023792266846, 0.19860321283340454, 0.26193615794181824, 0.32526910305023193, 0.38860204815864563, 0.4519349932670593, 0.5152679681777954, 0.5786008834838867, 0.6419338583946228, 0.7052668333053589, 0.7685997486114502, 0.8319327235221863, 0.8952656984329224, 0.9585986137390137, 1.0219316482543945, 1.0852645635604858, 1.1485974788665771, 1.211930513381958, 1.2752634286880493, 1.3385963439941406]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 3.0, 6.0, 4.0, 5.0, 7.0, 6.0, 10.0, 8.0, 10.0, 12.0, 15.0, 14.0, 22.0, 17.0, 30.0, 16.0, 35.0, 35.0, 92.0, 191.0, 157.0, 72.0, 27.0, 18.0, 27.0, 27.0, 16.0, 18.0, 11.0, 9.0, 11.0, 11.0, 14.0, 10.0, 4.0, 10.0, 3.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.2230224609375, -0.21643447875976562, -0.20984649658203125, -0.20325851440429688, -0.1966705322265625, -0.19008255004882812, -0.18349456787109375, -0.17690658569335938, -0.170318603515625, -0.16373062133789062, -0.15714263916015625, -0.15055465698242188, -0.1439666748046875, -0.13737869262695312, -0.13079071044921875, -0.12420272827148438, -0.11761474609375, -0.11102676391601562, -0.10443878173828125, -0.09785079956054688, -0.0912628173828125, -0.08467483520507812, -0.07808685302734375, -0.07149887084960938, -0.064910888671875, -0.058322906494140625, -0.05173492431640625, -0.045146942138671875, -0.0385589599609375, -0.031970977783203125, -0.02538299560546875, -0.018795013427734375, -0.01220703125, -0.005619049072265625, 0.00096893310546875, 0.007556915283203125, 0.0141448974609375, 0.020732879638671875, 0.02732086181640625, 0.033908843994140625, 0.040496826171875, 0.047084808349609375, 0.05367279052734375, 0.060260772705078125, 0.0668487548828125, 0.07343673706054688, 0.08002471923828125, 0.08661270141601562, 0.09320068359375, 0.09978866577148438, 0.10637664794921875, 0.11296463012695312, 0.1195526123046875, 0.12614059448242188, 0.13272857666015625, 0.13931655883789062, 0.145904541015625, 0.15249252319335938, 0.15908050537109375, 0.16566848754882812, 0.1722564697265625, 0.17884445190429688, 0.18543243408203125, 0.19202041625976562, 0.1986083984375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 2.0, 8.0, 16.0, 16.0, 19.0, 26.0, 49.0, 59.0, 81.0, 147.0, 215.0, 363.0, 602.0, 1141.0, 2242.0, 4579.0, 11547.0, 55247.0, 8212708.0, 75528.0, 13056.0, 5231.0, 2410.0, 1370.0, 664.0, 433.0, 272.0, 177.0, 109.0, 76.0, 51.0, 31.0, 23.0, 27.0, 19.0, 8.0, 7.0, 9.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.6615508198738098, -0.6412308812141418, -0.6209110021591187, -0.6005910634994507, -0.5802711248397827, -0.5599511861801147, -0.5396313071250916, -0.5193113684654236, -0.498991459608078, -0.4786715507507324, -0.45835161209106445, -0.43803170323371887, -0.4177117943763733, -0.3973918557167053, -0.37707194685935974, -0.35675203800201416, -0.3364320993423462, -0.3161121904850006, -0.29579225182533264, -0.27547234296798706, -0.2551524043083191, -0.2348324954509735, -0.21451258659362793, -0.19419266283512115, -0.17387273907661438, -0.1535528153181076, -0.13323289155960083, -0.11291298270225525, -0.09259305894374847, -0.0722731351852417, -0.05195321887731552, -0.03163330256938934, -0.011313438415527344, 0.009006481617689133, 0.02932640165090561, 0.049646321684122086, 0.06996624171733856, 0.09028616547584534, 0.11060608178377151, 0.1309259980916977, 0.15124592185020447, 0.17156584560871124, 0.19188576936721802, 0.2122056782245636, 0.23252560198307037, 0.25284552574157715, 0.27316543459892273, 0.2934853434562683, 0.3138052821159363, 0.33412519097328186, 0.35444512963294983, 0.3747650384902954, 0.3950849771499634, 0.41540488600730896, 0.43572479486465454, 0.4560447335243225, 0.4763646423816681, 0.49668455123901367, 0.5170044898986816, 0.5373244285583496, 0.5576443076133728, 0.5779642462730408, 0.5982841849327087, 0.6186040639877319, 0.6389240026473999]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 3.0, 4.0, 2.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 6.0, 1.0, 8.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.0519682168960571, -1.0217103958129883, -0.9914525747299194, -0.9611947536468506, -0.930936872959137, -0.9006790518760681, -0.8704212307929993, -0.8401634097099304, -0.8099055886268616, -0.7796477675437927, -0.7493899464607239, -0.7191320657730103, -0.6888742446899414, -0.6586164236068726, -0.6283586025238037, -0.5981007814407349, -0.567842960357666, -0.5375851392745972, -0.5073273181915283, -0.4770694673061371, -0.44681164622306824, -0.416553795337677, -0.38629597425460815, -0.3560381531715393, -0.3257802724838257, -0.29552245140075684, -0.2652646005153656, -0.23500677943229675, -0.2047489583492279, -0.17449112236499786, -0.14423328638076782, -0.11397546529769897, -0.08371764421463013, -0.05345981568098068, -0.02320198342204094, 0.007055848836898804, 0.03731367737054825, 0.06757150590419769, 0.09782934188842773, 0.12808716297149658, 0.15834499895572662, 0.18860283493995667, 0.2188606560230255, 0.24911849200725555, 0.2793763279914856, 0.30963414907455444, 0.3398919701576233, 0.37014979124069214, 0.4004076421260834, 0.4306654632091522, 0.46092331409454346, 0.4911811351776123, 0.5214389562606812, 0.55169677734375, 0.5819545984268188, 0.6122124195098877, 0.6424703001976013, 0.6727281212806702, 0.702985942363739, 0.7332438230514526, 0.7635016441345215, 0.7937594652175903, 0.8240172863006592, 0.854275107383728, 0.8845329284667969]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 7.0, 7.0, 19.0, 12.0, 17.0, 33.0, 71.0, 56.0, 79.0, 99.0, 79.0, 84.0, 97.0, 74.0, 63.0, 59.0, 31.0, 31.0, 33.0, 18.0, 11.0, 2.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1629638671875, -0.1569957733154297, -0.15102767944335938, -0.14505958557128906, -0.13909149169921875, -0.13312339782714844, -0.12715530395507812, -0.12118721008300781, -0.1152191162109375, -0.10925102233886719, -0.10328292846679688, -0.09731483459472656, -0.09134674072265625, -0.08537864685058594, -0.07941055297851562, -0.07344245910644531, -0.067474365234375, -0.06150627136230469, -0.055538177490234375, -0.04957008361816406, -0.04360198974609375, -0.03763389587402344, -0.031665802001953125, -0.025697708129882812, -0.0197296142578125, -0.013761520385742188, -0.007793426513671875, -0.0018253326416015625, 0.00414276123046875, 0.010110855102539062, 0.016078948974609375, 0.022047042846679688, 0.02801513671875, 0.03398323059082031, 0.039951324462890625, 0.04591941833496094, 0.05188751220703125, 0.05785560607910156, 0.06382369995117188, 0.06979179382324219, 0.0757598876953125, 0.08172798156738281, 0.08769607543945312, 0.09366416931152344, 0.09963226318359375, 0.10560035705566406, 0.11156845092773438, 0.11753654479980469, 0.123504638671875, 0.1294727325439453, 0.13544082641601562, 0.14140892028808594, 0.14737701416015625, 0.15334510803222656, 0.15931320190429688, 0.1652812957763672, 0.1712493896484375, 0.1772174835205078, 0.18318557739257812, 0.18915367126464844, 0.19512176513671875, 0.20108985900878906, 0.20705795288085938, 0.2130260467529297, 0.218994140625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 6.0, 7.0, 11.0, 17.0, 21.0, 39.0, 35.0, 91.0, 140.0, 219.0, 351.0, 680.0, 1330.0, 2831.0, 6495.0, 18425.0, 74760.0, 270853.0, 109257.0, 24055.0, 8040.0, 3237.0, 1524.0, 741.0, 436.0, 257.0, 132.0, 103.0, 56.0, 37.0, 26.0, 12.0, 13.0, 7.0, 3.0, 4.0, 1.0, 4.0, 6.0, 1.0, 1.0, 2.0], "bins": [-3.919921875, -3.820953369140625, -3.72198486328125, -3.623016357421875, -3.5240478515625, -3.425079345703125, -3.32611083984375, -3.227142333984375, -3.128173828125, -3.029205322265625, -2.93023681640625, -2.831268310546875, -2.7322998046875, -2.633331298828125, -2.53436279296875, -2.435394287109375, -2.33642578125, -2.237457275390625, -2.13848876953125, -2.039520263671875, -1.9405517578125, -1.841583251953125, -1.74261474609375, -1.643646240234375, -1.544677734375, -1.445709228515625, -1.34674072265625, -1.247772216796875, -1.1488037109375, -1.049835205078125, -0.95086669921875, -0.851898193359375, -0.7529296875, -0.653961181640625, -0.55499267578125, -0.456024169921875, -0.3570556640625, -0.258087158203125, -0.15911865234375, -0.060150146484375, 0.038818359375, 0.137786865234375, 0.23675537109375, 0.335723876953125, 0.4346923828125, 0.533660888671875, 0.63262939453125, 0.731597900390625, 0.83056640625, 0.929534912109375, 1.02850341796875, 1.127471923828125, 1.2264404296875, 1.325408935546875, 1.42437744140625, 1.523345947265625, 1.622314453125, 1.721282958984375, 1.82025146484375, 1.919219970703125, 2.0181884765625, 2.117156982421875, 2.21612548828125, 2.315093994140625, 2.4140625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 13.0, 5.0, 15.0, 17.0, 21.0, 30.0, 31.0, 31.0, 44.0, 43.0, 67.0, 66.0, 56.0, 58.0, 66.0, 59.0, 64.0, 53.0, 44.0, 36.0, 42.0, 25.0, 9.0, 20.0, 23.0, 11.0, 9.0, 9.0, 11.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2998046875, -0.2915973663330078, -0.2833900451660156, -0.27518272399902344, -0.26697540283203125, -0.25876808166503906, -0.2505607604980469, -0.2423534393310547, -0.2341461181640625, -0.2259387969970703, -0.21773147583007812, -0.20952415466308594, -0.20131683349609375, -0.19310951232910156, -0.18490219116210938, -0.1766948699951172, -0.168487548828125, -0.1602802276611328, -0.15207290649414062, -0.14386558532714844, -0.13565826416015625, -0.12745094299316406, -0.11924362182617188, -0.11103630065917969, -0.1028289794921875, -0.09462165832519531, -0.08641433715820312, -0.07820701599121094, -0.06999969482421875, -0.06179237365722656, -0.053585052490234375, -0.04537773132324219, -0.03717041015625, -0.028963088989257812, -0.020755767822265625, -0.012548446655273438, -0.00434112548828125, 0.0038661956787109375, 0.012073516845703125, 0.020280838012695312, 0.0284881591796875, 0.03669548034667969, 0.044902801513671875, 0.05311012268066406, 0.06131744384765625, 0.06952476501464844, 0.07773208618164062, 0.08593940734863281, 0.094146728515625, 0.10235404968261719, 0.11056137084960938, 0.11876869201660156, 0.12697601318359375, 0.13518333435058594, 0.14339065551757812, 0.1515979766845703, 0.1598052978515625, 0.1680126190185547, 0.17621994018554688, 0.18442726135253906, 0.19263458251953125, 0.20084190368652344, 0.20904922485351562, 0.2172565460205078, 0.2254638671875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 4.0, 11.0, 8.0, 16.0, 30.0, 37.0, 61.0, 73.0, 72.0, 57.0, 25.0, 16.0, 24.0, 4.0, 7.0, 10.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.073624610900879, -1.0435541868209839, -1.0134837627410889, -0.9834133386611938, -0.9533429145812988, -0.9232724905014038, -0.8932020664215088, -0.8631316423416138, -0.8330612182617188, -0.8029907941818237, -0.7729203701019287, -0.7428499460220337, -0.7127795219421387, -0.6827090978622437, -0.6526386737823486, -0.6225682497024536, -0.5924977660179138, -0.5624273419380188, -0.5323569178581238, -0.5022864937782288, -0.47221606969833374, -0.4421456456184387, -0.4120751917362213, -0.3820047676563263, -0.3519343435764313, -0.32186391949653625, -0.29179349541664124, -0.26172304153442383, -0.23165263235569, -0.20158220827579498, -0.17151176929473877, -0.14144134521484375, -0.11137092113494873, -0.08130049705505371, -0.051230065524578094, -0.021159633994102478, 0.008910790085792542, 0.03898121416568756, 0.06905165314674377, 0.0991220772266388, 0.1291925013065338, 0.15926292538642883, 0.18933334946632385, 0.21940378844738007, 0.24947421252727509, 0.2795446515083313, 0.3096150755882263, 0.33968549966812134, 0.36975592374801636, 0.3998263478279114, 0.4298967719078064, 0.4599671959877014, 0.49003762006759644, 0.5201080441474915, 0.5501785278320312, 0.5802489519119263, 0.6103193759918213, 0.6403898000717163, 0.6704602241516113, 0.7005306482315063, 0.7306010723114014, 0.7606714963912964, 0.7907419204711914, 0.8208123445510864, 0.8508827686309814]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 3.0, 7.0, 8.0, 13.0, 13.0, 8.0, 14.0, 38.0, 70.0, 110.0, 67.0, 24.0, 8.0, 14.0, 15.0, 5.0, 15.0, 4.0, 8.0, 3.0, 5.0, 4.0, 3.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.3950127363204956, -1.3576780557632446, -1.3203433752059937, -1.2830085754394531, -1.2456738948822021, -1.2083392143249512, -1.1710045337677002, -1.1336698532104492, -1.0963350534439087, -1.0590003728866577, -1.0216656923294067, -0.984330952167511, -0.9469962120056152, -0.9096615314483643, -0.8723268508911133, -0.8349921107292175, -0.7976574301719666, -0.7603227496147156, -0.7229880094528198, -0.6856533288955688, -0.6483185887336731, -0.6109839081764221, -0.5736491680145264, -0.5363144874572754, -0.498979777097702, -0.46164506673812866, -0.4243103563785553, -0.38697564601898193, -0.34964096546173096, -0.3123062252998352, -0.27497154474258423, -0.23763683438301086, -0.20030206441879272, -0.16296735405921936, -0.125632643699646, -0.08829794824123383, -0.05096323788166046, -0.013628527522087097, 0.023706167936325073, 0.06104087829589844, 0.0983755886554718, 0.13571029901504517, 0.17304500937461853, 0.2103797048330307, 0.24771441519260406, 0.2850491404533386, 0.3223838210105896, 0.35971853137016296, 0.39705324172973633, 0.4343879520893097, 0.47172266244888306, 0.509057343006134, 0.5463920831680298, 0.5837267637252808, 0.6210614442825317, 0.6583961844444275, 0.6957309246063232, 0.7330656051635742, 0.77040034532547, 0.807735025882721, 0.8450697660446167, 0.8824044466018677, 0.9197391271591187, 0.9570738673210144, 0.9944085478782654]}, "eval/loss": 1.794046401977539, "eval/bleu": 3.550386321342364e-14, "eval/runtime": 2535.6975, "eval/samples_per_second": 5.821, "eval/steps_per_second": 0.728} \ No newline at end of file