diff --git "a/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" "b/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" --- "a/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" +++ "b/wandb/run-20220505_173818-i9acyhfo/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 1.4587, "train/learning_rate": 0.00012846330275229358, "train/epoch": 1.85, "train/global_step": 3000, "_runtime": 42967, "_timestamp": 1651815265, "_step": 3005, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 5.0, 6.0, 29.0, 87.0, 255.0, 304.0, 219.0, 87.0, 22.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6663763523101807, -0.5630879998207092, -0.4597996473312378, -0.35651129484176636, -0.2532229423522949, -0.1499345898628235, -0.04664623737335205, 0.056642115116119385, 0.15993046760559082, 0.26321882009506226, 0.3665071725845337, 0.4697955250740051, 0.5730838775634766, 0.676372230052948, 0.7796605825424194, 0.8829489350318909, 0.9862372875213623, 1.0895256996154785, 1.1928139925003052, 1.2961022853851318, 1.399390697479248, 1.5026791095733643, 1.605967402458191, 1.7092556953430176, 1.8125441074371338, 1.91583251953125, 2.019120693206787, 2.1224091053009033, 2.2256975173950195, 2.3289859294891357, 2.432274341583252, 2.535562515258789, 2.6388511657714844, 2.7421395778656006, 2.845427989959717, 2.948716163635254, 3.05200457572937, 3.1552929878234863, 3.2585811614990234, 3.3618695735931396, 3.465157985687256, 3.568446397781372, 3.6717348098754883, 3.7750229835510254, 3.8783113956451416, 3.981599807739258, 4.084887981414795, 4.18817663192749, 4.291464805603027, 4.3947529792785645, 4.49804162979126, 4.601329803466797, 4.704618453979492, 4.807906627655029, 4.911194801330566, 5.014483451843262, 5.117771625518799, 5.221059799194336, 5.324348449707031, 5.427636623382568, 5.5309247970581055, 5.634213447570801, 5.737501621246338, 5.840790271759033, 5.94407844543457]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 6.0, 4.0, 4.0, 3.0, 7.0, 13.0, 9.0, 11.0, 15.0, 20.0, 20.0, 14.0, 18.0, 29.0, 35.0, 31.0, 38.0, 36.0, 23.0, 30.0, 51.0, 36.0, 43.0, 43.0, 49.0, 38.0, 45.0, 37.0, 46.0, 25.0, 26.0, 22.0, 28.0, 23.0, 15.0, 18.0, 15.0, 17.0, 13.0, 15.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.9655946493148804, -0.9377118945121765, -0.9098291993141174, -0.8819464445114136, -0.8540637493133545, -0.8261809945106506, -0.7982982397079468, -0.7704155445098877, -0.7425327897071838, -0.71465003490448, -0.6867673397064209, -0.658884584903717, -0.631001889705658, -0.6031191349029541, -0.575236439704895, -0.5473536849021912, -0.5194709300994873, -0.49158820509910583, -0.46370548009872437, -0.4358227252960205, -0.40794000029563904, -0.38005727529525757, -0.3521745502948761, -0.32429182529449463, -0.29640913009643555, -0.2685264050960541, -0.2406436651945114, -0.21276094019412994, -0.18487820029258728, -0.1569954752922058, -0.12911275029182434, -0.10123001039028168, -0.07334727048873901, -0.04546453803777695, -0.01758180931210518, 0.01030091941356659, 0.038183651864528656, 0.06606638431549072, 0.09394910931587219, 0.12183184921741486, 0.14971457421779633, 0.1775972992181778, 0.20548003911972046, 0.23336276412010193, 0.2612454891204834, 0.28912824392318726, 0.31701093912124634, 0.3448936939239502, 0.37277641892433167, 0.40065914392471313, 0.4285418689250946, 0.4564245939254761, 0.48430734872817993, 0.5121901035308838, 0.5400727987289429, 0.5679555535316467, 0.5958382487297058, 0.6237210035324097, 0.6516036987304688, 0.6794864535331726, 0.7073691487312317, 0.7352519035339355, 0.7631345987319946, 0.7910173535346985, 0.8189001083374023]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 7.0, 5.0, 7.0, 19.0, 19.0, 27.0, 29.0, 72.0, 116.0, 190.0, 307.0, 576.0, 1234.0, 2425.0, 5198.0, 12341.0, 33212.0, 101312.0, 378460.0, 2005787.0, 1274740.0, 258428.0, 75230.0, 25874.0, 10173.0, 4277.0, 2065.0, 934.0, 512.0, 294.0, 164.0, 99.0, 58.0, 38.0, 16.0, 11.0, 10.0, 9.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3671875, -1.325592041015625, -1.28399658203125, -1.242401123046875, -1.2008056640625, -1.159210205078125, -1.11761474609375, -1.076019287109375, -1.034423828125, -0.992828369140625, -0.95123291015625, -0.909637451171875, -0.8680419921875, -0.826446533203125, -0.78485107421875, -0.743255615234375, -0.70166015625, -0.660064697265625, -0.61846923828125, -0.576873779296875, -0.5352783203125, -0.493682861328125, -0.45208740234375, -0.410491943359375, -0.368896484375, -0.327301025390625, -0.28570556640625, -0.244110107421875, -0.2025146484375, -0.160919189453125, -0.11932373046875, -0.077728271484375, -0.0361328125, 0.005462646484375, 0.04705810546875, 0.088653564453125, 0.1302490234375, 0.171844482421875, 0.21343994140625, 0.255035400390625, 0.296630859375, 0.338226318359375, 0.37982177734375, 0.421417236328125, 0.4630126953125, 0.504608154296875, 0.54620361328125, 0.587799072265625, 0.62939453125, 0.670989990234375, 0.71258544921875, 0.754180908203125, 0.7957763671875, 0.837371826171875, 0.87896728515625, 0.920562744140625, 0.962158203125, 1.003753662109375, 1.04534912109375, 1.086944580078125, 1.1285400390625, 1.170135498046875, 1.21173095703125, 1.253326416015625, 1.294921875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 7.0, 6.0, 7.0, 7.0, 16.0, 17.0, 19.0, 21.0, 14.0, 23.0, 21.0, 29.0, 32.0, 34.0, 45.0, 38.0, 42.0, 49.0, 44.0, 50.0, 48.0, 47.0, 45.0, 39.0, 34.0, 18.0, 31.0, 30.0, 24.0, 28.0, 24.0, 18.0, 15.0, 15.0, 13.0, 5.0, 4.0, 13.0, 5.0, 4.0, 1.0, 5.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2578125, -1.2187652587890625, -1.179718017578125, -1.1406707763671875, -1.10162353515625, -1.0625762939453125, -1.023529052734375, -0.9844818115234375, -0.9454345703125, -0.9063873291015625, -0.867340087890625, -0.8282928466796875, -0.78924560546875, -0.7501983642578125, -0.711151123046875, -0.6721038818359375, -0.633056640625, -0.5940093994140625, -0.554962158203125, -0.5159149169921875, -0.47686767578125, -0.4378204345703125, -0.398773193359375, -0.3597259521484375, -0.3206787109375, -0.2816314697265625, -0.242584228515625, -0.2035369873046875, -0.16448974609375, -0.1254425048828125, -0.086395263671875, -0.0473480224609375, -0.00830078125, 0.0307464599609375, 0.069793701171875, 0.1088409423828125, 0.14788818359375, 0.1869354248046875, 0.225982666015625, 0.2650299072265625, 0.3040771484375, 0.3431243896484375, 0.382171630859375, 0.4212188720703125, 0.46026611328125, 0.4993133544921875, 0.538360595703125, 0.5774078369140625, 0.616455078125, 0.6555023193359375, 0.694549560546875, 0.7335968017578125, 0.77264404296875, 0.8116912841796875, 0.850738525390625, 0.8897857666015625, 0.9288330078125, 0.9678802490234375, 1.006927490234375, 1.0459747314453125, 1.08502197265625, 1.1240692138671875, 1.163116455078125, 1.2021636962890625, 1.2412109375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 9.0, 7.0, 10.0, 23.0, 36.0, 52.0, 89.0, 140.0, 546.0, 185111.0, 4007128.0, 648.0, 188.0, 110.0, 70.0, 35.0, 31.0, 19.0, 9.0, 10.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.09375, -32.22412109375, -31.3544921875, -30.48486328125, -29.615234375, -28.74560546875, -27.8759765625, -27.00634765625, -26.13671875, -25.26708984375, -24.3974609375, -23.52783203125, -22.658203125, -21.78857421875, -20.9189453125, -20.04931640625, -19.1796875, -18.31005859375, -17.4404296875, -16.57080078125, -15.701171875, -14.83154296875, -13.9619140625, -13.09228515625, -12.22265625, -11.35302734375, -10.4833984375, -9.61376953125, -8.744140625, -7.87451171875, -7.0048828125, -6.13525390625, -5.265625, -4.39599609375, -3.5263671875, -2.65673828125, -1.787109375, -0.91748046875, -0.0478515625, 0.82177734375, 1.69140625, 2.56103515625, 3.4306640625, 4.30029296875, 5.169921875, 6.03955078125, 6.9091796875, 7.77880859375, 8.6484375, 9.51806640625, 10.3876953125, 11.25732421875, 12.126953125, 12.99658203125, 13.8662109375, 14.73583984375, 15.60546875, 16.47509765625, 17.3447265625, 18.21435546875, 19.083984375, 19.95361328125, 20.8232421875, 21.69287109375, 22.5625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 12.0, 18.0, 33.0, 48.0, 88.0, 163.0, 413.0, 1604.0, 1016.0, 303.0, 138.0, 89.0, 52.0, 38.0, 19.0, 5.0, 10.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2177734375, -1.1871719360351562, -1.1565704345703125, -1.1259689331054688, -1.095367431640625, -1.0647659301757812, -1.0341644287109375, -1.0035629272460938, -0.97296142578125, -0.9423599243164062, -0.9117584228515625, -0.8811569213867188, -0.850555419921875, -0.8199539184570312, -0.7893524169921875, -0.7587509155273438, -0.7281494140625, -0.6975479125976562, -0.6669464111328125, -0.6363449096679688, -0.605743408203125, -0.5751419067382812, -0.5445404052734375, -0.5139389038085938, -0.48333740234375, -0.45273590087890625, -0.4221343994140625, -0.39153289794921875, -0.360931396484375, -0.33032989501953125, -0.2997283935546875, -0.26912689208984375, -0.238525390625, -0.20792388916015625, -0.1773223876953125, -0.14672088623046875, -0.116119384765625, -0.08551788330078125, -0.0549163818359375, -0.02431488037109375, 0.00628662109375, 0.03688812255859375, 0.0674896240234375, 0.09809112548828125, 0.128692626953125, 0.15929412841796875, 0.1898956298828125, 0.22049713134765625, 0.2510986328125, 0.28170013427734375, 0.3123016357421875, 0.34290313720703125, 0.373504638671875, 0.40410614013671875, 0.4347076416015625, 0.46530914306640625, 0.49591064453125, 0.5265121459960938, 0.5571136474609375, 0.5877151489257812, 0.618316650390625, 0.6489181518554688, 0.6795196533203125, 0.7101211547851562, 0.74072265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 10.0, 8.0, 8.0, 15.0, 26.0, 43.0, 46.0, 61.0, 66.0, 85.0, 86.0, 76.0, 89.0, 82.0, 66.0, 57.0, 48.0, 36.0, 31.0, 21.0, 16.0, 10.0, 4.0, 0.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.711857318878174, -2.6433637142181396, -2.5748698711395264, -2.506376266479492, -2.437882661819458, -2.369389057159424, -2.3008952140808105, -2.2324016094207764, -2.163908004760742, -2.095414400100708, -2.0269205570220947, -1.9584269523620605, -1.8899333477020264, -1.8214396238327026, -1.752945899963379, -1.6844522953033447, -1.6159584522247314, -1.5474647283554077, -1.4789711236953735, -1.4104773998260498, -1.3419837951660156, -1.273490071296692, -1.2049963474273682, -1.136502742767334, -1.0680090188980103, -0.9995153546333313, -0.9310216903686523, -0.8625279664993286, -0.7940343022346497, -0.7255406379699707, -0.657046914100647, -0.588553249835968, -0.52005934715271, -0.451565682888031, -0.38307198882102966, -0.3145782947540283, -0.24608463048934937, -0.1775909662246704, -0.10909727215766907, -0.040603578090667725, 0.02789008617401123, 0.09638376533985138, 0.16487744450569153, 0.23337112367153168, 0.3018648028373718, 0.3703584671020508, 0.4388521611690521, 0.5073458552360535, 0.5758395195007324, 0.6443331837654114, 0.7128268480300903, 0.7813205718994141, 0.849814236164093, 0.918307900428772, 0.9868016242980957, 1.0552952289581299, 1.1237889528274536, 1.1922826766967773, 1.2607762813568115, 1.3292700052261353, 1.397763729095459, 1.4662573337554932, 1.534751057624817, 1.6032447814941406, 1.6717383861541748]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 7.0, 10.0, 11.0, 15.0, 23.0, 15.0, 40.0, 36.0, 33.0, 47.0, 37.0, 50.0, 46.0, 57.0, 53.0, 46.0, 44.0, 55.0, 48.0, 53.0, 42.0, 35.0, 33.0, 26.0, 20.0, 21.0, 16.0, 16.0, 14.0, 11.0, 11.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3398993015289307, -1.2938693761825562, -1.2478395700454712, -1.2018096446990967, -1.1557797193527222, -1.1097497940063477, -1.0637199878692627, -1.0176900625228882, -0.9716601967811584, -0.9256303310394287, -0.8796004056930542, -0.8335705399513245, -0.7875406742095947, -0.7415107488632202, -0.6954808831214905, -0.6494510173797607, -0.6034210920333862, -0.5573912262916565, -0.511361300945282, -0.46533143520355225, -0.4193015396595001, -0.373271644115448, -0.32724177837371826, -0.28121188282966614, -0.235181987285614, -0.1891520917415619, -0.14312221109867096, -0.09709233045578003, -0.051062434911727905, -0.005032539367675781, 0.040997326374053955, 0.08702722191810608, 0.13305699825286865, 0.17908689379692078, 0.2251167744398117, 0.27114665508270264, 0.31717655062675476, 0.3632064461708069, 0.4092363119125366, 0.45526620745658875, 0.5012961030006409, 0.5473259687423706, 0.5933558940887451, 0.6393857598304749, 0.6854156255722046, 0.7314455509185791, 0.7774754166603088, 0.8235052824020386, 0.8695352077484131, 0.9155650734901428, 0.9615949988365173, 1.007624864578247, 1.0536547899246216, 1.099684715270996, 1.145714521408081, 1.1917444467544556, 1.23777437210083, 1.2838042974472046, 1.3298341035842896, 1.375864028930664, 1.4218939542770386, 1.467923879623413, 1.513953685760498, 1.5599836111068726, 1.6060134172439575]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 6.0, 3.0, 9.0, 13.0, 21.0, 24.0, 47.0, 57.0, 85.0, 129.0, 207.0, 303.0, 460.0, 644.0, 914.0, 1420.0, 2132.0, 3143.0, 4622.0, 7108.0, 10617.0, 15998.0, 24335.0, 37793.0, 58309.0, 89610.0, 131712.0, 166128.0, 156347.0, 115210.0, 76468.0, 50121.0, 32315.0, 20941.0, 13806.0, 9125.0, 6086.0, 4014.0, 2667.0, 1736.0, 1231.0, 861.0, 547.0, 402.0, 264.0, 179.0, 112.0, 93.0, 53.0, 46.0, 28.0, 23.0, 15.0, 20.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.275390625, -0.2667350769042969, -0.25807952880859375, -0.24942398071289062, -0.2407684326171875, -0.23211288452148438, -0.22345733642578125, -0.21480178833007812, -0.206146240234375, -0.19749069213867188, -0.18883514404296875, -0.18017959594726562, -0.1715240478515625, -0.16286849975585938, -0.15421295166015625, -0.14555740356445312, -0.13690185546875, -0.12824630737304688, -0.11959075927734375, -0.11093521118164062, -0.1022796630859375, -0.09362411499023438, -0.08496856689453125, -0.07631301879882812, -0.067657470703125, -0.059001922607421875, -0.05034637451171875, -0.041690826416015625, -0.0330352783203125, -0.024379730224609375, -0.01572418212890625, -0.007068634033203125, 0.0015869140625, 0.010242462158203125, 0.01889801025390625, 0.027553558349609375, 0.0362091064453125, 0.044864654541015625, 0.05352020263671875, 0.062175750732421875, 0.070831298828125, 0.07948684692382812, 0.08814239501953125, 0.09679794311523438, 0.1054534912109375, 0.11410903930664062, 0.12276458740234375, 0.13142013549804688, 0.14007568359375, 0.14873123168945312, 0.15738677978515625, 0.16604232788085938, 0.1746978759765625, 0.18335342407226562, 0.19200897216796875, 0.20066452026367188, 0.209320068359375, 0.21797561645507812, 0.22663116455078125, 0.23528671264648438, 0.2439422607421875, 0.2525978088378906, 0.26125335693359375, 0.2699089050292969, 0.278564453125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 9.0, 7.0, 12.0, 8.0, 8.0, 10.0, 17.0, 19.0, 28.0, 35.0, 31.0, 37.0, 45.0, 34.0, 42.0, 43.0, 55.0, 39.0, 37.0, 40.0, 45.0, 54.0, 47.0, 39.0, 27.0, 32.0, 25.0, 33.0, 28.0, 26.0, 12.0, 12.0, 13.0, 10.0, 11.0, 12.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0068359375, -0.9767532348632812, -0.9466705322265625, -0.9165878295898438, -0.886505126953125, -0.8564224243164062, -0.8263397216796875, -0.7962570190429688, -0.76617431640625, -0.7360916137695312, -0.7060089111328125, -0.6759262084960938, -0.645843505859375, -0.6157608032226562, -0.5856781005859375, -0.5555953979492188, -0.5255126953125, -0.49542999267578125, -0.4653472900390625, -0.43526458740234375, -0.405181884765625, -0.37509918212890625, -0.3450164794921875, -0.31493377685546875, -0.28485107421875, -0.25476837158203125, -0.2246856689453125, -0.19460296630859375, -0.164520263671875, -0.13443756103515625, -0.1043548583984375, -0.07427215576171875, -0.044189453125, -0.01410675048828125, 0.0159759521484375, 0.04605865478515625, 0.076141357421875, 0.10622406005859375, 0.1363067626953125, 0.16638946533203125, 0.19647216796875, 0.22655487060546875, 0.2566375732421875, 0.28672027587890625, 0.316802978515625, 0.34688568115234375, 0.3769683837890625, 0.40705108642578125, 0.4371337890625, 0.46721649169921875, 0.4972991943359375, 0.5273818969726562, 0.557464599609375, 0.5875473022460938, 0.6176300048828125, 0.6477127075195312, 0.67779541015625, 0.7078781127929688, 0.7379608154296875, 0.7680435180664062, 0.798126220703125, 0.8282089233398438, 0.8582916259765625, 0.8883743286132812, 0.91845703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 7.0, 10.0, 19.0, 27.0, 13.0, 34.0, 38.0, 53.0, 107.0, 141.0, 199.0, 297.0, 561.0, 1139.0, 2520.0, 7349.0, 25925.0, 112553.0, 462737.0, 336345.0, 71439.0, 17521.0, 5346.0, 2011.0, 861.0, 457.0, 255.0, 174.0, 133.0, 72.0, 58.0, 38.0, 34.0, 21.0, 15.0, 10.0, 8.0, 5.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.71435546875, -0.6926116943359375, -0.670867919921875, -0.6491241455078125, -0.62738037109375, -0.6056365966796875, -0.583892822265625, -0.5621490478515625, -0.5404052734375, -0.5186614990234375, -0.496917724609375, -0.4751739501953125, -0.45343017578125, -0.4316864013671875, -0.409942626953125, -0.3881988525390625, -0.366455078125, -0.3447113037109375, -0.322967529296875, -0.3012237548828125, -0.27947998046875, -0.2577362060546875, -0.235992431640625, -0.2142486572265625, -0.1925048828125, -0.1707611083984375, -0.149017333984375, -0.1272735595703125, -0.10552978515625, -0.0837860107421875, -0.062042236328125, -0.0402984619140625, -0.0185546875, 0.0031890869140625, 0.024932861328125, 0.0466766357421875, 0.06842041015625, 0.0901641845703125, 0.111907958984375, 0.1336517333984375, 0.1553955078125, 0.1771392822265625, 0.198883056640625, 0.2206268310546875, 0.24237060546875, 0.2641143798828125, 0.285858154296875, 0.3076019287109375, 0.329345703125, 0.3510894775390625, 0.372833251953125, 0.3945770263671875, 0.41632080078125, 0.4380645751953125, 0.459808349609375, 0.4815521240234375, 0.5032958984375, 0.5250396728515625, 0.546783447265625, 0.5685272216796875, 0.59027099609375, 0.6120147705078125, 0.633758544921875, 0.6555023193359375, 0.67724609375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 2.0, 4.0, 8.0, 6.0, 4.0, 5.0, 17.0, 14.0, 21.0, 21.0, 24.0, 34.0, 27.0, 29.0, 28.0, 31.0, 27.0, 37.0, 41.0, 39.0, 47.0, 55.0, 50.0, 30.0, 40.0, 55.0, 33.0, 33.0, 34.0, 34.0, 21.0, 26.0, 18.0, 20.0, 9.0, 6.0, 15.0, 14.0, 7.0, 7.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.771484375, -1.7128143310546875, -1.654144287109375, -1.5954742431640625, -1.53680419921875, -1.4781341552734375, -1.419464111328125, -1.3607940673828125, -1.3021240234375, -1.2434539794921875, -1.184783935546875, -1.1261138916015625, -1.06744384765625, -1.0087738037109375, -0.950103759765625, -0.8914337158203125, -0.832763671875, -0.7740936279296875, -0.715423583984375, -0.6567535400390625, -0.59808349609375, -0.5394134521484375, -0.480743408203125, -0.4220733642578125, -0.3634033203125, -0.3047332763671875, -0.246063232421875, -0.1873931884765625, -0.12872314453125, -0.0700531005859375, -0.011383056640625, 0.0472869873046875, 0.10595703125, 0.1646270751953125, 0.223297119140625, 0.2819671630859375, 0.34063720703125, 0.3993072509765625, 0.457977294921875, 0.5166473388671875, 0.5753173828125, 0.6339874267578125, 0.692657470703125, 0.7513275146484375, 0.80999755859375, 0.8686676025390625, 0.927337646484375, 0.9860076904296875, 1.044677734375, 1.1033477783203125, 1.162017822265625, 1.2206878662109375, 1.27935791015625, 1.3380279541015625, 1.396697998046875, 1.4553680419921875, 1.5140380859375, 1.5727081298828125, 1.631378173828125, 1.6900482177734375, 1.74871826171875, 1.8073883056640625, 1.866058349609375, 1.9247283935546875, 1.9833984375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 12.0, 9.0, 22.0, 28.0, 48.0, 87.0, 195.0, 379.0, 1047.0, 3117.0, 13018.0, 126616.0, 819386.0, 71274.0, 9429.0, 2355.0, 853.0, 325.0, 141.0, 89.0, 35.0, 29.0, 21.0, 16.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5735549926757812, -0.5533599853515625, -0.5331649780273438, -0.512969970703125, -0.49277496337890625, -0.4725799560546875, -0.45238494873046875, -0.43218994140625, -0.41199493408203125, -0.3917999267578125, -0.37160491943359375, -0.351409912109375, -0.33121490478515625, -0.3110198974609375, -0.29082489013671875, -0.2706298828125, -0.25043487548828125, -0.2302398681640625, -0.21004486083984375, -0.189849853515625, -0.16965484619140625, -0.1494598388671875, -0.12926483154296875, -0.10906982421875, -0.08887481689453125, -0.0686798095703125, -0.04848480224609375, -0.028289794921875, -0.00809478759765625, 0.0121002197265625, 0.03229522705078125, 0.052490234375, 0.07268524169921875, 0.0928802490234375, 0.11307525634765625, 0.133270263671875, 0.15346527099609375, 0.1736602783203125, 0.19385528564453125, 0.21405029296875, 0.23424530029296875, 0.2544403076171875, 0.27463531494140625, 0.294830322265625, 0.31502532958984375, 0.3352203369140625, 0.35541534423828125, 0.3756103515625, 0.39580535888671875, 0.4160003662109375, 0.43619537353515625, 0.456390380859375, 0.47658538818359375, 0.4967803955078125, 0.5169754028320312, 0.53717041015625, 0.5573654174804688, 0.5775604248046875, 0.5977554321289062, 0.617950439453125, 0.6381454467773438, 0.6583404541015625, 0.6785354614257812, 0.69873046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 5.0, 9.0, 23.0, 40.0, 77.0, 149.0, 202.0, 202.0, 142.0, 71.0, 40.0, 21.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002448558807373047, -0.00023319199681282043, -0.00022152811288833618, -0.00020986422896385193, -0.00019820034503936768, -0.00018653646111488342, -0.00017487257719039917, -0.00016320869326591492, -0.00015154480934143066, -0.0001398809254169464, -0.00012821704149246216, -0.0001165531575679779, -0.00010488927364349365, -9.32253897190094e-05, -8.156150579452515e-05, -6.98976218700409e-05, -5.823373794555664e-05, -4.656985402107239e-05, -3.4905970096588135e-05, -2.3242086172103882e-05, -1.1578202247619629e-05, 8.568167686462402e-08, 1.1749565601348877e-05, 2.341344952583313e-05, 3.507733345031738e-05, 4.6741217374801636e-05, 5.840510129928589e-05, 7.006898522377014e-05, 8.17328691482544e-05, 9.339675307273865e-05, 0.0001050606369972229, 0.00011672452092170715, 0.0001283884048461914, 0.00014005228877067566, 0.0001517161726951599, 0.00016338005661964417, 0.00017504394054412842, 0.00018670782446861267, 0.00019837170839309692, 0.00021003559231758118, 0.00022169947624206543, 0.00023336336016654968, 0.00024502724409103394, 0.0002566911280155182, 0.00026835501194000244, 0.0002800188958644867, 0.00029168277978897095, 0.0003033466637134552, 0.00031501054763793945, 0.0003266744315624237, 0.00033833831548690796, 0.0003500021994113922, 0.00036166608333587646, 0.0003733299672603607, 0.00038499385118484497, 0.0003966577351093292, 0.0004083216190338135, 0.00041998550295829773, 0.000431649386882782, 0.00044331327080726624, 0.0004549771547317505, 0.00046664103865623474, 0.000478304922580719, 0.0004899688065052032, 0.0005016326904296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 8.0, 4.0, 3.0, 6.0, 8.0, 12.0, 28.0, 39.0, 101.0, 367.0, 3627.0, 352230.0, 686447.0, 4899.0, 485.0, 115.0, 58.0, 37.0, 17.0, 12.0, 16.0, 8.0, 4.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.162109375, -2.10675048828125, -2.0513916015625, -1.99603271484375, -1.940673828125, -1.88531494140625, -1.8299560546875, -1.77459716796875, -1.71923828125, -1.66387939453125, -1.6085205078125, -1.55316162109375, -1.497802734375, -1.44244384765625, -1.3870849609375, -1.33172607421875, -1.2763671875, -1.22100830078125, -1.1656494140625, -1.11029052734375, -1.054931640625, -0.99957275390625, -0.9442138671875, -0.88885498046875, -0.83349609375, -0.77813720703125, -0.7227783203125, -0.66741943359375, -0.612060546875, -0.55670166015625, -0.5013427734375, -0.44598388671875, -0.390625, -0.33526611328125, -0.2799072265625, -0.22454833984375, -0.169189453125, -0.11383056640625, -0.0584716796875, -0.00311279296875, 0.05224609375, 0.10760498046875, 0.1629638671875, 0.21832275390625, 0.273681640625, 0.32904052734375, 0.3843994140625, 0.43975830078125, 0.4951171875, 0.55047607421875, 0.6058349609375, 0.66119384765625, 0.716552734375, 0.77191162109375, 0.8272705078125, 0.88262939453125, 0.93798828125, 0.99334716796875, 1.0487060546875, 1.10406494140625, 1.159423828125, 1.21478271484375, 1.2701416015625, 1.32550048828125, 1.380859375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 2.0, 1.0, 3.0, 3.0, 10.0, 11.0, 20.0, 32.0, 63.0, 92.0, 136.0, 133.0, 146.0, 107.0, 75.0, 53.0, 33.0, 17.0, 18.0, 9.0, 9.0, 5.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1934814453125, -0.1882171630859375, -0.182952880859375, -0.1776885986328125, -0.17242431640625, -0.1671600341796875, -0.161895751953125, -0.1566314697265625, -0.1513671875, -0.1461029052734375, -0.140838623046875, -0.1355743408203125, -0.13031005859375, -0.1250457763671875, -0.119781494140625, -0.1145172119140625, -0.1092529296875, -0.1039886474609375, -0.098724365234375, -0.0934600830078125, -0.08819580078125, -0.0829315185546875, -0.077667236328125, -0.0724029541015625, -0.067138671875, -0.0618743896484375, -0.056610107421875, -0.0513458251953125, -0.04608154296875, -0.0408172607421875, -0.035552978515625, -0.0302886962890625, -0.0250244140625, -0.0197601318359375, -0.014495849609375, -0.0092315673828125, -0.00396728515625, 0.0012969970703125, 0.006561279296875, 0.0118255615234375, 0.01708984375, 0.0223541259765625, 0.027618408203125, 0.0328826904296875, 0.03814697265625, 0.0434112548828125, 0.048675537109375, 0.0539398193359375, 0.0592041015625, 0.0644683837890625, 0.069732666015625, 0.0749969482421875, 0.08026123046875, 0.0855255126953125, 0.090789794921875, 0.0960540771484375, 0.101318359375, 0.1065826416015625, 0.111846923828125, 0.1171112060546875, 0.12237548828125, 0.1276397705078125, 0.132904052734375, 0.1381683349609375, 0.1434326171875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 13.0, 19.0, 46.0, 95.0, 141.0, 204.0, 161.0, 148.0, 84.0, 45.0, 19.0, 13.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.26093864440918, -4.1614203453063965, -4.061902046203613, -3.962383985519409, -3.862865686416626, -3.763347625732422, -3.6638293266296387, -3.5643110275268555, -3.4647929668426514, -3.365274667739868, -3.265756607055664, -3.166238307952881, -3.0667200088500977, -2.9672019481658936, -2.8676836490631104, -2.7681655883789062, -2.668647289276123, -2.56912899017334, -2.4696109294891357, -2.3700926303863525, -2.2705743312835693, -2.1710562705993652, -2.071537971496582, -1.9720197916030884, -1.8725013732910156, -1.772983193397522, -1.6734648942947388, -1.5739467144012451, -1.4744285345077515, -1.3749103546142578, -1.2753920555114746, -1.175873875617981, -1.0763556957244873, -0.9768374562263489, -0.8773192763328552, -0.7778010368347168, -0.6782828569412231, -0.5787646174430847, -0.4792463779449463, -0.37972819805145264, -0.2802099585533142, -0.18069174885749817, -0.08117352426052094, 0.0183447003364563, 0.11786291003227234, 0.21738111972808838, 0.3168993592262268, 0.41641753911972046, 0.5159357786178589, 0.6154540181159973, 0.714972198009491, 0.8144904375076294, 0.914008617401123, 1.0135269165039062, 1.1130450963974, 1.2125632762908936, 1.3120815753936768, 1.4115997552871704, 1.5111180543899536, 1.6106362342834473, 1.710154414176941, 1.8096725940704346, 1.9091908931732178, 2.008708953857422, 2.108227252960205]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 7.0, 9.0, 9.0, 15.0, 13.0, 11.0, 19.0, 17.0, 18.0, 22.0, 25.0, 34.0, 38.0, 32.0, 42.0, 44.0, 34.0, 48.0, 53.0, 46.0, 49.0, 58.0, 49.0, 36.0, 40.0, 32.0, 36.0, 20.0, 24.0, 24.0, 17.0, 10.0, 17.0, 9.0, 13.0, 11.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94023197889328, -0.9097111225128174, -0.8791902661323547, -0.8486694097518921, -0.8181486129760742, -0.7876276969909668, -0.7571069002151489, -0.7265860438346863, -0.6960651874542236, -0.665544331073761, -0.6350234746932983, -0.6045026183128357, -0.573981761932373, -0.5434609651565552, -0.5129401087760925, -0.4824192523956299, -0.45189839601516724, -0.4213775396347046, -0.39085668325424194, -0.3603358566761017, -0.32981500029563904, -0.2992941439151764, -0.26877331733703613, -0.2382524609565735, -0.20773160457611084, -0.1772107481956482, -0.14668990671634674, -0.11616905778646469, -0.08564820885658264, -0.055127352476119995, -0.024606510996818542, 0.00591433048248291, 0.03643512725830078, 0.06695597618818283, 0.09747682511806488, 0.12799766659736633, 0.15851852297782898, 0.18903937935829163, 0.21956022083759308, 0.25008106231689453, 0.2806019186973572, 0.3111227750778198, 0.34164363145828247, 0.37216445803642273, 0.4026853144168854, 0.433206170797348, 0.4637269973754883, 0.4942478537559509, 0.5247687101364136, 0.5552895665168762, 0.5858104228973389, 0.6163312792778015, 0.6468521356582642, 0.677372932434082, 0.7078937888145447, 0.7384146451950073, 0.76893550157547, 0.7994563579559326, 0.8299772143363953, 0.8604980707168579, 0.8910188674926758, 0.9215397834777832, 0.9520605802536011, 0.9825814366340637, 1.0131022930145264]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 5.0, 14.0, 16.0, 32.0, 32.0, 52.0, 65.0, 132.0, 148.0, 193.0, 322.0, 463.0, 652.0, 1033.0, 1562.0, 2641.0, 4417.0, 7815.0, 15481.0, 34542.0, 89646.0, 237029.0, 354033.0, 177458.0, 65627.0, 26133.0, 12507.0, 6511.0, 3620.0, 2159.0, 1433.0, 902.0, 623.0, 368.0, 282.0, 180.0, 141.0, 93.0, 76.0, 36.0, 32.0, 18.0, 7.0, 12.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.59765625, -0.5807456970214844, -0.5638351440429688, -0.5469245910644531, -0.5300140380859375, -0.5131034851074219, -0.49619293212890625, -0.4792823791503906, -0.462371826171875, -0.4454612731933594, -0.42855072021484375, -0.4116401672363281, -0.3947296142578125, -0.3778190612792969, -0.36090850830078125, -0.3439979553222656, -0.32708740234375, -0.3101768493652344, -0.29326629638671875, -0.2763557434082031, -0.2594451904296875, -0.24253463745117188, -0.22562408447265625, -0.20871353149414062, -0.191802978515625, -0.17489242553710938, -0.15798187255859375, -0.14107131958007812, -0.1241607666015625, -0.10725021362304688, -0.09033966064453125, -0.07342910766601562, -0.0565185546875, -0.039608001708984375, -0.02269744873046875, -0.005786895751953125, 0.0111236572265625, 0.028034210205078125, 0.04494476318359375, 0.061855316162109375, 0.078765869140625, 0.09567642211914062, 0.11258697509765625, 0.12949752807617188, 0.1464080810546875, 0.16331863403320312, 0.18022918701171875, 0.19713973999023438, 0.21405029296875, 0.23096084594726562, 0.24787139892578125, 0.2647819519042969, 0.2816925048828125, 0.2986030578613281, 0.31551361083984375, 0.3324241638183594, 0.349334716796875, 0.3662452697753906, 0.38315582275390625, 0.4000663757324219, 0.4169769287109375, 0.4338874816894531, 0.45079803466796875, 0.4677085876464844, 0.484619140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 6.0, 7.0, 9.0, 9.0, 16.0, 16.0, 17.0, 27.0, 13.0, 22.0, 34.0, 32.0, 40.0, 44.0, 32.0, 52.0, 45.0, 42.0, 58.0, 39.0, 35.0, 36.0, 51.0, 39.0, 37.0, 39.0, 31.0, 18.0, 20.0, 30.0, 18.0, 10.0, 16.0, 7.0, 10.0, 5.0, 5.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.775390625, -3.665435791015625, -3.55548095703125, -3.445526123046875, -3.3355712890625, -3.225616455078125, -3.11566162109375, -3.005706787109375, -2.895751953125, -2.785797119140625, -2.67584228515625, -2.565887451171875, -2.4559326171875, -2.345977783203125, -2.23602294921875, -2.126068115234375, -2.01611328125, -1.906158447265625, -1.79620361328125, -1.686248779296875, -1.5762939453125, -1.466339111328125, -1.35638427734375, -1.246429443359375, -1.136474609375, -1.026519775390625, -0.91656494140625, -0.806610107421875, -0.6966552734375, -0.586700439453125, -0.47674560546875, -0.366790771484375, -0.2568359375, -0.146881103515625, -0.03692626953125, 0.073028564453125, 0.1829833984375, 0.292938232421875, 0.40289306640625, 0.512847900390625, 0.622802734375, 0.732757568359375, 0.84271240234375, 0.952667236328125, 1.0626220703125, 1.172576904296875, 1.28253173828125, 1.392486572265625, 1.50244140625, 1.612396240234375, 1.72235107421875, 1.832305908203125, 1.9422607421875, 2.052215576171875, 2.16217041015625, 2.272125244140625, 2.382080078125, 2.492034912109375, 2.60198974609375, 2.711944580078125, 2.8218994140625, 2.931854248046875, 3.04180908203125, 3.151763916015625, 3.26171875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 12.0, 10.0, 16.0, 23.0, 23.0, 23.0, 39.0, 61.0, 60.0, 97.0, 161.0, 235.0, 387.0, 1097.0, 9461.0, 794553.0, 236384.0, 4115.0, 709.0, 345.0, 223.0, 147.0, 91.0, 68.0, 52.0, 31.0, 40.0, 13.0, 21.0, 12.0, 3.0, 5.0, 9.0, 0.0, 4.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.953125, -2.870758056640625, -2.78839111328125, -2.706024169921875, -2.6236572265625, -2.541290283203125, -2.45892333984375, -2.376556396484375, -2.294189453125, -2.211822509765625, -2.12945556640625, -2.047088623046875, -1.9647216796875, -1.882354736328125, -1.79998779296875, -1.717620849609375, -1.63525390625, -1.552886962890625, -1.47052001953125, -1.388153076171875, -1.3057861328125, -1.223419189453125, -1.14105224609375, -1.058685302734375, -0.976318359375, -0.893951416015625, -0.81158447265625, -0.729217529296875, -0.6468505859375, -0.564483642578125, -0.48211669921875, -0.399749755859375, -0.3173828125, -0.235015869140625, -0.15264892578125, -0.070281982421875, 0.0120849609375, 0.094451904296875, 0.17681884765625, 0.259185791015625, 0.341552734375, 0.423919677734375, 0.50628662109375, 0.588653564453125, 0.6710205078125, 0.753387451171875, 0.83575439453125, 0.918121337890625, 1.00048828125, 1.082855224609375, 1.16522216796875, 1.247589111328125, 1.3299560546875, 1.412322998046875, 1.49468994140625, 1.577056884765625, 1.659423828125, 1.741790771484375, 1.82415771484375, 1.906524658203125, 1.9888916015625, 2.071258544921875, 2.15362548828125, 2.235992431640625, 2.318359375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 4.0, 7.0, 6.0, 14.0, 9.0, 16.0, 21.0, 25.0, 25.0, 27.0, 34.0, 34.0, 37.0, 54.0, 43.0, 53.0, 56.0, 63.0, 45.0, 45.0, 45.0, 38.0, 47.0, 32.0, 32.0, 38.0, 43.0, 21.0, 20.0, 12.0, 11.0, 7.0, 9.0, 4.0, 4.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.2481689453125, -4.121337890625, -3.9945068359375, -3.86767578125, -3.7408447265625, -3.614013671875, -3.4871826171875, -3.3603515625, -3.2335205078125, -3.106689453125, -2.9798583984375, -2.85302734375, -2.7261962890625, -2.599365234375, -2.4725341796875, -2.345703125, -2.2188720703125, -2.092041015625, -1.9652099609375, -1.83837890625, -1.7115478515625, -1.584716796875, -1.4578857421875, -1.3310546875, -1.2042236328125, -1.077392578125, -0.9505615234375, -0.82373046875, -0.6968994140625, -0.570068359375, -0.4432373046875, -0.31640625, -0.1895751953125, -0.062744140625, 0.0640869140625, 0.19091796875, 0.3177490234375, 0.444580078125, 0.5714111328125, 0.6982421875, 0.8250732421875, 0.951904296875, 1.0787353515625, 1.20556640625, 1.3323974609375, 1.459228515625, 1.5860595703125, 1.712890625, 1.8397216796875, 1.966552734375, 2.0933837890625, 2.22021484375, 2.3470458984375, 2.473876953125, 2.6007080078125, 2.7275390625, 2.8543701171875, 2.981201171875, 3.1080322265625, 3.23486328125, 3.3616943359375, 3.488525390625, 3.6153564453125, 3.7421875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 10.0, 18.0, 15.0, 27.0, 79.0, 156.0, 461.0, 2051.0, 18034.0, 953900.0, 68498.0, 4091.0, 771.0, 238.0, 88.0, 39.0, 27.0, 16.0, 7.0, 8.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55419921875, -0.5341873168945312, -0.5141754150390625, -0.49416351318359375, -0.474151611328125, -0.45413970947265625, -0.4341278076171875, -0.41411590576171875, -0.39410400390625, -0.37409210205078125, -0.3540802001953125, -0.33406829833984375, -0.314056396484375, -0.29404449462890625, -0.2740325927734375, -0.25402069091796875, -0.2340087890625, -0.21399688720703125, -0.1939849853515625, -0.17397308349609375, -0.153961181640625, -0.13394927978515625, -0.1139373779296875, -0.09392547607421875, -0.07391357421875, -0.05390167236328125, -0.0338897705078125, -0.01387786865234375, 0.006134033203125, 0.02614593505859375, 0.0461578369140625, 0.06616973876953125, 0.086181640625, 0.10619354248046875, 0.1262054443359375, 0.14621734619140625, 0.166229248046875, 0.18624114990234375, 0.2062530517578125, 0.22626495361328125, 0.24627685546875, 0.26628875732421875, 0.2863006591796875, 0.30631256103515625, 0.326324462890625, 0.34633636474609375, 0.3663482666015625, 0.38636016845703125, 0.4063720703125, 0.42638397216796875, 0.4463958740234375, 0.46640777587890625, 0.486419677734375, 0.5064315795898438, 0.5264434814453125, 0.5464553833007812, 0.56646728515625, 0.5864791870117188, 0.6064910888671875, 0.6265029907226562, 0.646514892578125, 0.6665267944335938, 0.6865386962890625, 0.7065505981445312, 0.7265625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 17.0, 29.0, 47.0, 146.0, 349.0, 225.0, 83.0, 40.0, 15.0, 16.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010257959365844727, -9.95369628071785e-05, -9.649433195590973e-05, -9.345170110464096e-05, -9.040907025337219e-05, -8.736643940210342e-05, -8.432380855083466e-05, -8.128117769956589e-05, -7.823854684829712e-05, -7.519591599702835e-05, -7.215328514575958e-05, -6.911065429449081e-05, -6.606802344322205e-05, -6.302539259195328e-05, -5.998276174068451e-05, -5.694013088941574e-05, -5.389750003814697e-05, -5.0854869186878204e-05, -4.7812238335609436e-05, -4.476960748434067e-05, -4.17269766330719e-05, -3.868434578180313e-05, -3.564171493053436e-05, -3.2599084079265594e-05, -2.9556453227996826e-05, -2.6513822376728058e-05, -2.347119152545929e-05, -2.042856067419052e-05, -1.7385929822921753e-05, -1.4343298971652985e-05, -1.1300668120384216e-05, -8.258037269115448e-06, -5.21540641784668e-06, -2.1727755665779114e-06, 8.698552846908569e-07, 3.912486135959625e-06, 6.9551169872283936e-06, 9.997747838497162e-06, 1.304037868976593e-05, 1.60830095410347e-05, 1.9125640392303467e-05, 2.2168271243572235e-05, 2.5210902094841003e-05, 2.8253532946109772e-05, 3.129616379737854e-05, 3.433879464864731e-05, 3.738142549991608e-05, 4.0424056351184845e-05, 4.346668720245361e-05, 4.650931805372238e-05, 4.955194890499115e-05, 5.259457975625992e-05, 5.5637210607528687e-05, 5.8679841458797455e-05, 6.172247231006622e-05, 6.476510316133499e-05, 6.780773401260376e-05, 7.085036486387253e-05, 7.38929957151413e-05, 7.693562656641006e-05, 7.997825741767883e-05, 8.30208882689476e-05, 8.606351912021637e-05, 8.910614997148514e-05, 9.21487808227539e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 9.0, 26.0, 38.0, 63.0, 161.0, 386.0, 1243.0, 5748.0, 69248.0, 937020.0, 29653.0, 3615.0, 800.0, 274.0, 125.0, 66.0, 30.0, 13.0, 10.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69921875, -0.6814537048339844, -0.6636886596679688, -0.6459236145019531, -0.6281585693359375, -0.6103935241699219, -0.5926284790039062, -0.5748634338378906, -0.557098388671875, -0.5393333435058594, -0.5215682983398438, -0.5038032531738281, -0.4860382080078125, -0.4682731628417969, -0.45050811767578125, -0.4327430725097656, -0.41497802734375, -0.3972129821777344, -0.37944793701171875, -0.3616828918457031, -0.3439178466796875, -0.3261528015136719, -0.30838775634765625, -0.2906227111816406, -0.272857666015625, -0.2550926208496094, -0.23732757568359375, -0.21956253051757812, -0.2017974853515625, -0.18403244018554688, -0.16626739501953125, -0.14850234985351562, -0.1307373046875, -0.11297225952148438, -0.09520721435546875, -0.07744216918945312, -0.0596771240234375, -0.041912078857421875, -0.02414703369140625, -0.006381988525390625, 0.011383056640625, 0.029148101806640625, 0.04691314697265625, 0.06467819213867188, 0.0824432373046875, 0.10020828247070312, 0.11797332763671875, 0.13573837280273438, 0.15350341796875, 0.17126846313476562, 0.18903350830078125, 0.20679855346679688, 0.2245635986328125, 0.24232864379882812, 0.26009368896484375, 0.2778587341308594, 0.295623779296875, 0.3133888244628906, 0.33115386962890625, 0.3489189147949219, 0.3666839599609375, 0.3844490051269531, 0.40221405029296875, 0.4199790954589844, 0.437744140625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 9.0, 13.0, 12.0, 12.0, 20.0, 16.0, 48.0, 53.0, 106.0, 231.0, 214.0, 85.0, 54.0, 23.0, 15.0, 18.0, 15.0, 13.0, 9.0, 7.0, 6.0, 7.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.12674713134765625, -0.1230010986328125, -0.11925506591796875, -0.115509033203125, -0.11176300048828125, -0.1080169677734375, -0.10427093505859375, -0.10052490234375, -0.09677886962890625, -0.0930328369140625, -0.08928680419921875, -0.085540771484375, -0.08179473876953125, -0.0780487060546875, -0.07430267333984375, -0.070556640625, -0.06681060791015625, -0.0630645751953125, -0.05931854248046875, -0.055572509765625, -0.05182647705078125, -0.0480804443359375, -0.04433441162109375, -0.04058837890625, -0.03684234619140625, -0.0330963134765625, -0.02935028076171875, -0.025604248046875, -0.02185821533203125, -0.0181121826171875, -0.01436614990234375, -0.0106201171875, -0.00687408447265625, -0.0031280517578125, 0.00061798095703125, 0.004364013671875, 0.00811004638671875, 0.0118560791015625, 0.01560211181640625, 0.01934814453125, 0.02309417724609375, 0.0268402099609375, 0.03058624267578125, 0.034332275390625, 0.03807830810546875, 0.0418243408203125, 0.04557037353515625, 0.04931640625, 0.05306243896484375, 0.0568084716796875, 0.06055450439453125, 0.064300537109375, 0.06804656982421875, 0.0717926025390625, 0.07553863525390625, 0.07928466796875, 0.08303070068359375, 0.0867767333984375, 0.09052276611328125, 0.094268798828125, 0.09801483154296875, 0.1017608642578125, 0.10550689697265625, 0.1092529296875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 27.0, 106.0, 309.0, 364.0, 162.0, 33.0, 4.0, 4.0, 1.0, 1.0], "bins": [-18.851255416870117, -18.52089500427246, -18.190536499023438, -17.86017608642578, -17.529817581176758, -17.1994571685791, -16.869098663330078, -16.538738250732422, -16.208377838134766, -15.878018379211426, -15.547658920288086, -15.21729850769043, -14.88693904876709, -14.55657958984375, -14.22622013092041, -13.89586067199707, -13.565502166748047, -13.235142707824707, -12.904783248901367, -12.574422836303711, -12.244063377380371, -11.913703918457031, -11.583344459533691, -11.252985000610352, -10.922624588012695, -10.592265129089355, -10.261905670166016, -9.93154525756836, -9.60118579864502, -9.27082633972168, -8.94046688079834, -8.610107421875, -8.279747009277344, -7.949387550354004, -7.619027614593506, -7.288668155670166, -6.958308696746826, -6.627948760986328, -6.297589302062988, -5.967229843139648, -5.636870384216309, -5.306510925292969, -4.976150989532471, -4.645791530609131, -4.315432071685791, -3.985072374343872, -3.654712677001953, -3.3243532180786133, -2.9939935207366943, -2.6636338233947754, -2.3332743644714355, -2.0029146671295166, -1.6725550889968872, -1.3421955108642578, -1.0118358135223389, -0.681476354598999, -0.3511166572570801, -0.020757049322128296, 0.3096025586128235, 0.6399621963500977, 0.970321774482727, 1.3006813526153564, 1.6310410499572754, 1.9614005088806152, 2.291760206222534]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 6.0, 6.0, 6.0, 14.0, 17.0, 20.0, 19.0, 21.0, 23.0, 31.0, 38.0, 47.0, 40.0, 26.0, 41.0, 59.0, 41.0, 59.0, 48.0, 40.0, 45.0, 47.0, 41.0, 36.0, 23.0, 31.0, 27.0, 32.0, 13.0, 21.0, 21.0, 9.0, 9.0, 4.0, 3.0, 9.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.556023597717285, -5.387862205505371, -5.219700813293457, -5.051539421081543, -4.883378028869629, -4.715216636657715, -4.547055244445801, -4.378893852233887, -4.210732460021973, -4.042571067810059, -3.8744096755981445, -3.7062482833862305, -3.5380868911743164, -3.3699254989624023, -3.2017643451690674, -3.0336029529571533, -2.8654417991638184, -2.6972804069519043, -2.5291190147399902, -2.360957622528076, -2.192796230316162, -2.024634838104248, -1.856473684310913, -1.688312292098999, -1.520150899887085, -1.351989507675171, -1.1838281154632568, -1.0156668424606323, -0.8475054502487183, -0.6793440580368042, -0.5111827850341797, -0.3430213928222656, -0.17486047744750977, -0.006699115037918091, 0.16146224737167358, 0.32962357997894287, 0.49778497219085693, 0.665946364402771, 0.8341076374053955, 1.0022690296173096, 1.1704304218292236, 1.3385918140411377, 1.5067532062530518, 1.6749144792556763, 1.8430758714675903, 2.011237144470215, 2.179398536682129, 2.347559928894043, 2.515721321105957, 2.683882713317871, 2.852044105529785, 3.020205497741699, 3.1883668899536133, 3.3565282821655273, 3.5246894359588623, 3.6928508281707764, 3.8610122203826904, 4.029173374176025, 4.1973347663879395, 4.3654961585998535, 4.533657550811768, 4.701818943023682, 4.869980335235596, 5.03814172744751, 5.206303119659424]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 12.0, 10.0, 24.0, 24.0, 42.0, 45.0, 59.0, 106.0, 153.0, 265.0, 484.0, 986.0, 2157.0, 5433.0, 15676.0, 63095.0, 455866.0, 2774955.0, 747426.0, 93956.0, 21472.0, 6932.0, 2672.0, 1112.0, 584.0, 292.0, 158.0, 109.0, 52.0, 34.0, 24.0, 11.0, 16.0, 8.0, 4.0, 2.0, 5.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.6533203125, -1.6041259765625, -1.554931640625, -1.5057373046875, -1.45654296875, -1.4073486328125, -1.358154296875, -1.3089599609375, -1.259765625, -1.2105712890625, -1.161376953125, -1.1121826171875, -1.06298828125, -1.0137939453125, -0.964599609375, -0.9154052734375, -0.8662109375, -0.8170166015625, -0.767822265625, -0.7186279296875, -0.66943359375, -0.6202392578125, -0.571044921875, -0.5218505859375, -0.47265625, -0.4234619140625, -0.374267578125, -0.3250732421875, -0.27587890625, -0.2266845703125, -0.177490234375, -0.1282958984375, -0.0791015625, -0.0299072265625, 0.019287109375, 0.0684814453125, 0.11767578125, 0.1668701171875, 0.216064453125, 0.2652587890625, 0.314453125, 0.3636474609375, 0.412841796875, 0.4620361328125, 0.51123046875, 0.5604248046875, 0.609619140625, 0.6588134765625, 0.7080078125, 0.7572021484375, 0.806396484375, 0.8555908203125, 0.90478515625, 0.9539794921875, 1.003173828125, 1.0523681640625, 1.1015625, 1.1507568359375, 1.199951171875, 1.2491455078125, 1.29833984375, 1.3475341796875, 1.396728515625, 1.4459228515625, 1.4951171875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 3.0, 7.0, 11.0, 13.0, 10.0, 17.0, 11.0, 21.0, 14.0, 28.0, 25.0, 40.0, 28.0, 39.0, 44.0, 37.0, 53.0, 50.0, 55.0, 64.0, 54.0, 46.0, 36.0, 45.0, 34.0, 23.0, 29.0, 23.0, 29.0, 19.0, 15.0, 12.0, 12.0, 12.0, 8.0, 2.0, 9.0, 4.0, 5.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.087890625, -1.0562210083007812, -1.0245513916015625, -0.9928817749023438, -0.961212158203125, -0.9295425415039062, -0.8978729248046875, -0.8662033081054688, -0.83453369140625, -0.8028640747070312, -0.7711944580078125, -0.7395248413085938, -0.707855224609375, -0.6761856079101562, -0.6445159912109375, -0.6128463745117188, -0.5811767578125, -0.5495071411132812, -0.5178375244140625, -0.48616790771484375, -0.454498291015625, -0.42282867431640625, -0.3911590576171875, -0.35948944091796875, -0.32781982421875, -0.29615020751953125, -0.2644805908203125, -0.23281097412109375, -0.201141357421875, -0.16947174072265625, -0.1378021240234375, -0.10613250732421875, -0.074462890625, -0.04279327392578125, -0.0111236572265625, 0.02054595947265625, 0.052215576171875, 0.08388519287109375, 0.1155548095703125, 0.14722442626953125, 0.17889404296875, 0.21056365966796875, 0.2422332763671875, 0.27390289306640625, 0.305572509765625, 0.33724212646484375, 0.3689117431640625, 0.40058135986328125, 0.4322509765625, 0.46392059326171875, 0.4955902099609375, 0.5272598266601562, 0.558929443359375, 0.5905990600585938, 0.6222686767578125, 0.6539382934570312, 0.68560791015625, 0.7172775268554688, 0.7489471435546875, 0.7806167602539062, 0.812286376953125, 0.8439559936523438, 0.8756256103515625, 0.9072952270507812, 0.93896484375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 9.0, 13.0, 16.0, 45.0, 102.0, 299.0, 7566.0, 4184946.0, 964.0, 175.0, 74.0, 36.0, 12.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.390625, -20.7666015625, -20.142578125, -19.5185546875, -18.89453125, -18.2705078125, -17.646484375, -17.0224609375, -16.3984375, -15.7744140625, -15.150390625, -14.5263671875, -13.90234375, -13.2783203125, -12.654296875, -12.0302734375, -11.40625, -10.7822265625, -10.158203125, -9.5341796875, -8.91015625, -8.2861328125, -7.662109375, -7.0380859375, -6.4140625, -5.7900390625, -5.166015625, -4.5419921875, -3.91796875, -3.2939453125, -2.669921875, -2.0458984375, -1.421875, -0.7978515625, -0.173828125, 0.4501953125, 1.07421875, 1.6982421875, 2.322265625, 2.9462890625, 3.5703125, 4.1943359375, 4.818359375, 5.4423828125, 6.06640625, 6.6904296875, 7.314453125, 7.9384765625, 8.5625, 9.1865234375, 9.810546875, 10.4345703125, 11.05859375, 11.6826171875, 12.306640625, 12.9306640625, 13.5546875, 14.1787109375, 14.802734375, 15.4267578125, 16.05078125, 16.6748046875, 17.298828125, 17.9228515625, 18.546875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 5.0, 8.0, 23.0, 22.0, 54.0, 77.0, 153.0, 304.0, 709.0, 1272.0, 724.0, 317.0, 186.0, 76.0, 53.0, 39.0, 23.0, 15.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60888671875, -0.5859375, -0.56298828125, -0.5400390625, -0.51708984375, -0.494140625, -0.47119140625, -0.4482421875, -0.42529296875, -0.40234375, -0.37939453125, -0.3564453125, -0.33349609375, -0.310546875, -0.28759765625, -0.2646484375, -0.24169921875, -0.21875, -0.19580078125, -0.1728515625, -0.14990234375, -0.126953125, -0.10400390625, -0.0810546875, -0.05810546875, -0.03515625, -0.01220703125, 0.0107421875, 0.03369140625, 0.056640625, 0.07958984375, 0.1025390625, 0.12548828125, 0.1484375, 0.17138671875, 0.1943359375, 0.21728515625, 0.240234375, 0.26318359375, 0.2861328125, 0.30908203125, 0.33203125, 0.35498046875, 0.3779296875, 0.40087890625, 0.423828125, 0.44677734375, 0.4697265625, 0.49267578125, 0.515625, 0.53857421875, 0.5615234375, 0.58447265625, 0.607421875, 0.63037109375, 0.6533203125, 0.67626953125, 0.69921875, 0.72216796875, 0.7451171875, 0.76806640625, 0.791015625, 0.81396484375, 0.8369140625, 0.85986328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 8.0, 7.0, 8.0, 15.0, 28.0, 53.0, 67.0, 107.0, 121.0, 142.0, 139.0, 100.0, 69.0, 62.0, 29.0, 23.0, 14.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.014052391052246, -3.923814296722412, -3.833576202392578, -3.743338108062744, -3.65310001373291, -3.562861919403076, -3.472623825073242, -3.382385730743408, -3.292147636413574, -3.2019095420837402, -3.1116714477539062, -3.0214333534240723, -2.9311952590942383, -2.8409571647644043, -2.7507190704345703, -2.6604809761047363, -2.5702428817749023, -2.4800047874450684, -2.3897666931152344, -2.2995285987854004, -2.2092905044555664, -2.1190524101257324, -2.0288143157958984, -1.9385762214660645, -1.8483381271362305, -1.7581000328063965, -1.6678619384765625, -1.5776238441467285, -1.4873857498168945, -1.3971476554870605, -1.3069095611572266, -1.2166714668273926, -1.1264334917068481, -1.0361953973770142, -0.9459573030471802, -0.8557192087173462, -0.7654811143875122, -0.6752430200576782, -0.5850049257278442, -0.49476683139801025, -0.40452873706817627, -0.3142906427383423, -0.2240525484085083, -0.13381445407867432, -0.04357635974884033, 0.04666173458099365, 0.13689982891082764, 0.22713792324066162, 0.3173760175704956, 0.4076141119003296, 0.4978522062301636, 0.5880903005599976, 0.6783283948898315, 0.7685664892196655, 0.8588045835494995, 0.9490426778793335, 1.0392807722091675, 1.1295188665390015, 1.2197569608688354, 1.3099950551986694, 1.4002331495285034, 1.4904712438583374, 1.5807093381881714, 1.6709474325180054, 1.7611855268478394]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 5.0, 13.0, 8.0, 13.0, 12.0, 19.0, 23.0, 34.0, 19.0, 28.0, 30.0, 39.0, 36.0, 31.0, 45.0, 38.0, 46.0, 47.0, 48.0, 51.0, 47.0, 40.0, 39.0, 38.0, 29.0, 19.0, 36.0, 30.0, 18.0, 17.0, 23.0, 14.0, 15.0, 8.0, 7.0, 1.0, 3.0, 7.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1543492078781128, -1.1197924613952637, -1.0852357149124146, -1.0506789684295654, -1.0161223411560059, -0.9815655946731567, -0.9470088481903076, -0.9124521017074585, -0.8778953552246094, -0.8433386087417603, -0.8087819218635559, -0.7742251753807068, -0.7396684288978577, -0.7051117420196533, -0.6705549955368042, -0.6359982490539551, -0.6014415621757507, -0.5668848156929016, -0.5323281288146973, -0.49777138233184814, -0.463214635848999, -0.4286579191684723, -0.39410120248794556, -0.35954445600509644, -0.3249877393245697, -0.29043102264404297, -0.25587427616119385, -0.22131755948066711, -0.1867608278989792, -0.15220409631729126, -0.11764737963676453, -0.0830906480550766, -0.04853391647338867, -0.013977188616991043, 0.020579539239406586, 0.055136263370513916, 0.08969299495220184, 0.12424972653388977, 0.1588064432144165, 0.19336317479610443, 0.22791990637779236, 0.2624766230583191, 0.2970333695411682, 0.33159008622169495, 0.3661468029022217, 0.4007035493850708, 0.43526026606559753, 0.46981698274612427, 0.5043737292289734, 0.5389304757118225, 0.5734871625900269, 0.608043909072876, 0.6426006555557251, 0.6771574020385742, 0.7117140889167786, 0.7462708353996277, 0.780827522277832, 0.8153842687606812, 0.8499409556388855, 0.8844977021217346, 0.9190544486045837, 0.9536111354827881, 0.9881678819656372, 1.0227246284484863, 1.0572813749313354]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 10.0, 13.0, 19.0, 25.0, 49.0, 55.0, 119.0, 153.0, 283.0, 479.0, 844.0, 1393.0, 2790.0, 5568.0, 12768.0, 31514.0, 84781.0, 220138.0, 389364.0, 181751.0, 68882.0, 26409.0, 10666.0, 4910.0, 2410.0, 1302.0, 735.0, 417.0, 251.0, 178.0, 93.0, 56.0, 39.0, 20.0, 22.0, 16.0, 4.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.485595703125, -0.4706077575683594, -0.45561981201171875, -0.4406318664550781, -0.4256439208984375, -0.4106559753417969, -0.39566802978515625, -0.3806800842285156, -0.365692138671875, -0.3507041931152344, -0.33571624755859375, -0.3207283020019531, -0.3057403564453125, -0.2907524108886719, -0.27576446533203125, -0.2607765197753906, -0.24578857421875, -0.23080062866210938, -0.21581268310546875, -0.20082473754882812, -0.1858367919921875, -0.17084884643554688, -0.15586090087890625, -0.14087295532226562, -0.125885009765625, -0.11089706420898438, -0.09590911865234375, -0.08092117309570312, -0.0659332275390625, -0.050945281982421875, -0.03595733642578125, -0.020969390869140625, -0.0059814453125, 0.009006500244140625, 0.02399444580078125, 0.038982391357421875, 0.0539703369140625, 0.06895828247070312, 0.08394622802734375, 0.09893417358398438, 0.113922119140625, 0.12891006469726562, 0.14389801025390625, 0.15888595581054688, 0.1738739013671875, 0.18886184692382812, 0.20384979248046875, 0.21883773803710938, 0.23382568359375, 0.24881362915039062, 0.26380157470703125, 0.2787895202636719, 0.2937774658203125, 0.3087654113769531, 0.32375335693359375, 0.3387413024902344, 0.353729248046875, 0.3687171936035156, 0.38370513916015625, 0.3986930847167969, 0.4136810302734375, 0.4286689758300781, 0.44365692138671875, 0.4586448669433594, 0.4736328125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 8.0, 6.0, 8.0, 6.0, 6.0, 9.0, 19.0, 16.0, 19.0, 30.0, 28.0, 27.0, 26.0, 28.0, 44.0, 45.0, 65.0, 56.0, 52.0, 52.0, 58.0, 58.0, 50.0, 50.0, 38.0, 31.0, 39.0, 26.0, 23.0, 16.0, 21.0, 10.0, 5.0, 10.0, 6.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.92822265625, -0.9008407592773438, -0.8734588623046875, -0.8460769653320312, -0.818695068359375, -0.7913131713867188, -0.7639312744140625, -0.7365493774414062, -0.70916748046875, -0.6817855834960938, -0.6544036865234375, -0.6270217895507812, -0.599639892578125, -0.5722579956054688, -0.5448760986328125, -0.5174942016601562, -0.4901123046875, -0.46273040771484375, -0.4353485107421875, -0.40796661376953125, -0.380584716796875, -0.35320281982421875, -0.3258209228515625, -0.29843902587890625, -0.27105712890625, -0.24367523193359375, -0.2162933349609375, -0.18891143798828125, -0.161529541015625, -0.13414764404296875, -0.1067657470703125, -0.07938385009765625, -0.052001953125, -0.02462005615234375, 0.0027618408203125, 0.03014373779296875, 0.057525634765625, 0.08490753173828125, 0.1122894287109375, 0.13967132568359375, 0.16705322265625, 0.19443511962890625, 0.2218170166015625, 0.24919891357421875, 0.276580810546875, 0.30396270751953125, 0.3313446044921875, 0.35872650146484375, 0.3861083984375, 0.41349029541015625, 0.4408721923828125, 0.46825408935546875, 0.495635986328125, 0.5230178833007812, 0.5503997802734375, 0.5777816772460938, 0.60516357421875, 0.6325454711914062, 0.6599273681640625, 0.6873092651367188, 0.714691162109375, 0.7420730590820312, 0.7694549560546875, 0.7968368530273438, 0.82421875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 2.0, 5.0, 5.0, 5.0, 4.0, 8.0, 24.0, 16.0, 39.0, 45.0, 62.0, 109.0, 165.0, 311.0, 530.0, 1285.0, 3458.0, 12932.0, 67685.0, 468751.0, 415751.0, 59696.0, 11776.0, 3308.0, 1269.0, 588.0, 289.0, 149.0, 85.0, 58.0, 45.0, 27.0, 22.0, 10.0, 9.0, 13.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.74267578125, -0.721435546875, -0.7001953125, -0.678955078125, -0.65771484375, -0.636474609375, -0.615234375, -0.593994140625, -0.57275390625, -0.551513671875, -0.5302734375, -0.509033203125, -0.48779296875, -0.466552734375, -0.4453125, -0.424072265625, -0.40283203125, -0.381591796875, -0.3603515625, -0.339111328125, -0.31787109375, -0.296630859375, -0.275390625, -0.254150390625, -0.23291015625, -0.211669921875, -0.1904296875, -0.169189453125, -0.14794921875, -0.126708984375, -0.10546875, -0.084228515625, -0.06298828125, -0.041748046875, -0.0205078125, 0.000732421875, 0.02197265625, 0.043212890625, 0.064453125, 0.085693359375, 0.10693359375, 0.128173828125, 0.1494140625, 0.170654296875, 0.19189453125, 0.213134765625, 0.234375, 0.255615234375, 0.27685546875, 0.298095703125, 0.3193359375, 0.340576171875, 0.36181640625, 0.383056640625, 0.404296875, 0.425537109375, 0.44677734375, 0.468017578125, 0.4892578125, 0.510498046875, 0.53173828125, 0.552978515625, 0.57421875, 0.595458984375, 0.61669921875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 9.0, 6.0, 14.0, 13.0, 12.0, 21.0, 26.0, 21.0, 30.0, 37.0, 33.0, 38.0, 39.0, 55.0, 43.0, 56.0, 45.0, 63.0, 51.0, 48.0, 48.0, 37.0, 41.0, 41.0, 26.0, 25.0, 23.0, 27.0, 11.0, 13.0, 11.0, 7.0, 4.0, 4.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7880859375, -1.7361602783203125, -1.684234619140625, -1.6323089599609375, -1.58038330078125, -1.5284576416015625, -1.476531982421875, -1.4246063232421875, -1.3726806640625, -1.3207550048828125, -1.268829345703125, -1.2169036865234375, -1.16497802734375, -1.1130523681640625, -1.061126708984375, -1.0092010498046875, -0.957275390625, -0.9053497314453125, -0.853424072265625, -0.8014984130859375, -0.74957275390625, -0.6976470947265625, -0.645721435546875, -0.5937957763671875, -0.5418701171875, -0.4899444580078125, -0.438018798828125, -0.3860931396484375, -0.33416748046875, -0.2822418212890625, -0.230316162109375, -0.1783905029296875, -0.12646484375, -0.0745391845703125, -0.022613525390625, 0.0293121337890625, 0.08123779296875, 0.1331634521484375, 0.185089111328125, 0.2370147705078125, 0.2889404296875, 0.3408660888671875, 0.392791748046875, 0.4447174072265625, 0.49664306640625, 0.5485687255859375, 0.600494384765625, 0.6524200439453125, 0.704345703125, 0.7562713623046875, 0.808197021484375, 0.8601226806640625, 0.91204833984375, 0.9639739990234375, 1.015899658203125, 1.0678253173828125, 1.1197509765625, 1.1716766357421875, 1.223602294921875, 1.2755279541015625, 1.32745361328125, 1.3793792724609375, 1.431304931640625, 1.4832305908203125, 1.53515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 10.0, 10.0, 25.0, 41.0, 67.0, 106.0, 191.0, 352.0, 584.0, 1355.0, 3377.0, 10368.0, 51659.0, 564475.0, 366968.0, 35803.0, 8115.0, 2700.0, 1158.0, 558.0, 240.0, 152.0, 101.0, 45.0, 22.0, 20.0, 21.0, 16.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2276611328125, -0.2181377410888672, -0.20861434936523438, -0.19909095764160156, -0.18956756591796875, -0.18004417419433594, -0.17052078247070312, -0.1609973907470703, -0.1514739990234375, -0.1419506072998047, -0.13242721557617188, -0.12290382385253906, -0.11338043212890625, -0.10385704040527344, -0.09433364868164062, -0.08481025695800781, -0.075286865234375, -0.06576347351074219, -0.056240081787109375, -0.04671669006347656, -0.03719329833984375, -0.027669906616210938, -0.018146514892578125, -0.008623123168945312, 0.0009002685546875, 0.010423660278320312, 0.019947052001953125, 0.029470443725585938, 0.03899383544921875, 0.04851722717285156, 0.058040618896484375, 0.06756401062011719, 0.07708740234375, 0.08661079406738281, 0.09613418579101562, 0.10565757751464844, 0.11518096923828125, 0.12470436096191406, 0.13422775268554688, 0.1437511444091797, 0.1532745361328125, 0.1627979278564453, 0.17232131958007812, 0.18184471130371094, 0.19136810302734375, 0.20089149475097656, 0.21041488647460938, 0.2199382781982422, 0.229461669921875, 0.2389850616455078, 0.24850845336914062, 0.25803184509277344, 0.26755523681640625, 0.27707862854003906, 0.2866020202636719, 0.2961254119873047, 0.3056488037109375, 0.3151721954345703, 0.3246955871582031, 0.33421897888183594, 0.34374237060546875, 0.35326576232910156, 0.3627891540527344, 0.3723125457763672, 0.3818359375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 11.0, 12.0, 18.0, 43.0, 81.0, 186.0, 288.0, 189.0, 99.0, 33.0, 19.0, 9.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022745132446289062, -0.00021579116582870483, -0.00020413100719451904, -0.00019247084856033325, -0.00018081068992614746, -0.00016915053129196167, -0.00015749037265777588, -0.0001458302140235901, -0.0001341700553894043, -0.0001225098967552185, -0.00011084973812103271, -9.918957948684692e-05, -8.752942085266113e-05, -7.586926221847534e-05, -6.420910358428955e-05, -5.254894495010376e-05, -4.088878631591797e-05, -2.9228627681732178e-05, -1.7568469047546387e-05, -5.908310413360596e-06, 5.751848220825195e-06, 1.7412006855010986e-05, 2.9072165489196777e-05, 4.073232412338257e-05, 5.239248275756836e-05, 6.405264139175415e-05, 7.571280002593994e-05, 8.737295866012573e-05, 9.903311729431152e-05, 0.00011069327592849731, 0.0001223534345626831, 0.0001340135931968689, 0.0001456737518310547, 0.00015733391046524048, 0.00016899406909942627, 0.00018065422773361206, 0.00019231438636779785, 0.00020397454500198364, 0.00021563470363616943, 0.00022729486227035522, 0.00023895502090454102, 0.0002506151795387268, 0.0002622753381729126, 0.0002739354968070984, 0.0002855956554412842, 0.00029725581407546997, 0.00030891597270965576, 0.00032057613134384155, 0.00033223628997802734, 0.00034389644861221313, 0.0003555566072463989, 0.0003672167658805847, 0.0003788769245147705, 0.0003905370831489563, 0.0004021972417831421, 0.0004138574004173279, 0.00042551755905151367, 0.00043717771768569946, 0.00044883787631988525, 0.00046049803495407104, 0.00047215819358825684, 0.0004838183522224426, 0.0004954785108566284, 0.0005071386694908142, 0.000518798828125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 15.0, 19.0, 40.0, 112.0, 465.0, 4218.0, 699104.0, 340836.0, 3137.0, 377.0, 108.0, 43.0, 20.0, 12.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.0385589599609375, -1.003875732421875, -0.9691925048828125, -0.93450927734375, -0.8998260498046875, -0.865142822265625, -0.8304595947265625, -0.7957763671875, -0.7610931396484375, -0.726409912109375, -0.6917266845703125, -0.65704345703125, -0.6223602294921875, -0.587677001953125, -0.5529937744140625, -0.518310546875, -0.4836273193359375, -0.448944091796875, -0.4142608642578125, -0.37957763671875, -0.3448944091796875, -0.310211181640625, -0.2755279541015625, -0.2408447265625, -0.2061614990234375, -0.171478271484375, -0.1367950439453125, -0.10211181640625, -0.0674285888671875, -0.032745361328125, 0.0019378662109375, 0.03662109375, 0.0713043212890625, 0.105987548828125, 0.1406707763671875, 0.17535400390625, 0.2100372314453125, 0.244720458984375, 0.2794036865234375, 0.3140869140625, 0.3487701416015625, 0.383453369140625, 0.4181365966796875, 0.45281982421875, 0.4875030517578125, 0.522186279296875, 0.5568695068359375, 0.591552734375, 0.6262359619140625, 0.660919189453125, 0.6956024169921875, 0.73028564453125, 0.7649688720703125, 0.799652099609375, 0.8343353271484375, 0.8690185546875, 0.9037017822265625, 0.938385009765625, 0.9730682373046875, 1.00775146484375, 1.0424346923828125, 1.077117919921875, 1.1118011474609375, 1.146484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 6.0, 9.0, 6.0, 15.0, 16.0, 20.0, 28.0, 27.0, 25.0, 44.0, 48.0, 63.0, 65.0, 74.0, 75.0, 70.0, 83.0, 70.0, 53.0, 53.0, 32.0, 29.0, 19.0, 11.0, 9.0, 10.0, 13.0, 4.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0469970703125, -0.045290470123291016, -0.04358386993408203, -0.04187726974487305, -0.04017066955566406, -0.03846406936645508, -0.036757469177246094, -0.03505086898803711, -0.033344268798828125, -0.03163766860961914, -0.029931068420410156, -0.028224468231201172, -0.026517868041992188, -0.024811267852783203, -0.02310466766357422, -0.021398067474365234, -0.01969146728515625, -0.017984867095947266, -0.01627826690673828, -0.014571666717529297, -0.012865066528320312, -0.011158466339111328, -0.009451866149902344, -0.007745265960693359, -0.006038665771484375, -0.004332065582275391, -0.0026254653930664062, -0.0009188652038574219, 0.0007877349853515625, 0.002494335174560547, 0.004200935363769531, 0.005907535552978516, 0.0076141357421875, 0.009320735931396484, 0.011027336120605469, 0.012733936309814453, 0.014440536499023438, 0.016147136688232422, 0.017853736877441406, 0.01956033706665039, 0.021266937255859375, 0.02297353744506836, 0.024680137634277344, 0.026386737823486328, 0.028093338012695312, 0.029799938201904297, 0.03150653839111328, 0.033213138580322266, 0.03491973876953125, 0.036626338958740234, 0.03833293914794922, 0.0400395393371582, 0.04174613952636719, 0.04345273971557617, 0.045159339904785156, 0.04686594009399414, 0.048572540283203125, 0.05027914047241211, 0.051985740661621094, 0.05369234085083008, 0.05539894104003906, 0.05710554122924805, 0.05881214141845703, 0.060518741607666016, 0.062225341796875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 10.0, 8.0, 21.0, 32.0, 46.0, 62.0, 104.0, 144.0, 188.0, 129.0, 99.0, 57.0, 45.0, 24.0, 13.0, 11.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.45290207862854, -2.3934848308563232, -2.3340675830841064, -2.2746503353118896, -2.215233087539673, -2.155815839767456, -2.0963985919952393, -2.0369813442230225, -1.9775640964508057, -1.9181468486785889, -1.858729600906372, -1.7993123531341553, -1.7398951053619385, -1.6804778575897217, -1.6210606098175049, -1.561643362045288, -1.5022261142730713, -1.4428088665008545, -1.3833916187286377, -1.323974370956421, -1.264557123184204, -1.2051398754119873, -1.1457226276397705, -1.0863053798675537, -1.026888132095337, -0.9674708843231201, -0.9080536365509033, -0.8486363887786865, -0.7892191410064697, -0.7298018932342529, -0.6703846454620361, -0.6109673976898193, -0.551550030708313, -0.4921327829360962, -0.4327155351638794, -0.3732982873916626, -0.3138810396194458, -0.254463791847229, -0.1950465440750122, -0.1356292963027954, -0.07621204853057861, -0.016794800758361816, 0.04262244701385498, 0.10203969478607178, 0.16145694255828857, 0.22087419033050537, 0.28029143810272217, 0.33970868587493896, 0.39912593364715576, 0.45854318141937256, 0.5179604291915894, 0.5773776769638062, 0.636794924736023, 0.6962121725082397, 0.7556294202804565, 0.8150466680526733, 0.8744639158248901, 0.9338811635971069, 0.9932984113693237, 1.0527156591415405, 1.1121329069137573, 1.1715501546859741, 1.230967402458191, 1.2903846502304077, 1.3498018980026245]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 8.0, 7.0, 9.0, 8.0, 12.0, 11.0, 18.0, 15.0, 19.0, 29.0, 19.0, 35.0, 19.0, 35.0, 40.0, 34.0, 57.0, 45.0, 44.0, 56.0, 47.0, 59.0, 43.0, 41.0, 48.0, 26.0, 31.0, 26.0, 23.0, 33.0, 16.0, 20.0, 16.0, 10.0, 8.0, 5.0, 5.0, 5.0, 5.0, 2.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7331885695457458, -0.7101259231567383, -0.6870633363723755, -0.6640006899833679, -0.6409380435943604, -0.6178753972053528, -0.5948127508163452, -0.5717501640319824, -0.5486875176429749, -0.5256248712539673, -0.5025622844696045, -0.4794996380805969, -0.45643699169158936, -0.4333743453025818, -0.4103117287158966, -0.3872491121292114, -0.36418646574020386, -0.3411238193511963, -0.3180612027645111, -0.2949985861778259, -0.27193593978881836, -0.24887330830097198, -0.2258106768131256, -0.20274804532527924, -0.17968541383743286, -0.1566227823495865, -0.1335601508617401, -0.11049751937389374, -0.08743488788604736, -0.06437225639820099, -0.041309624910354614, -0.01824699342250824, 0.00481569766998291, 0.027878329157829285, 0.05094096064567566, 0.07400359213352203, 0.09706622362136841, 0.12012885510921478, 0.14319148659706116, 0.16625411808490753, 0.1893167495727539, 0.21237938106060028, 0.23544201254844666, 0.25850462913513184, 0.2815672755241394, 0.304629921913147, 0.32769253849983215, 0.35075515508651733, 0.3738178014755249, 0.39688044786453247, 0.41994306445121765, 0.44300568103790283, 0.4660683274269104, 0.48913097381591797, 0.5121935606002808, 0.5352562069892883, 0.5583188533782959, 0.5813814997673035, 0.604444146156311, 0.6275067329406738, 0.6505693793296814, 0.673632025718689, 0.6966946125030518, 0.7197572588920593, 0.7428199052810669]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 13.0, 17.0, 26.0, 39.0, 42.0, 66.0, 106.0, 127.0, 201.0, 297.0, 506.0, 772.0, 1166.0, 2174.0, 3655.0, 6884.0, 14009.0, 30914.0, 86738.0, 313887.0, 398481.0, 114844.0, 38481.0, 16474.0, 8035.0, 4325.0, 2353.0, 1498.0, 883.0, 535.0, 347.0, 199.0, 131.0, 93.0, 65.0, 41.0, 34.0, 23.0, 20.0, 9.0, 10.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.57958984375, -0.5620880126953125, -0.544586181640625, -0.5270843505859375, -0.50958251953125, -0.4920806884765625, -0.474578857421875, -0.4570770263671875, -0.4395751953125, -0.4220733642578125, -0.404571533203125, -0.3870697021484375, -0.36956787109375, -0.3520660400390625, -0.334564208984375, -0.3170623779296875, -0.299560546875, -0.2820587158203125, -0.264556884765625, -0.2470550537109375, -0.22955322265625, -0.2120513916015625, -0.194549560546875, -0.1770477294921875, -0.1595458984375, -0.1420440673828125, -0.124542236328125, -0.1070404052734375, -0.08953857421875, -0.0720367431640625, -0.054534912109375, -0.0370330810546875, -0.01953125, -0.0020294189453125, 0.015472412109375, 0.0329742431640625, 0.05047607421875, 0.0679779052734375, 0.085479736328125, 0.1029815673828125, 0.1204833984375, 0.1379852294921875, 0.155487060546875, 0.1729888916015625, 0.19049072265625, 0.2079925537109375, 0.225494384765625, 0.2429962158203125, 0.260498046875, 0.2779998779296875, 0.295501708984375, 0.3130035400390625, 0.33050537109375, 0.3480072021484375, 0.365509033203125, 0.3830108642578125, 0.4005126953125, 0.4180145263671875, 0.435516357421875, 0.4530181884765625, 0.47052001953125, 0.4880218505859375, 0.505523681640625, 0.5230255126953125, 0.54052734375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 7.0, 1.0, 2.0, 6.0, 8.0, 8.0, 8.0, 10.0, 11.0, 15.0, 18.0, 13.0, 22.0, 30.0, 38.0, 27.0, 43.0, 45.0, 47.0, 45.0, 52.0, 43.0, 47.0, 41.0, 56.0, 44.0, 33.0, 45.0, 40.0, 34.0, 23.0, 18.0, 18.0, 14.0, 17.0, 15.0, 10.0, 3.0, 10.0, 7.0, 11.0, 4.0, 5.0, 5.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.7255859375, -1.670196533203125, -1.61480712890625, -1.559417724609375, -1.5040283203125, -1.448638916015625, -1.39324951171875, -1.337860107421875, -1.282470703125, -1.227081298828125, -1.17169189453125, -1.116302490234375, -1.0609130859375, -1.005523681640625, -0.95013427734375, -0.894744873046875, -0.83935546875, -0.783966064453125, -0.72857666015625, -0.673187255859375, -0.6177978515625, -0.562408447265625, -0.50701904296875, -0.451629638671875, -0.396240234375, -0.340850830078125, -0.28546142578125, -0.230072021484375, -0.1746826171875, -0.119293212890625, -0.06390380859375, -0.008514404296875, 0.046875, 0.102264404296875, 0.15765380859375, 0.213043212890625, 0.2684326171875, 0.323822021484375, 0.37921142578125, 0.434600830078125, 0.489990234375, 0.545379638671875, 0.60076904296875, 0.656158447265625, 0.7115478515625, 0.766937255859375, 0.82232666015625, 0.877716064453125, 0.93310546875, 0.988494873046875, 1.04388427734375, 1.099273681640625, 1.1546630859375, 1.210052490234375, 1.26544189453125, 1.320831298828125, 1.376220703125, 1.431610107421875, 1.48699951171875, 1.542388916015625, 1.5977783203125, 1.653167724609375, 1.70855712890625, 1.763946533203125, 1.8193359375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 5.0, 5.0, 6.0, 12.0, 21.0, 24.0, 39.0, 56.0, 71.0, 94.0, 193.0, 1024771.0, 22784.0, 146.0, 96.0, 70.0, 44.0, 40.0, 19.0, 12.0, 6.0, 6.0, 7.0, 5.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.953125, -16.48095703125, -16.0087890625, -15.53662109375, -15.064453125, -14.59228515625, -14.1201171875, -13.64794921875, -13.17578125, -12.70361328125, -12.2314453125, -11.75927734375, -11.287109375, -10.81494140625, -10.3427734375, -9.87060546875, -9.3984375, -8.92626953125, -8.4541015625, -7.98193359375, -7.509765625, -7.03759765625, -6.5654296875, -6.09326171875, -5.62109375, -5.14892578125, -4.6767578125, -4.20458984375, -3.732421875, -3.26025390625, -2.7880859375, -2.31591796875, -1.84375, -1.37158203125, -0.8994140625, -0.42724609375, 0.044921875, 0.51708984375, 0.9892578125, 1.46142578125, 1.93359375, 2.40576171875, 2.8779296875, 3.35009765625, 3.822265625, 4.29443359375, 4.7666015625, 5.23876953125, 5.7109375, 6.18310546875, 6.6552734375, 7.12744140625, 7.599609375, 8.07177734375, 8.5439453125, 9.01611328125, 9.48828125, 9.96044921875, 10.4326171875, 10.90478515625, 11.376953125, 11.84912109375, 12.3212890625, 12.79345703125, 13.265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 6.0, 7.0, 6.0, 9.0, 23.0, 28.0, 30.0, 61.0, 71.0, 77.0, 92.0, 92.0, 83.0, 95.0, 95.0, 59.0, 44.0, 43.0, 19.0, 13.0, 8.0, 7.0, 5.0, 6.0, 3.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.97265625, -4.834197998046875, -4.69573974609375, -4.557281494140625, -4.4188232421875, -4.280364990234375, -4.14190673828125, -4.003448486328125, -3.864990234375, -3.726531982421875, -3.58807373046875, -3.449615478515625, -3.3111572265625, -3.172698974609375, -3.03424072265625, -2.895782470703125, -2.75732421875, -2.618865966796875, -2.48040771484375, -2.341949462890625, -2.2034912109375, -2.065032958984375, -1.92657470703125, -1.788116455078125, -1.649658203125, -1.511199951171875, -1.37274169921875, -1.234283447265625, -1.0958251953125, -0.957366943359375, -0.81890869140625, -0.680450439453125, -0.5419921875, -0.403533935546875, -0.26507568359375, -0.126617431640625, 0.0118408203125, 0.150299072265625, 0.28875732421875, 0.427215576171875, 0.565673828125, 0.704132080078125, 0.84259033203125, 0.981048583984375, 1.1195068359375, 1.257965087890625, 1.39642333984375, 1.534881591796875, 1.67333984375, 1.811798095703125, 1.95025634765625, 2.088714599609375, 2.2271728515625, 2.365631103515625, 2.50408935546875, 2.642547607421875, 2.781005859375, 2.919464111328125, 3.05792236328125, 3.196380615234375, 3.3348388671875, 3.473297119140625, 3.61175537109375, 3.750213623046875, 3.888671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 10.0, 8.0, 17.0, 26.0, 39.0, 96.0, 276.0, 1188.0, 14444.0, 968470.0, 60976.0, 2268.0, 438.0, 134.0, 62.0, 39.0, 26.0, 12.0, 10.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2685546875, -1.23736572265625, -1.2061767578125, -1.17498779296875, -1.143798828125, -1.11260986328125, -1.0814208984375, -1.05023193359375, -1.01904296875, -0.98785400390625, -0.9566650390625, -0.92547607421875, -0.894287109375, -0.86309814453125, -0.8319091796875, -0.80072021484375, -0.76953125, -0.73834228515625, -0.7071533203125, -0.67596435546875, -0.644775390625, -0.61358642578125, -0.5823974609375, -0.55120849609375, -0.52001953125, -0.48883056640625, -0.4576416015625, -0.42645263671875, -0.395263671875, -0.36407470703125, -0.3328857421875, -0.30169677734375, -0.2705078125, -0.23931884765625, -0.2081298828125, -0.17694091796875, -0.145751953125, -0.11456298828125, -0.0833740234375, -0.05218505859375, -0.02099609375, 0.01019287109375, 0.0413818359375, 0.07257080078125, 0.103759765625, 0.13494873046875, 0.1661376953125, 0.19732666015625, 0.228515625, 0.25970458984375, 0.2908935546875, 0.32208251953125, 0.353271484375, 0.38446044921875, 0.4156494140625, 0.44683837890625, 0.47802734375, 0.50921630859375, 0.5404052734375, 0.57159423828125, 0.602783203125, 0.63397216796875, 0.6651611328125, 0.69635009765625, 0.7275390625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 11.0, 20.0, 25.0, 37.0, 36.0, 69.0, 116.0, 183.0, 145.0, 113.0, 75.0, 51.0, 39.0, 18.0, 13.0, 15.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.208087921142578e-05, -4.032440483570099e-05, -3.8567930459976196e-05, -3.6811456084251404e-05, -3.505498170852661e-05, -3.329850733280182e-05, -3.1542032957077026e-05, -2.9785558581352234e-05, -2.802908420562744e-05, -2.627260982990265e-05, -2.4516135454177856e-05, -2.2759661078453064e-05, -2.100318670272827e-05, -1.924671232700348e-05, -1.7490237951278687e-05, -1.5733763575553894e-05, -1.3977289199829102e-05, -1.2220814824104309e-05, -1.0464340448379517e-05, -8.707866072654724e-06, -6.951391696929932e-06, -5.194917321205139e-06, -3.4384429454803467e-06, -1.6819685697555542e-06, 7.450580596923828e-08, 1.8309801816940308e-06, 3.5874545574188232e-06, 5.343928933143616e-06, 7.100403308868408e-06, 8.8568776845932e-06, 1.0613352060317993e-05, 1.2369826436042786e-05, 1.4126300811767578e-05, 1.588277518749237e-05, 1.7639249563217163e-05, 1.9395723938941956e-05, 2.1152198314666748e-05, 2.290867269039154e-05, 2.4665147066116333e-05, 2.6421621441841125e-05, 2.8178095817565918e-05, 2.993457019329071e-05, 3.16910445690155e-05, 3.3447518944740295e-05, 3.520399332046509e-05, 3.696046769618988e-05, 3.871694207191467e-05, 4.0473416447639465e-05, 4.222989082336426e-05, 4.398636519908905e-05, 4.574283957481384e-05, 4.7499313950538635e-05, 4.925578832626343e-05, 5.101226270198822e-05, 5.276873707771301e-05, 5.4525211453437805e-05, 5.62816858291626e-05, 5.803816020488739e-05, 5.979463458061218e-05, 6.155110895633698e-05, 6.330758333206177e-05, 6.506405770778656e-05, 6.682053208351135e-05, 6.857700645923615e-05, 7.033348083496094e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 14.0, 32.0, 44.0, 61.0, 188.0, 626.0, 4327.0, 100779.0, 920927.0, 19218.0, 1683.0, 361.0, 129.0, 54.0, 30.0, 18.0, 14.0, 11.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73583984375, -0.7107086181640625, -0.685577392578125, -0.6604461669921875, -0.63531494140625, -0.6101837158203125, -0.585052490234375, -0.5599212646484375, -0.5347900390625, -0.5096588134765625, -0.484527587890625, -0.4593963623046875, -0.43426513671875, -0.4091339111328125, -0.384002685546875, -0.3588714599609375, -0.333740234375, -0.3086090087890625, -0.283477783203125, -0.2583465576171875, -0.23321533203125, -0.2080841064453125, -0.182952880859375, -0.1578216552734375, -0.1326904296875, -0.1075592041015625, -0.082427978515625, -0.0572967529296875, -0.03216552734375, -0.0070343017578125, 0.018096923828125, 0.0432281494140625, 0.068359375, 0.0934906005859375, 0.118621826171875, 0.1437530517578125, 0.16888427734375, 0.1940155029296875, 0.219146728515625, 0.2442779541015625, 0.2694091796875, 0.2945404052734375, 0.319671630859375, 0.3448028564453125, 0.36993408203125, 0.3950653076171875, 0.420196533203125, 0.4453277587890625, 0.470458984375, 0.4955902099609375, 0.520721435546875, 0.5458526611328125, 0.57098388671875, 0.5961151123046875, 0.621246337890625, 0.6463775634765625, 0.6715087890625, 0.6966400146484375, 0.721771240234375, 0.7469024658203125, 0.77203369140625, 0.7971649169921875, 0.822296142578125, 0.8474273681640625, 0.87255859375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 4.0, 9.0, 16.0, 37.0, 44.0, 56.0, 67.0, 109.0, 191.0, 152.0, 80.0, 63.0, 47.0, 29.0, 20.0, 18.0, 13.0, 9.0, 5.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1270751953125, -0.12216377258300781, -0.11725234985351562, -0.11234092712402344, -0.10742950439453125, -0.10251808166503906, -0.09760665893554688, -0.09269523620605469, -0.0877838134765625, -0.08287239074707031, -0.07796096801757812, -0.07304954528808594, -0.06813812255859375, -0.06322669982910156, -0.058315277099609375, -0.05340385437011719, -0.048492431640625, -0.04358100891113281, -0.038669586181640625, -0.03375816345214844, -0.02884674072265625, -0.023935317993164062, -0.019023895263671875, -0.014112472534179688, -0.0092010498046875, -0.0042896270751953125, 0.000621795654296875, 0.0055332183837890625, 0.01044464111328125, 0.015356063842773438, 0.020267486572265625, 0.025178909301757812, 0.03009033203125, 0.03500175476074219, 0.039913177490234375, 0.04482460021972656, 0.04973602294921875, 0.05464744567871094, 0.059558868408203125, 0.06447029113769531, 0.0693817138671875, 0.07429313659667969, 0.07920455932617188, 0.08411598205566406, 0.08902740478515625, 0.09393882751464844, 0.09885025024414062, 0.10376167297363281, 0.108673095703125, 0.11358451843261719, 0.11849594116210938, 0.12340736389160156, 0.12831878662109375, 0.13323020935058594, 0.13814163208007812, 0.1430530548095703, 0.1479644775390625, 0.1528759002685547, 0.15778732299804688, 0.16269874572753906, 0.16761016845703125, 0.17252159118652344, 0.17743301391601562, 0.1823444366455078, 0.187255859375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 128.0, 671.0, 194.0, 14.0, 4.0], "bins": [-36.07221603393555, -35.4766731262207, -34.88113021850586, -34.28559112548828, -33.69004821777344, -33.094505310058594, -32.49896240234375, -31.90342140197754, -31.307878494262695, -30.71233558654785, -30.11679458618164, -29.521251678466797, -28.925710678100586, -28.330167770385742, -27.73462677001953, -27.139083862304688, -26.543540954589844, -25.947998046875, -25.35245704650879, -24.756914138793945, -24.161373138427734, -23.56583023071289, -22.970287322998047, -22.374746322631836, -21.779205322265625, -21.18366241455078, -20.58812141418457, -19.992578506469727, -19.397037506103516, -18.801494598388672, -18.205951690673828, -17.610410690307617, -17.014869689941406, -16.419326782226562, -15.823785781860352, -15.228242874145508, -14.63270092010498, -14.037158966064453, -13.441617012023926, -12.846075057983398, -12.250532150268555, -11.654990196228027, -11.0594482421875, -10.463905334472656, -9.868363380432129, -9.272821426391602, -8.677279472351074, -8.081737518310547, -7.4861955642700195, -6.890653610229492, -6.295111179351807, -5.699569225311279, -5.104026794433594, -4.508484840393066, -3.912942886352539, -3.3174004554748535, -2.721858263015747, -2.1263160705566406, -1.5307739973068237, -0.9352319240570068, -0.3396897315979004, 0.25585246086120605, 0.8513944149017334, 1.446936845779419, 2.0424787998199463]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 6.0, 5.0, 8.0, 7.0, 12.0, 11.0, 19.0, 19.0, 10.0, 18.0, 27.0, 21.0, 22.0, 39.0, 31.0, 19.0, 41.0, 34.0, 35.0, 27.0, 33.0, 50.0, 31.0, 42.0, 39.0, 40.0, 47.0, 28.0, 36.0, 25.0, 23.0, 21.0, 18.0, 24.0, 12.0, 19.0, 14.0, 13.0, 12.0, 14.0, 9.0, 4.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-2.6988320350646973, -2.620100736618042, -2.541369676589966, -2.4626383781433105, -2.3839070796966553, -2.30517578125, -2.226444721221924, -2.1477134227752686, -2.0689821243286133, -1.9902509450912476, -1.9115196466445923, -1.8327884674072266, -1.7540571689605713, -1.6753259897232056, -1.5965948104858398, -1.5178635120391846, -1.4391324520111084, -1.3604012727737427, -1.2816699743270874, -1.2029387950897217, -1.1242074966430664, -1.0454763174057007, -0.966745138168335, -0.8880138993263245, -0.809282660484314, -0.7305514216423035, -0.651820182800293, -0.5730890035629272, -0.49435776472091675, -0.41562652587890625, -0.33689531683921814, -0.25816410779953003, -0.17943286895751953, -0.10070164501667023, -0.021970421075820923, 0.05676080286502838, 0.13549202680587769, 0.21422326564788818, 0.2929544746875763, 0.3716856837272644, 0.4504169225692749, 0.5291481614112854, 0.6078794002532959, 0.6866105794906616, 0.7653418183326721, 0.8440730571746826, 0.9228042364120483, 1.001535415649414, 1.0802667140960693, 1.158997893333435, 1.2377291917800903, 1.316460371017456, 1.3951916694641113, 1.473922848701477, 1.5526540279388428, 1.631385326385498, 1.7101165056228638, 1.7888476848602295, 1.8675789833068848, 1.9463101625442505, 2.025041341781616, 2.1037726402282715, 2.1825039386749268, 2.261234998703003, 2.339966297149658]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 13.0, 7.0, 10.0, 21.0, 14.0, 15.0, 29.0, 40.0, 69.0, 96.0, 132.0, 255.0, 471.0, 1046.0, 2586.0, 7908.0, 33261.0, 331209.0, 3339103.0, 423268.0, 40519.0, 9119.0, 2937.0, 1039.0, 480.0, 228.0, 123.0, 81.0, 65.0, 30.0, 33.0, 17.0, 19.0, 16.0, 7.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.072265625, -2.006561279296875, -1.94085693359375, -1.875152587890625, -1.8094482421875, -1.743743896484375, -1.67803955078125, -1.612335205078125, -1.546630859375, -1.480926513671875, -1.41522216796875, -1.349517822265625, -1.2838134765625, -1.218109130859375, -1.15240478515625, -1.086700439453125, -1.02099609375, -0.955291748046875, -0.88958740234375, -0.823883056640625, -0.7581787109375, -0.692474365234375, -0.62677001953125, -0.561065673828125, -0.495361328125, -0.429656982421875, -0.36395263671875, -0.298248291015625, -0.2325439453125, -0.166839599609375, -0.10113525390625, -0.035430908203125, 0.0302734375, 0.095977783203125, 0.16168212890625, 0.227386474609375, 0.2930908203125, 0.358795166015625, 0.42449951171875, 0.490203857421875, 0.555908203125, 0.621612548828125, 0.68731689453125, 0.753021240234375, 0.8187255859375, 0.884429931640625, 0.95013427734375, 1.015838623046875, 1.08154296875, 1.147247314453125, 1.21295166015625, 1.278656005859375, 1.3443603515625, 1.410064697265625, 1.47576904296875, 1.541473388671875, 1.607177734375, 1.672882080078125, 1.73858642578125, 1.804290771484375, 1.8699951171875, 1.935699462890625, 2.00140380859375, 2.067108154296875, 2.1328125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 9.0, 14.0, 19.0, 15.0, 18.0, 30.0, 28.0, 30.0, 30.0, 32.0, 44.0, 46.0, 53.0, 51.0, 62.0, 61.0, 60.0, 62.0, 44.0, 31.0, 34.0, 29.0, 35.0, 30.0, 19.0, 25.0, 17.0, 13.0, 13.0, 7.0, 4.0, 7.0, 9.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.984375, -0.9552993774414062, -0.9262237548828125, -0.8971481323242188, -0.868072509765625, -0.8389968872070312, -0.8099212646484375, -0.7808456420898438, -0.75177001953125, -0.7226943969726562, -0.6936187744140625, -0.6645431518554688, -0.635467529296875, -0.6063919067382812, -0.5773162841796875, -0.5482406616210938, -0.5191650390625, -0.49008941650390625, -0.4610137939453125, -0.43193817138671875, -0.402862548828125, -0.37378692626953125, -0.3447113037109375, -0.31563568115234375, -0.28656005859375, -0.25748443603515625, -0.2284088134765625, -0.19933319091796875, -0.170257568359375, -0.14118194580078125, -0.1121063232421875, -0.08303070068359375, -0.053955078125, -0.02487945556640625, 0.0041961669921875, 0.03327178955078125, 0.062347412109375, 0.09142303466796875, 0.1204986572265625, 0.14957427978515625, 0.17864990234375, 0.20772552490234375, 0.2368011474609375, 0.26587677001953125, 0.294952392578125, 0.32402801513671875, 0.3531036376953125, 0.38217926025390625, 0.4112548828125, 0.44033050537109375, 0.4694061279296875, 0.49848175048828125, 0.527557373046875, 0.5566329956054688, 0.5857086181640625, 0.6147842407226562, 0.64385986328125, 0.6729354858398438, 0.7020111083984375, 0.7310867309570312, 0.760162353515625, 0.7892379760742188, 0.8183135986328125, 0.8473892211914062, 0.87646484375]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 4.0, 18.0, 56.0, 246.0, 7085.0, 4184425.0, 2205.0, 171.0, 28.0, 8.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.60009765625, -17.1533203125, -16.70654296875, -16.259765625, -15.81298828125, -15.3662109375, -14.91943359375, -14.47265625, -14.02587890625, -13.5791015625, -13.13232421875, -12.685546875, -12.23876953125, -11.7919921875, -11.34521484375, -10.8984375, -10.45166015625, -10.0048828125, -9.55810546875, -9.111328125, -8.66455078125, -8.2177734375, -7.77099609375, -7.32421875, -6.87744140625, -6.4306640625, -5.98388671875, -5.537109375, -5.09033203125, -4.6435546875, -4.19677734375, -3.75, -3.30322265625, -2.8564453125, -2.40966796875, -1.962890625, -1.51611328125, -1.0693359375, -0.62255859375, -0.17578125, 0.27099609375, 0.7177734375, 1.16455078125, 1.611328125, 2.05810546875, 2.5048828125, 2.95166015625, 3.3984375, 3.84521484375, 4.2919921875, 4.73876953125, 5.185546875, 5.63232421875, 6.0791015625, 6.52587890625, 6.97265625, 7.41943359375, 7.8662109375, 8.31298828125, 8.759765625, 9.20654296875, 9.6533203125, 10.10009765625, 10.546875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 14.0, 5.0, 8.0, 19.0, 32.0, 28.0, 39.0, 53.0, 72.0, 94.0, 129.0, 199.0, 356.0, 496.0, 741.0, 584.0, 335.0, 236.0, 176.0, 125.0, 85.0, 56.0, 49.0, 27.0, 27.0, 25.0, 18.0, 12.0, 4.0, 7.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.453125, -0.4408073425292969, -0.42848968505859375, -0.4161720275878906, -0.4038543701171875, -0.3915367126464844, -0.37921905517578125, -0.3669013977050781, -0.354583740234375, -0.3422660827636719, -0.32994842529296875, -0.3176307678222656, -0.3053131103515625, -0.2929954528808594, -0.28067779541015625, -0.2683601379394531, -0.25604248046875, -0.24372482299804688, -0.23140716552734375, -0.21908950805664062, -0.2067718505859375, -0.19445419311523438, -0.18213653564453125, -0.16981887817382812, -0.157501220703125, -0.14518356323242188, -0.13286590576171875, -0.12054824829101562, -0.1082305908203125, -0.09591293334960938, -0.08359527587890625, -0.07127761840820312, -0.0589599609375, -0.046642303466796875, -0.03432464599609375, -0.022006988525390625, -0.0096893310546875, 0.002628326416015625, 0.01494598388671875, 0.027263641357421875, 0.039581298828125, 0.051898956298828125, 0.06421661376953125, 0.07653427124023438, 0.0888519287109375, 0.10116958618164062, 0.11348724365234375, 0.12580490112304688, 0.13812255859375, 0.15044021606445312, 0.16275787353515625, 0.17507553100585938, 0.1873931884765625, 0.19971084594726562, 0.21202850341796875, 0.22434616088867188, 0.236663818359375, 0.24898147583007812, 0.26129913330078125, 0.2736167907714844, 0.2859344482421875, 0.2982521057128906, 0.31056976318359375, 0.3228874206542969, 0.335205078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 4.0, 6.0, 21.0, 23.0, 25.0, 40.0, 56.0, 71.0, 93.0, 116.0, 109.0, 108.0, 91.0, 59.0, 53.0, 38.0, 19.0, 18.0, 11.0, 7.0, 8.0, 6.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7822902202606201, -1.7193857431411743, -1.656481146812439, -1.5935766696929932, -1.5306720733642578, -1.467767596244812, -1.4048631191253662, -1.3419585227966309, -1.2790539264678955, -1.2161494493484497, -1.1532448530197144, -1.0903403759002686, -1.0274357795715332, -0.9645313024520874, -0.9016267657279968, -0.8387222290039062, -0.7758177518844604, -0.7129132151603699, -0.6500086784362793, -0.5871042013168335, -0.5241996049880981, -0.46129509806632996, -0.39839059114456177, -0.3354860544204712, -0.2725815176963806, -0.20967698097229004, -0.14677245914936066, -0.08386793732643127, -0.020963400602340698, 0.04194113612174988, 0.10484564304351807, 0.16775017976760864, 0.23065471649169922, 0.2935592532157898, 0.35646378993988037, 0.41936829686164856, 0.48227283358573914, 0.5451773405075073, 0.6080818772315979, 0.6709864139556885, 0.733890950679779, 0.7967954874038696, 0.8597000241279602, 0.9226045608520508, 0.9855090379714966, 1.048413634300232, 1.1113181114196777, 1.174222707748413, 1.2371271848678589, 1.3000316619873047, 1.36293625831604, 1.4258407354354858, 1.4887453317642212, 1.551649808883667, 1.6145544052124023, 1.6774588823318481, 1.740363359451294, 1.8032678365707397, 1.866172432899475, 1.929076910018921, 1.9919815063476562, 2.0548861026763916, 2.117790460586548, 2.180695056915283, 2.2435996532440186]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 11.0, 9.0, 11.0, 12.0, 20.0, 12.0, 17.0, 23.0, 28.0, 38.0, 43.0, 35.0, 40.0, 44.0, 47.0, 42.0, 44.0, 60.0, 59.0, 47.0, 52.0, 48.0, 34.0, 41.0, 36.0, 26.0, 30.0, 19.0, 25.0, 14.0, 11.0, 6.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1745353937149048, -1.138534426689148, -1.1025334596633911, -1.0665324926376343, -1.0305315256118774, -0.9945304989814758, -0.958529531955719, -0.9225285053253174, -0.8865275382995605, -0.8505265712738037, -0.8145256042480469, -0.77852463722229, -0.7425236105918884, -0.7065226435661316, -0.6705216765403748, -0.6345206499099731, -0.5985197424888611, -0.5625187754631042, -0.5265178084373474, -0.4905168116092682, -0.45451581478118896, -0.41851484775543213, -0.3825138807296753, -0.34651288390159607, -0.31051191687583923, -0.2745109498500824, -0.23850995302200317, -0.20250898599624634, -0.1665080040693283, -0.13050702214241028, -0.09450605511665344, -0.05850505828857422, -0.022504091262817383, 0.013496886938810349, 0.04949786514043808, 0.08549883961677551, 0.12149982154369354, 0.15750080347061157, 0.1935017704963684, 0.22950276732444763, 0.26550373435020447, 0.3015047013759613, 0.3375056982040405, 0.37350666522979736, 0.4095076322555542, 0.4455086290836334, 0.48150959610939026, 0.5175105929374695, 0.5535115599632263, 0.5895125269889832, 0.62551349401474, 0.6615145206451416, 0.6975154876708984, 0.7335164546966553, 0.7695174217224121, 0.805518388748169, 0.8415193557739258, 0.8775203227996826, 0.9135212898254395, 0.9495222568511963, 0.9855232834815979, 1.02152419090271, 1.0575251579284668, 1.0935262441635132, 1.12952721118927]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 12.0, 24.0, 28.0, 50.0, 115.0, 222.0, 497.0, 1346.0, 3968.0, 14869.0, 82939.0, 535095.0, 347709.0, 47263.0, 9637.0, 2938.0, 1034.0, 402.0, 180.0, 85.0, 44.0, 37.0, 15.0, 11.0, 8.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.826171875, -0.8024673461914062, -0.7787628173828125, -0.7550582885742188, -0.731353759765625, -0.7076492309570312, -0.6839447021484375, -0.6602401733398438, -0.63653564453125, -0.6128311157226562, -0.5891265869140625, -0.5654220581054688, -0.541717529296875, -0.5180130004882812, -0.4943084716796875, -0.47060394287109375, -0.4468994140625, -0.42319488525390625, -0.3994903564453125, -0.37578582763671875, -0.352081298828125, -0.32837677001953125, -0.3046722412109375, -0.28096771240234375, -0.25726318359375, -0.23355865478515625, -0.2098541259765625, -0.18614959716796875, -0.162445068359375, -0.13874053955078125, -0.1150360107421875, -0.09133148193359375, -0.067626953125, -0.04392242431640625, -0.0202178955078125, 0.00348663330078125, 0.027191162109375, 0.05089569091796875, 0.0746002197265625, 0.09830474853515625, 0.12200927734375, 0.14571380615234375, 0.1694183349609375, 0.19312286376953125, 0.216827392578125, 0.24053192138671875, 0.2642364501953125, 0.28794097900390625, 0.3116455078125, 0.33535003662109375, 0.3590545654296875, 0.38275909423828125, 0.406463623046875, 0.43016815185546875, 0.4538726806640625, 0.47757720947265625, 0.50128173828125, 0.5249862670898438, 0.5486907958984375, 0.5723953247070312, 0.596099853515625, 0.6198043823242188, 0.6435089111328125, 0.6672134399414062, 0.69091796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 11.0, 12.0, 26.0, 27.0, 39.0, 42.0, 60.0, 72.0, 83.0, 88.0, 81.0, 81.0, 78.0, 81.0, 56.0, 46.0, 33.0, 27.0, 28.0, 14.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4697265625, -1.4333724975585938, -1.3970184326171875, -1.3606643676757812, -1.324310302734375, -1.2879562377929688, -1.2516021728515625, -1.2152481079101562, -1.17889404296875, -1.1425399780273438, -1.1061859130859375, -1.0698318481445312, -1.033477783203125, -0.9971237182617188, -0.9607696533203125, -0.9244155883789062, -0.8880615234375, -0.8517074584960938, -0.8153533935546875, -0.7789993286132812, -0.742645263671875, -0.7062911987304688, -0.6699371337890625, -0.6335830688476562, -0.59722900390625, -0.5608749389648438, -0.5245208740234375, -0.48816680908203125, -0.451812744140625, -0.41545867919921875, -0.3791046142578125, -0.34275054931640625, -0.306396484375, -0.27004241943359375, -0.2336883544921875, -0.19733428955078125, -0.160980224609375, -0.12462615966796875, -0.0882720947265625, -0.05191802978515625, -0.01556396484375, 0.02079010009765625, 0.0571441650390625, 0.09349822998046875, 0.129852294921875, 0.16620635986328125, 0.2025604248046875, 0.23891448974609375, 0.2752685546875, 0.31162261962890625, 0.3479766845703125, 0.38433074951171875, 0.420684814453125, 0.45703887939453125, 0.4933929443359375, 0.5297470092773438, 0.56610107421875, 0.6024551391601562, 0.6388092041015625, 0.6751632690429688, 0.711517333984375, 0.7478713989257812, 0.7842254638671875, 0.8205795288085938, 0.85693359375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 3.0, 11.0, 15.0, 23.0, 32.0, 38.0, 55.0, 67.0, 127.0, 155.0, 266.0, 411.0, 698.0, 1438.0, 2918.0, 7538.0, 22365.0, 84461.0, 357025.0, 420103.0, 107292.0, 27151.0, 8922.0, 3575.0, 1572.0, 872.0, 505.0, 290.0, 167.0, 124.0, 72.0, 65.0, 48.0, 26.0, 28.0, 21.0, 19.0, 13.0, 11.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.314697265625, -0.3026313781738281, -0.29056549072265625, -0.2784996032714844, -0.2664337158203125, -0.2543678283691406, -0.24230194091796875, -0.23023605346679688, -0.218170166015625, -0.20610427856445312, -0.19403839111328125, -0.18197250366210938, -0.1699066162109375, -0.15784072875976562, -0.14577484130859375, -0.13370895385742188, -0.12164306640625, -0.10957717895507812, -0.09751129150390625, -0.08544540405273438, -0.0733795166015625, -0.061313629150390625, -0.04924774169921875, -0.037181854248046875, -0.025115966796875, -0.013050079345703125, -0.00098419189453125, 0.011081695556640625, 0.0231475830078125, 0.035213470458984375, 0.04727935791015625, 0.059345245361328125, 0.0714111328125, 0.08347702026367188, 0.09554290771484375, 0.10760879516601562, 0.1196746826171875, 0.13174057006835938, 0.14380645751953125, 0.15587234497070312, 0.167938232421875, 0.18000411987304688, 0.19207000732421875, 0.20413589477539062, 0.2162017822265625, 0.22826766967773438, 0.24033355712890625, 0.2523994445800781, 0.26446533203125, 0.2765312194824219, 0.28859710693359375, 0.3006629943847656, 0.3127288818359375, 0.3247947692871094, 0.33686065673828125, 0.3489265441894531, 0.360992431640625, 0.3730583190917969, 0.38512420654296875, 0.3971900939941406, 0.4092559814453125, 0.4213218688964844, 0.43338775634765625, 0.4454536437988281, 0.45751953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 10.0, 8.0, 7.0, 9.0, 12.0, 16.0, 11.0, 23.0, 24.0, 27.0, 26.0, 30.0, 40.0, 40.0, 42.0, 40.0, 38.0, 44.0, 52.0, 53.0, 41.0, 39.0, 42.0, 38.0, 30.0, 41.0, 29.0, 30.0, 30.0, 28.0, 7.0, 16.0, 12.0, 10.0, 6.0, 12.0, 8.0, 12.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1796875, -1.1446990966796875, -1.109710693359375, -1.0747222900390625, -1.03973388671875, -1.0047454833984375, -0.969757080078125, -0.9347686767578125, -0.8997802734375, -0.8647918701171875, -0.829803466796875, -0.7948150634765625, -0.75982666015625, -0.7248382568359375, -0.689849853515625, -0.6548614501953125, -0.619873046875, -0.5848846435546875, -0.549896240234375, -0.5149078369140625, -0.47991943359375, -0.4449310302734375, -0.409942626953125, -0.3749542236328125, -0.3399658203125, -0.3049774169921875, -0.269989013671875, -0.2350006103515625, -0.20001220703125, -0.1650238037109375, -0.130035400390625, -0.0950469970703125, -0.06005859375, -0.0250701904296875, 0.009918212890625, 0.0449066162109375, 0.07989501953125, 0.1148834228515625, 0.149871826171875, 0.1848602294921875, 0.2198486328125, 0.2548370361328125, 0.289825439453125, 0.3248138427734375, 0.35980224609375, 0.3947906494140625, 0.429779052734375, 0.4647674560546875, 0.499755859375, 0.5347442626953125, 0.569732666015625, 0.6047210693359375, 0.63970947265625, 0.6746978759765625, 0.709686279296875, 0.7446746826171875, 0.7796630859375, 0.8146514892578125, 0.849639892578125, 0.8846282958984375, 0.91961669921875, 0.9546051025390625, 0.989593505859375, 1.0245819091796875, 1.0595703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 7.0, 7.0, 9.0, 21.0, 37.0, 43.0, 50.0, 92.0, 155.0, 242.0, 438.0, 923.0, 1783.0, 4164.0, 11552.0, 41263.0, 239023.0, 577626.0, 130502.0, 26204.0, 8151.0, 3121.0, 1448.0, 700.0, 409.0, 229.0, 141.0, 80.0, 40.0, 32.0, 23.0, 9.0, 10.0, 11.0, 8.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1580810546875, -0.1518421173095703, -0.14560317993164062, -0.13936424255371094, -0.13312530517578125, -0.12688636779785156, -0.12064743041992188, -0.11440849304199219, -0.1081695556640625, -0.10193061828613281, -0.09569168090820312, -0.08945274353027344, -0.08321380615234375, -0.07697486877441406, -0.07073593139648438, -0.06449699401855469, -0.058258056640625, -0.05201911926269531, -0.045780181884765625, -0.03954124450683594, -0.03330230712890625, -0.027063369750976562, -0.020824432373046875, -0.014585494995117188, -0.0083465576171875, -0.0021076202392578125, 0.004131317138671875, 0.010370254516601562, 0.01660919189453125, 0.022848129272460938, 0.029087066650390625, 0.03532600402832031, 0.04156494140625, 0.04780387878417969, 0.054042816162109375, 0.06028175354003906, 0.06652069091796875, 0.07275962829589844, 0.07899856567382812, 0.08523750305175781, 0.0914764404296875, 0.09771537780761719, 0.10395431518554688, 0.11019325256347656, 0.11643218994140625, 0.12267112731933594, 0.12891006469726562, 0.1351490020751953, 0.141387939453125, 0.1476268768310547, 0.15386581420898438, 0.16010475158691406, 0.16634368896484375, 0.17258262634277344, 0.17882156372070312, 0.1850605010986328, 0.1912994384765625, 0.1975383758544922, 0.20377731323242188, 0.21001625061035156, 0.21625518798828125, 0.22249412536621094, 0.22873306274414062, 0.2349720001220703, 0.2412109375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 8.0, 8.0, 18.0, 29.0, 38.0, 33.0, 63.0, 71.0, 115.0, 129.0, 135.0, 103.0, 59.0, 59.0, 41.0, 31.0, 18.0, 16.0, 9.0, 5.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001354217529296875, -0.00013102218508720398, -0.00012662261724472046, -0.00012222304940223694, -0.00011782348155975342, -0.0001134239137172699, -0.00010902434587478638, -0.00010462477803230286, -0.00010022521018981934, -9.582564234733582e-05, -9.14260745048523e-05, -8.702650666236877e-05, -8.262693881988525e-05, -7.822737097740173e-05, -7.382780313491821e-05, -6.942823529243469e-05, -6.502866744995117e-05, -6.062909960746765e-05, -5.622953176498413e-05, -5.182996392250061e-05, -4.743039608001709e-05, -4.303082823753357e-05, -3.863126039505005e-05, -3.423169255256653e-05, -2.9832124710083008e-05, -2.5432556867599487e-05, -2.1032989025115967e-05, -1.6633421182632446e-05, -1.2233853340148926e-05, -7.834285497665405e-06, -3.4347176551818848e-06, 9.648501873016357e-07, 5.364418029785156e-06, 9.763985872268677e-06, 1.4163553714752197e-05, 1.8563121557235718e-05, 2.2962689399719238e-05, 2.736225724220276e-05, 3.176182508468628e-05, 3.61613929271698e-05, 4.056096076965332e-05, 4.496052861213684e-05, 4.936009645462036e-05, 5.375966429710388e-05, 5.81592321395874e-05, 6.255879998207092e-05, 6.695836782455444e-05, 7.135793566703796e-05, 7.575750350952148e-05, 8.0157071352005e-05, 8.455663919448853e-05, 8.895620703697205e-05, 9.335577487945557e-05, 9.775534272193909e-05, 0.00010215491056442261, 0.00010655447840690613, 0.00011095404624938965, 0.00011535361409187317, 0.00011975318193435669, 0.0001241527497768402, 0.00012855231761932373, 0.00013295188546180725, 0.00013735145330429077, 0.0001417510211467743, 0.0001461505889892578]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 8.0, 10.0, 13.0, 20.0, 25.0, 31.0, 57.0, 67.0, 113.0, 199.0, 338.0, 530.0, 915.0, 1714.0, 3084.0, 6695.0, 16923.0, 54624.0, 217190.0, 473390.0, 194349.0, 49328.0, 15639.0, 6428.0, 3030.0, 1603.0, 861.0, 478.0, 292.0, 205.0, 122.0, 88.0, 51.0, 33.0, 25.0, 24.0, 9.0, 8.0, 6.0, 11.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1832275390625, -0.17806053161621094, -0.17289352416992188, -0.1677265167236328, -0.16255950927734375, -0.1573925018310547, -0.15222549438476562, -0.14705848693847656, -0.1418914794921875, -0.13672447204589844, -0.13155746459960938, -0.1263904571533203, -0.12122344970703125, -0.11605644226074219, -0.11088943481445312, -0.10572242736816406, -0.100555419921875, -0.09538841247558594, -0.09022140502929688, -0.08505439758300781, -0.07988739013671875, -0.07472038269042969, -0.06955337524414062, -0.06438636779785156, -0.0592193603515625, -0.05405235290527344, -0.048885345458984375, -0.04371833801269531, -0.03855133056640625, -0.03338432312011719, -0.028217315673828125, -0.023050308227539062, -0.01788330078125, -0.012716293334960938, -0.007549285888671875, -0.0023822784423828125, 0.00278472900390625, 0.007951736450195312, 0.013118743896484375, 0.018285751342773438, 0.0234527587890625, 0.028619766235351562, 0.033786773681640625, 0.03895378112792969, 0.04412078857421875, 0.04928779602050781, 0.054454803466796875, 0.05962181091308594, 0.064788818359375, 0.06995582580566406, 0.07512283325195312, 0.08028984069824219, 0.08545684814453125, 0.09062385559082031, 0.09579086303710938, 0.10095787048339844, 0.1061248779296875, 0.11129188537597656, 0.11645889282226562, 0.12162590026855469, 0.12679290771484375, 0.1319599151611328, 0.13712692260742188, 0.14229393005371094, 0.1474609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 5.0, 9.0, 15.0, 14.0, 12.0, 18.0, 14.0, 30.0, 26.0, 44.0, 62.0, 61.0, 70.0, 80.0, 79.0, 61.0, 68.0, 62.0, 61.0, 41.0, 45.0, 20.0, 26.0, 17.0, 14.0, 7.0, 7.0, 4.0, 4.0, 4.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.041748046875, -0.040598392486572266, -0.03944873809814453, -0.0382990837097168, -0.03714942932128906, -0.03599977493286133, -0.034850120544433594, -0.03370046615600586, -0.032550811767578125, -0.03140115737915039, -0.030251502990722656, -0.029101848602294922, -0.027952194213867188, -0.026802539825439453, -0.02565288543701172, -0.024503231048583984, -0.02335357666015625, -0.022203922271728516, -0.02105426788330078, -0.019904613494873047, -0.018754959106445312, -0.017605304718017578, -0.016455650329589844, -0.01530599594116211, -0.014156341552734375, -0.01300668716430664, -0.011857032775878906, -0.010707378387451172, -0.009557723999023438, -0.008408069610595703, -0.007258415222167969, -0.006108760833740234, -0.0049591064453125, -0.0038094520568847656, -0.0026597976684570312, -0.0015101432800292969, -0.0003604888916015625, 0.0007891654968261719, 0.0019388198852539062, 0.0030884742736816406, 0.004238128662109375, 0.005387783050537109, 0.006537437438964844, 0.007687091827392578, 0.008836746215820312, 0.009986400604248047, 0.011136054992675781, 0.012285709381103516, 0.01343536376953125, 0.014585018157958984, 0.01573467254638672, 0.016884326934814453, 0.018033981323242188, 0.019183635711669922, 0.020333290100097656, 0.02148294448852539, 0.022632598876953125, 0.02378225326538086, 0.024931907653808594, 0.026081562042236328, 0.027231216430664062, 0.028380870819091797, 0.02953052520751953, 0.030680179595947266, 0.031829833984375]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 10.0, 9.0, 20.0, 31.0, 38.0, 64.0, 112.0, 154.0, 133.0, 150.0, 92.0, 60.0, 46.0, 21.0, 17.0, 8.0, 9.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2955663204193115, -1.2464118003845215, -1.1972572803497314, -1.1481027603149414, -1.0989482402801514, -1.0497936010360718, -1.0006390810012817, -0.9514845609664917, -0.9023300409317017, -0.8531755208969116, -0.8040210008621216, -0.7548664212226868, -0.7057119011878967, -0.6565573811531067, -0.6074028015136719, -0.5582482814788818, -0.5090937614440918, -0.45993924140930176, -0.41078469157218933, -0.3616301417350769, -0.31247562170028687, -0.2633211016654968, -0.2141665518283844, -0.16501200199127197, -0.11585748195648193, -0.0667029470205307, -0.017548412084579468, 0.031606122851371765, 0.080760657787323, 0.12991519272327423, 0.17906972765922546, 0.2282242774963379, 0.2773786783218384, 0.3265331983566284, 0.37568774819374084, 0.42484229803085327, 0.4739968180656433, 0.5231513381004333, 0.5723059177398682, 0.6214604377746582, 0.6706149578094482, 0.7197694778442383, 0.7689239978790283, 0.8180785775184631, 0.8672330975532532, 0.9163876175880432, 0.965542197227478, 1.014696717262268, 1.063851237297058, 1.1130057573318481, 1.1621602773666382, 1.2113147974014282, 1.2604694366455078, 1.3096239566802979, 1.358778476715088, 1.407932996749878, 1.457087516784668, 1.506242036819458, 1.555396556854248, 1.604551076889038, 1.6537055969238281, 1.7028602361679077, 1.7520147562026978, 1.8011692762374878, 1.8503237962722778]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 7.0, 3.0, 10.0, 12.0, 16.0, 17.0, 22.0, 27.0, 36.0, 34.0, 56.0, 32.0, 65.0, 61.0, 39.0, 65.0, 80.0, 57.0, 57.0, 58.0, 47.0, 42.0, 31.0, 34.0, 31.0, 26.0, 15.0, 9.0, 8.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.825019896030426, -0.7997254133224487, -0.7744308710098267, -0.7491363883018494, -0.7238419055938721, -0.69854736328125, -0.6732528805732727, -0.6479583978652954, -0.6226638555526733, -0.597369372844696, -0.572074830532074, -0.5467803478240967, -0.5214858055114746, -0.4961913228034973, -0.47089684009552, -0.44560232758522034, -0.42030781507492065, -0.39501330256462097, -0.3697187900543213, -0.344424307346344, -0.3191297948360443, -0.29383528232574463, -0.26854079961776733, -0.24324628710746765, -0.21795177459716797, -0.1926572620868683, -0.1673627644777298, -0.1420682668685913, -0.11677375435829163, -0.09147924184799194, -0.06618474423885345, -0.040890246629714966, -0.015595674514770508, 0.009698830544948578, 0.034993335604667664, 0.06028784066438675, 0.08558234572410583, 0.11087685823440552, 0.136171355843544, 0.1614658534526825, 0.18676036596298218, 0.21205487847328186, 0.23734937608242035, 0.26264387369155884, 0.2879383862018585, 0.3132328987121582, 0.3385273814201355, 0.3638218939304352, 0.38911640644073486, 0.41441091895103455, 0.43970543146133423, 0.4649999141693115, 0.4902944266796112, 0.5155889391899109, 0.5408834218978882, 0.5661779642105103, 0.5914724469184875, 0.6167669296264648, 0.6420614719390869, 0.6673559546470642, 0.6926504373550415, 0.7179449796676636, 0.7432394623756409, 0.7685339450836182, 0.7938284873962402]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 5.0, 5.0, 14.0, 15.0, 31.0, 36.0, 62.0, 100.0, 175.0, 286.0, 535.0, 957.0, 1704.0, 3444.0, 6683.0, 14787.0, 37165.0, 103085.0, 293554.0, 361934.0, 139140.0, 48866.0, 18941.0, 8501.0, 4002.0, 1984.0, 1041.0, 629.0, 359.0, 179.0, 117.0, 75.0, 55.0, 32.0, 13.0, 19.0, 11.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59130859375, -0.5677871704101562, -0.5442657470703125, -0.5207443237304688, -0.497222900390625, -0.47370147705078125, -0.4501800537109375, -0.42665863037109375, -0.40313720703125, -0.37961578369140625, -0.3560943603515625, -0.33257293701171875, -0.309051513671875, -0.28553009033203125, -0.2620086669921875, -0.23848724365234375, -0.2149658203125, -0.19144439697265625, -0.1679229736328125, -0.14440155029296875, -0.120880126953125, -0.09735870361328125, -0.0738372802734375, -0.05031585693359375, -0.02679443359375, -0.00327301025390625, 0.0202484130859375, 0.04376983642578125, 0.067291259765625, 0.09081268310546875, 0.1143341064453125, 0.13785552978515625, 0.161376953125, 0.18489837646484375, 0.2084197998046875, 0.23194122314453125, 0.255462646484375, 0.27898406982421875, 0.3025054931640625, 0.32602691650390625, 0.34954833984375, 0.37306976318359375, 0.3965911865234375, 0.42011260986328125, 0.443634033203125, 0.46715545654296875, 0.4906768798828125, 0.5141983032226562, 0.5377197265625, 0.5612411499023438, 0.5847625732421875, 0.6082839965820312, 0.631805419921875, 0.6553268432617188, 0.6788482666015625, 0.7023696899414062, 0.72589111328125, 0.7494125366210938, 0.7729339599609375, 0.7964553833007812, 0.819976806640625, 0.8434982299804688, 0.8670196533203125, 0.8905410766601562, 0.9140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 5.0, 6.0, 7.0, 7.0, 7.0, 9.0, 16.0, 21.0, 23.0, 23.0, 24.0, 47.0, 42.0, 41.0, 45.0, 38.0, 53.0, 47.0, 54.0, 60.0, 54.0, 43.0, 38.0, 42.0, 36.0, 30.0, 26.0, 39.0, 22.0, 18.0, 19.0, 18.0, 16.0, 5.0, 5.0, 8.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-1.8310546875, -1.786041259765625, -1.74102783203125, -1.696014404296875, -1.6510009765625, -1.605987548828125, -1.56097412109375, -1.515960693359375, -1.470947265625, -1.425933837890625, -1.38092041015625, -1.335906982421875, -1.2908935546875, -1.245880126953125, -1.20086669921875, -1.155853271484375, -1.11083984375, -1.065826416015625, -1.02081298828125, -0.975799560546875, -0.9307861328125, -0.885772705078125, -0.84075927734375, -0.795745849609375, -0.750732421875, -0.705718994140625, -0.66070556640625, -0.615692138671875, -0.5706787109375, -0.525665283203125, -0.48065185546875, -0.435638427734375, -0.390625, -0.345611572265625, -0.30059814453125, -0.255584716796875, -0.2105712890625, -0.165557861328125, -0.12054443359375, -0.075531005859375, -0.030517578125, 0.014495849609375, 0.05950927734375, 0.104522705078125, 0.1495361328125, 0.194549560546875, 0.23956298828125, 0.284576416015625, 0.32958984375, 0.374603271484375, 0.41961669921875, 0.464630126953125, 0.5096435546875, 0.554656982421875, 0.59967041015625, 0.644683837890625, 0.689697265625, 0.734710693359375, 0.77972412109375, 0.824737548828125, 0.8697509765625, 0.914764404296875, 0.95977783203125, 1.004791259765625, 1.0498046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 10.0, 7.0, 8.0, 12.0, 16.0, 19.0, 20.0, 14.0, 21.0, 21.0, 45.0, 29.0, 35.0, 34.0, 63.0, 138.0, 2153.0, 709663.0, 334312.0, 1438.0, 122.0, 39.0, 29.0, 34.0, 38.0, 24.0, 32.0, 27.0, 29.0, 17.0, 13.0, 13.0, 12.0, 7.0, 11.0, 8.0, 5.0, 8.0, 3.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2890625, -4.14581298828125, -4.0025634765625, -3.85931396484375, -3.716064453125, -3.57281494140625, -3.4295654296875, -3.28631591796875, -3.14306640625, -2.99981689453125, -2.8565673828125, -2.71331787109375, -2.570068359375, -2.42681884765625, -2.2835693359375, -2.14031982421875, -1.9970703125, -1.85382080078125, -1.7105712890625, -1.56732177734375, -1.424072265625, -1.28082275390625, -1.1375732421875, -0.99432373046875, -0.85107421875, -0.70782470703125, -0.5645751953125, -0.42132568359375, -0.278076171875, -0.13482666015625, 0.0084228515625, 0.15167236328125, 0.294921875, 0.43817138671875, 0.5814208984375, 0.72467041015625, 0.867919921875, 1.01116943359375, 1.1544189453125, 1.29766845703125, 1.44091796875, 1.58416748046875, 1.7274169921875, 1.87066650390625, 2.013916015625, 2.15716552734375, 2.3004150390625, 2.44366455078125, 2.5869140625, 2.73016357421875, 2.8734130859375, 3.01666259765625, 3.159912109375, 3.30316162109375, 3.4464111328125, 3.58966064453125, 3.73291015625, 3.87615966796875, 4.0194091796875, 4.16265869140625, 4.305908203125, 4.44915771484375, 4.5924072265625, 4.73565673828125, 4.87890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 6.0, 4.0, 4.0, 3.0, 3.0, 7.0, 10.0, 11.0, 12.0, 14.0, 13.0, 20.0, 24.0, 32.0, 19.0, 32.0, 36.0, 34.0, 39.0, 46.0, 53.0, 37.0, 53.0, 48.0, 39.0, 47.0, 46.0, 34.0, 34.0, 37.0, 30.0, 26.0, 25.0, 24.0, 19.0, 12.0, 13.0, 7.0, 10.0, 8.0, 9.0, 4.0, 9.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.369140625, -1.324798583984375, -1.28045654296875, -1.236114501953125, -1.1917724609375, -1.147430419921875, -1.10308837890625, -1.058746337890625, -1.014404296875, -0.970062255859375, -0.92572021484375, -0.881378173828125, -0.8370361328125, -0.792694091796875, -0.74835205078125, -0.704010009765625, -0.65966796875, -0.615325927734375, -0.57098388671875, -0.526641845703125, -0.4822998046875, -0.437957763671875, -0.39361572265625, -0.349273681640625, -0.304931640625, -0.260589599609375, -0.21624755859375, -0.171905517578125, -0.1275634765625, -0.083221435546875, -0.03887939453125, 0.005462646484375, 0.0498046875, 0.094146728515625, 0.13848876953125, 0.182830810546875, 0.2271728515625, 0.271514892578125, 0.31585693359375, 0.360198974609375, 0.404541015625, 0.448883056640625, 0.49322509765625, 0.537567138671875, 0.5819091796875, 0.626251220703125, 0.67059326171875, 0.714935302734375, 0.75927734375, 0.803619384765625, 0.84796142578125, 0.892303466796875, 0.9366455078125, 0.980987548828125, 1.02532958984375, 1.069671630859375, 1.114013671875, 1.158355712890625, 1.20269775390625, 1.247039794921875, 1.2913818359375, 1.335723876953125, 1.38006591796875, 1.424407958984375, 1.46875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 8.0, 9.0, 12.0, 15.0, 38.0, 63.0, 104.0, 234.0, 562.0, 1723.0, 8121.0, 65813.0, 674753.0, 269166.0, 22540.0, 3700.0, 954.0, 359.0, 155.0, 81.0, 48.0, 38.0, 23.0, 10.0, 6.0, 1.0, 4.0, 6.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53466796875, -0.5188331604003906, -0.5029983520507812, -0.4871635437011719, -0.4713287353515625, -0.4554939270019531, -0.43965911865234375, -0.4238243103027344, -0.407989501953125, -0.3921546936035156, -0.37631988525390625, -0.3604850769042969, -0.3446502685546875, -0.3288154602050781, -0.31298065185546875, -0.2971458435058594, -0.28131103515625, -0.2654762268066406, -0.24964141845703125, -0.23380661010742188, -0.2179718017578125, -0.20213699340820312, -0.18630218505859375, -0.17046737670898438, -0.154632568359375, -0.13879776000976562, -0.12296295166015625, -0.10712814331054688, -0.0912933349609375, -0.07545852661132812, -0.05962371826171875, -0.043788909912109375, -0.0279541015625, -0.012119293212890625, 0.00371551513671875, 0.019550323486328125, 0.0353851318359375, 0.051219940185546875, 0.06705474853515625, 0.08288955688476562, 0.098724365234375, 0.11455917358398438, 0.13039398193359375, 0.14622879028320312, 0.1620635986328125, 0.17789840698242188, 0.19373321533203125, 0.20956802368164062, 0.22540283203125, 0.24123764038085938, 0.25707244873046875, 0.2729072570800781, 0.2887420654296875, 0.3045768737792969, 0.32041168212890625, 0.3362464904785156, 0.352081298828125, 0.3679161071777344, 0.38375091552734375, 0.3995857238769531, 0.4154205322265625, 0.4312553405761719, 0.44709014892578125, 0.4629249572753906, 0.478759765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 5.0, 7.0, 16.0, 12.0, 14.0, 18.0, 25.0, 38.0, 48.0, 52.0, 53.0, 74.0, 85.0, 77.0, 69.0, 72.0, 52.0, 44.0, 42.0, 36.0, 34.0, 19.0, 18.0, 19.0, 15.0, 5.0, 12.0, 4.0, 4.0, 7.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.6253204345703125e-05, -4.49158251285553e-05, -4.357844591140747e-05, -4.2241066694259644e-05, -4.0903687477111816e-05, -3.956630825996399e-05, -3.822892904281616e-05, -3.6891549825668335e-05, -3.555417060852051e-05, -3.421679139137268e-05, -3.2879412174224854e-05, -3.1542032957077026e-05, -3.02046537399292e-05, -2.8867274522781372e-05, -2.7529895305633545e-05, -2.6192516088485718e-05, -2.485513687133789e-05, -2.3517757654190063e-05, -2.2180378437042236e-05, -2.084299921989441e-05, -1.9505620002746582e-05, -1.8168240785598755e-05, -1.6830861568450928e-05, -1.54934823513031e-05, -1.4156103134155273e-05, -1.2818723917007446e-05, -1.1481344699859619e-05, -1.0143965482711792e-05, -8.806586265563965e-06, -7.469207048416138e-06, -6.1318278312683105e-06, -4.794448614120483e-06, -3.4570693969726562e-06, -2.119690179824829e-06, -7.82310962677002e-07, 5.550682544708252e-07, 1.8924474716186523e-06, 3.2298266887664795e-06, 4.567205905914307e-06, 5.904585123062134e-06, 7.241964340209961e-06, 8.579343557357788e-06, 9.916722774505615e-06, 1.1254101991653442e-05, 1.259148120880127e-05, 1.3928860425949097e-05, 1.5266239643096924e-05, 1.660361886024475e-05, 1.7940998077392578e-05, 1.9278377294540405e-05, 2.0615756511688232e-05, 2.195313572883606e-05, 2.3290514945983887e-05, 2.4627894163131714e-05, 2.596527338027954e-05, 2.7302652597427368e-05, 2.8640031814575195e-05, 2.9977411031723022e-05, 3.131479024887085e-05, 3.265216946601868e-05, 3.3989548683166504e-05, 3.532692790031433e-05, 3.666430711746216e-05, 3.8001686334609985e-05, 3.933906555175781e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 6.0, 5.0, 1.0, 11.0, 6.0, 13.0, 16.0, 28.0, 30.0, 56.0, 88.0, 124.0, 222.0, 336.0, 572.0, 1003.0, 1951.0, 3707.0, 7956.0, 19174.0, 52204.0, 156340.0, 384718.0, 271646.0, 92449.0, 31992.0, 12641.0, 5371.0, 2676.0, 1332.0, 763.0, 386.0, 290.0, 152.0, 96.0, 63.0, 40.0, 31.0, 14.0, 19.0, 14.0, 5.0, 5.0, 2.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.208984375, -0.20279502868652344, -0.19660568237304688, -0.1904163360595703, -0.18422698974609375, -0.1780376434326172, -0.17184829711914062, -0.16565895080566406, -0.1594696044921875, -0.15328025817871094, -0.14709091186523438, -0.1409015655517578, -0.13471221923828125, -0.1285228729248047, -0.12233352661132812, -0.11614418029785156, -0.109954833984375, -0.10376548767089844, -0.09757614135742188, -0.09138679504394531, -0.08519744873046875, -0.07900810241699219, -0.07281875610351562, -0.06662940979003906, -0.0604400634765625, -0.05425071716308594, -0.048061370849609375, -0.04187202453613281, -0.03568267822265625, -0.029493331909179688, -0.023303985595703125, -0.017114639282226562, -0.01092529296875, -0.0047359466552734375, 0.001453399658203125, 0.0076427459716796875, 0.01383209228515625, 0.020021438598632812, 0.026210784912109375, 0.03240013122558594, 0.0385894775390625, 0.04477882385253906, 0.050968170166015625, 0.05715751647949219, 0.06334686279296875, 0.06953620910644531, 0.07572555541992188, 0.08191490173339844, 0.088104248046875, 0.09429359436035156, 0.10048294067382812, 0.10667228698730469, 0.11286163330078125, 0.11905097961425781, 0.12524032592773438, 0.13142967224121094, 0.1376190185546875, 0.14380836486816406, 0.14999771118164062, 0.1561870574951172, 0.16237640380859375, 0.1685657501220703, 0.17475509643554688, 0.18094444274902344, 0.1871337890625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 3.0, 4.0, 6.0, 3.0, 8.0, 9.0, 13.0, 9.0, 10.0, 24.0, 17.0, 26.0, 27.0, 46.0, 41.0, 46.0, 40.0, 51.0, 68.0, 59.0, 53.0, 50.0, 58.0, 36.0, 47.0, 39.0, 38.0, 31.0, 20.0, 22.0, 21.0, 12.0, 13.0, 5.0, 7.0, 6.0, 8.0, 1.0, 3.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1046142578125, -0.10171222686767578, -0.09881019592285156, -0.09590816497802734, -0.09300613403320312, -0.0901041030883789, -0.08720207214355469, -0.08430004119873047, -0.08139801025390625, -0.07849597930908203, -0.07559394836425781, -0.0726919174194336, -0.06978988647460938, -0.06688785552978516, -0.06398582458496094, -0.06108379364013672, -0.0581817626953125, -0.05527973175048828, -0.05237770080566406, -0.049475669860839844, -0.046573638916015625, -0.043671607971191406, -0.04076957702636719, -0.03786754608154297, -0.03496551513671875, -0.03206348419189453, -0.029161453247070312, -0.026259422302246094, -0.023357391357421875, -0.020455360412597656, -0.017553329467773438, -0.014651298522949219, -0.011749267578125, -0.008847236633300781, -0.0059452056884765625, -0.0030431747436523438, -0.000141143798828125, 0.0027608871459960938, 0.0056629180908203125, 0.008564949035644531, 0.01146697998046875, 0.014369010925292969, 0.017271041870117188, 0.020173072814941406, 0.023075103759765625, 0.025977134704589844, 0.028879165649414062, 0.03178119659423828, 0.0346832275390625, 0.03758525848388672, 0.04048728942871094, 0.043389320373535156, 0.046291351318359375, 0.049193382263183594, 0.05209541320800781, 0.05499744415283203, 0.05789947509765625, 0.06080150604248047, 0.06370353698730469, 0.0666055679321289, 0.06950759887695312, 0.07240962982177734, 0.07531166076660156, 0.07821369171142578, 0.08111572265625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 26.0, 92.0, 366.0, 381.0, 110.0, 23.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.631385803222656, -16.305431365966797, -15.97947883605957, -15.653524398803711, -15.327570915222168, -15.001617431640625, -14.675663948059082, -14.349710464477539, -14.02375602722168, -13.697802543640137, -13.371849060058594, -13.045894622802734, -12.719941139221191, -12.393987655639648, -12.068034172058105, -11.742080688476562, -11.41612720489502, -11.090173721313477, -10.764220237731934, -10.438265800476074, -10.112312316894531, -9.786358833312988, -9.460405349731445, -9.134451866149902, -8.80849838256836, -8.482544898986816, -8.156591415405273, -7.830637454986572, -7.504683494567871, -7.178730010986328, -6.852776527404785, -6.526823043823242, -6.200868129730225, -5.874914646148682, -5.5489606857299805, -5.2230072021484375, -4.8970537185668945, -4.571099758148193, -4.24514627456665, -3.9191925525665283, -3.5932388305664062, -3.267285108566284, -2.941331386566162, -2.615377902984619, -2.289424180984497, -1.963470458984375, -1.6375168561935425, -1.31156325340271, -0.9856095314025879, -0.6596558690071106, -0.3337022066116333, -0.007748544216156006, 0.3182051181793213, 0.6441588401794434, 0.9701124429702759, 1.2960660457611084, 1.6220197677612305, 1.9479734897613525, 2.2739272117614746, 2.5998806953430176, 2.9258344173431396, 3.2517881393432617, 3.5777416229248047, 3.9036953449249268, 4.229649066925049]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 6.0, 2.0, 1.0, 3.0, 1.0, 5.0, 8.0, 3.0, 11.0, 10.0, 8.0, 21.0, 26.0, 14.0, 29.0, 27.0, 24.0, 40.0, 25.0, 33.0, 37.0, 41.0, 43.0, 46.0, 38.0, 55.0, 46.0, 38.0, 51.0, 32.0, 39.0, 37.0, 31.0, 28.0, 23.0, 15.0, 19.0, 11.0, 13.0, 16.0, 15.0, 9.0, 5.0, 8.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5616743564605713, -1.4964227676391602, -1.431171178817749, -1.365919589996338, -1.3006680011749268, -1.2354164123535156, -1.1701648235321045, -1.1049132347106934, -1.0396616458892822, -0.9744100570678711, -0.90915846824646, -0.8439068794250488, -0.7786552906036377, -0.7134037017822266, -0.6481521129608154, -0.5829005241394043, -0.5176489353179932, -0.45239734649658203, -0.3871457576751709, -0.32189416885375977, -0.25664258003234863, -0.1913909912109375, -0.12613940238952637, -0.060887813568115234, 0.0043637752532958984, 0.06961536407470703, 0.13486695289611816, 0.2001185417175293, 0.26537013053894043, 0.33062171936035156, 0.3958733081817627, 0.46112489700317383, 0.526376485824585, 0.5916280746459961, 0.6568796634674072, 0.7221312522888184, 0.7873828411102295, 0.8526344299316406, 0.9178860187530518, 0.9831376075744629, 1.048389196395874, 1.1136407852172852, 1.1788923740386963, 1.2441439628601074, 1.3093955516815186, 1.3746471405029297, 1.4398987293243408, 1.505150318145752, 1.570401906967163, 1.6356534957885742, 1.7009050846099854, 1.7661566734313965, 1.8314082622528076, 1.8966598510742188, 1.9619114398956299, 2.027163028717041, 2.092414617538452, 2.1576662063598633, 2.2229177951812744, 2.2881693840026855, 2.3534209728240967, 2.418672561645508, 2.483924150466919, 2.54917573928833, 2.614427328109741]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [5.0, 5.0, 4.0, 1.0, 5.0, 1.0, 3.0, 10.0, 10.0, 14.0, 13.0, 24.0, 38.0, 48.0, 66.0, 102.0, 204.0, 361.0, 723.0, 1671.0, 4763.0, 18960.0, 149952.0, 2862371.0, 1076450.0, 62029.0, 10795.0, 3151.0, 1272.0, 518.0, 279.0, 141.0, 88.0, 76.0, 36.0, 24.0, 16.0, 12.0, 12.0, 8.0, 9.0, 12.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.43701171875, -1.3740234375, -1.31103515625, -1.248046875, -1.18505859375, -1.1220703125, -1.05908203125, -0.99609375, -0.93310546875, -0.8701171875, -0.80712890625, -0.744140625, -0.68115234375, -0.6181640625, -0.55517578125, -0.4921875, -0.42919921875, -0.3662109375, -0.30322265625, -0.240234375, -0.17724609375, -0.1142578125, -0.05126953125, 0.01171875, 0.07470703125, 0.1376953125, 0.20068359375, 0.263671875, 0.32666015625, 0.3896484375, 0.45263671875, 0.515625, 0.57861328125, 0.6416015625, 0.70458984375, 0.767578125, 0.83056640625, 0.8935546875, 0.95654296875, 1.01953125, 1.08251953125, 1.1455078125, 1.20849609375, 1.271484375, 1.33447265625, 1.3974609375, 1.46044921875, 1.5234375, 1.58642578125, 1.6494140625, 1.71240234375, 1.775390625, 1.83837890625, 1.9013671875, 1.96435546875, 2.02734375, 2.09033203125, 2.1533203125, 2.21630859375, 2.279296875, 2.34228515625, 2.4052734375, 2.46826171875, 2.53125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 8.0, 6.0, 4.0, 8.0, 14.0, 9.0, 15.0, 17.0, 26.0, 41.0, 34.0, 28.0, 53.0, 46.0, 40.0, 51.0, 50.0, 55.0, 47.0, 52.0, 48.0, 45.0, 38.0, 39.0, 44.0, 34.0, 27.0, 30.0, 11.0, 14.0, 18.0, 7.0, 3.0, 8.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.87109375, -0.8453445434570312, -0.8195953369140625, -0.7938461303710938, -0.768096923828125, -0.7423477172851562, -0.7165985107421875, -0.6908493041992188, -0.66510009765625, -0.6393508911132812, -0.6136016845703125, -0.5878524780273438, -0.562103271484375, -0.5363540649414062, -0.5106048583984375, -0.48485565185546875, -0.4591064453125, -0.43335723876953125, -0.4076080322265625, -0.38185882568359375, -0.356109619140625, -0.33036041259765625, -0.3046112060546875, -0.27886199951171875, -0.25311279296875, -0.22736358642578125, -0.2016143798828125, -0.17586517333984375, -0.150115966796875, -0.12436676025390625, -0.0986175537109375, -0.07286834716796875, -0.047119140625, -0.02136993408203125, 0.0043792724609375, 0.03012847900390625, 0.055877685546875, 0.08162689208984375, 0.1073760986328125, 0.13312530517578125, 0.15887451171875, 0.18462371826171875, 0.2103729248046875, 0.23612213134765625, 0.261871337890625, 0.28762054443359375, 0.3133697509765625, 0.33911895751953125, 0.3648681640625, 0.39061737060546875, 0.4163665771484375, 0.44211578369140625, 0.467864990234375, 0.49361419677734375, 0.5193634033203125, 0.5451126098632812, 0.57086181640625, 0.5966110229492188, 0.6223602294921875, 0.6481094360351562, 0.673858642578125, 0.6996078491210938, 0.7253570556640625, 0.7511062622070312, 0.77685546875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 5.0, 8.0, 14.0, 21.0, 17.0, 47.0, 78.0, 173.0, 475.0, 1886.0, 20613.0, 3520841.0, 638398.0, 9695.0, 1316.0, 359.0, 153.0, 75.0, 40.0, 19.0, 22.0, 8.0, 9.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.650390625, -3.528167724609375, -3.40594482421875, -3.283721923828125, -3.1614990234375, -3.039276123046875, -2.91705322265625, -2.794830322265625, -2.672607421875, -2.550384521484375, -2.42816162109375, -2.305938720703125, -2.1837158203125, -2.061492919921875, -1.93927001953125, -1.817047119140625, -1.69482421875, -1.572601318359375, -1.45037841796875, -1.328155517578125, -1.2059326171875, -1.083709716796875, -0.96148681640625, -0.839263916015625, -0.717041015625, -0.594818115234375, -0.47259521484375, -0.350372314453125, -0.2281494140625, -0.105926513671875, 0.01629638671875, 0.138519287109375, 0.2607421875, 0.382965087890625, 0.50518798828125, 0.627410888671875, 0.7496337890625, 0.871856689453125, 0.99407958984375, 1.116302490234375, 1.238525390625, 1.360748291015625, 1.48297119140625, 1.605194091796875, 1.7274169921875, 1.849639892578125, 1.97186279296875, 2.094085693359375, 2.21630859375, 2.338531494140625, 2.46075439453125, 2.582977294921875, 2.7052001953125, 2.827423095703125, 2.94964599609375, 3.071868896484375, 3.194091796875, 3.316314697265625, 3.43853759765625, 3.560760498046875, 3.6829833984375, 3.805206298828125, 3.92742919921875, 4.049652099609375, 4.171875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 3.0, 5.0, 5.0, 16.0, 15.0, 24.0, 36.0, 42.0, 91.0, 123.0, 158.0, 231.0, 405.0, 624.0, 735.0, 550.0, 314.0, 217.0, 145.0, 112.0, 51.0, 54.0, 38.0, 24.0, 20.0, 11.0, 7.0, 4.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4638671875, -0.4499664306640625, -0.436065673828125, -0.4221649169921875, -0.40826416015625, -0.3943634033203125, -0.380462646484375, -0.3665618896484375, -0.3526611328125, -0.3387603759765625, -0.324859619140625, -0.3109588623046875, -0.29705810546875, -0.2831573486328125, -0.269256591796875, -0.2553558349609375, -0.241455078125, -0.2275543212890625, -0.213653564453125, -0.1997528076171875, -0.18585205078125, -0.1719512939453125, -0.158050537109375, -0.1441497802734375, -0.1302490234375, -0.1163482666015625, -0.102447509765625, -0.0885467529296875, -0.07464599609375, -0.0607452392578125, -0.046844482421875, -0.0329437255859375, -0.01904296875, -0.0051422119140625, 0.008758544921875, 0.0226593017578125, 0.03656005859375, 0.0504608154296875, 0.064361572265625, 0.0782623291015625, 0.0921630859375, 0.1060638427734375, 0.119964599609375, 0.1338653564453125, 0.14776611328125, 0.1616668701171875, 0.175567626953125, 0.1894683837890625, 0.203369140625, 0.2172698974609375, 0.231170654296875, 0.2450714111328125, 0.25897216796875, 0.2728729248046875, 0.286773681640625, 0.3006744384765625, 0.3145751953125, 0.3284759521484375, 0.342376708984375, 0.3562774658203125, 0.37017822265625, 0.3840789794921875, 0.397979736328125, 0.4118804931640625, 0.42578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 10.0, 5.0, 9.0, 22.0, 24.0, 36.0, 54.0, 83.0, 104.0, 123.0, 136.0, 114.0, 85.0, 63.0, 35.0, 25.0, 13.0, 14.0, 12.0, 7.0, 11.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7675237655639648, -1.7045420408248901, -1.6415603160858154, -1.5785787105560303, -1.5155969858169556, -1.4526152610778809, -1.3896336555480957, -1.326651930809021, -1.2636702060699463, -1.2006884813308716, -1.1377067565917969, -1.0747251510620117, -1.011743426322937, -0.9487617015838623, -0.8857800364494324, -0.8227983713150024, -0.7598166465759277, -0.696834921836853, -0.6338532567024231, -0.5708715915679932, -0.5078898668289185, -0.44490817189216614, -0.3819264769554138, -0.3189447820186615, -0.2559630870819092, -0.19298139214515686, -0.12999969720840454, -0.06701800227165222, -0.004036307334899902, 0.05894538760185242, 0.12192708253860474, 0.18490877747535706, 0.24789047241210938, 0.3108721673488617, 0.373853862285614, 0.43683555722236633, 0.49981725215911865, 0.5627989768981934, 0.6257806420326233, 0.6887623071670532, 0.7517440319061279, 0.8147257566452026, 0.8777074217796326, 0.9406890869140625, 1.0036708116531372, 1.066652536392212, 1.129634141921997, 1.1926158666610718, 1.2555975914001465, 1.3185793161392212, 1.381561040878296, 1.444542646408081, 1.5075243711471558, 1.5705060958862305, 1.6334877014160156, 1.6964694261550903, 1.759451150894165, 1.8224328756332397, 1.8854146003723145, 1.9483962059020996, 2.0113778114318848, 2.074359655380249, 2.137341260910034, 2.2003231048583984, 2.2633047103881836]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 8.0, 7.0, 16.0, 13.0, 15.0, 10.0, 23.0, 25.0, 26.0, 24.0, 39.0, 47.0, 30.0, 47.0, 54.0, 44.0, 38.0, 51.0, 49.0, 56.0, 54.0, 52.0, 35.0, 35.0, 35.0, 28.0, 17.0, 12.0, 22.0, 22.0, 17.0, 13.0, 7.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0062812566757202, -0.9750056862831116, -0.9437301754951477, -0.9124546051025391, -0.8811790347099304, -0.8499034643173218, -0.8186279535293579, -0.7873523831367493, -0.7560768127441406, -0.724801242351532, -0.6935257315635681, -0.6622501611709595, -0.6309745907783508, -0.5996990203857422, -0.5684235095977783, -0.5371479392051697, -0.5058724284172058, -0.47459688782691956, -0.4433213174343109, -0.41204577684402466, -0.380770206451416, -0.34949466586112976, -0.3182191252708435, -0.28694355487823486, -0.2556680142879486, -0.22439245879650116, -0.1931169033050537, -0.16184136271476746, -0.13056580722332, -0.09929025173187256, -0.0680147111415863, -0.036739155650138855, -0.005463600158691406, 0.025811951607465744, 0.057087503373622894, 0.08836305141448975, 0.1196386069059372, 0.15091416239738464, 0.1821897029876709, 0.21346525847911835, 0.2447408139705658, 0.27601635456085205, 0.3072919249534607, 0.33856746554374695, 0.3698430061340332, 0.40111857652664185, 0.4323941171169281, 0.46366965770721436, 0.494945228099823, 0.5262207984924316, 0.5574963092803955, 0.5887718796730042, 0.6200474500656128, 0.6513229608535767, 0.6825985312461853, 0.713874101638794, 0.7451496124267578, 0.7764251828193665, 0.8077006936073303, 0.838976263999939, 0.8702518343925476, 0.9015274047851562, 0.9328029155731201, 0.9640784859657288, 0.9953540563583374]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 9.0, 2.0, 9.0, 16.0, 32.0, 34.0, 63.0, 102.0, 212.0, 397.0, 854.0, 2163.0, 5384.0, 17277.0, 74990.0, 458882.0, 400161.0, 64468.0, 15137.0, 4882.0, 1828.0, 785.0, 372.0, 234.0, 107.0, 68.0, 25.0, 23.0, 19.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.360107421875, -0.3450736999511719, -0.33003997802734375, -0.3150062561035156, -0.2999725341796875, -0.2849388122558594, -0.26990509033203125, -0.2548713684082031, -0.239837646484375, -0.22480392456054688, -0.20977020263671875, -0.19473648071289062, -0.1797027587890625, -0.16466903686523438, -0.14963531494140625, -0.13460159301757812, -0.11956787109375, -0.10453414916992188, -0.08950042724609375, -0.07446670532226562, -0.0594329833984375, -0.044399261474609375, -0.02936553955078125, -0.014331817626953125, 0.000701904296875, 0.015735626220703125, 0.03076934814453125, 0.045803070068359375, 0.0608367919921875, 0.07587051391601562, 0.09090423583984375, 0.10593795776367188, 0.1209716796875, 0.13600540161132812, 0.15103912353515625, 0.16607284545898438, 0.1811065673828125, 0.19614028930664062, 0.21117401123046875, 0.22620773315429688, 0.241241455078125, 0.2562751770019531, 0.27130889892578125, 0.2863426208496094, 0.3013763427734375, 0.3164100646972656, 0.33144378662109375, 0.3464775085449219, 0.36151123046875, 0.3765449523925781, 0.39157867431640625, 0.4066123962402344, 0.4216461181640625, 0.4366798400878906, 0.45171356201171875, 0.4667472839355469, 0.481781005859375, 0.4968147277832031, 0.5118484497070312, 0.5268821716308594, 0.5419158935546875, 0.5569496154785156, 0.5719833374023438, 0.5870170593261719, 0.60205078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 12.0, 10.0, 16.0, 21.0, 23.0, 19.0, 22.0, 37.0, 36.0, 45.0, 35.0, 64.0, 69.0, 47.0, 56.0, 54.0, 57.0, 66.0, 52.0, 34.0, 48.0, 31.0, 34.0, 14.0, 20.0, 12.0, 12.0, 19.0, 4.0, 14.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67138671875, -0.6494674682617188, -0.6275482177734375, -0.6056289672851562, -0.583709716796875, -0.5617904663085938, -0.5398712158203125, -0.5179519653320312, -0.49603271484375, -0.47411346435546875, -0.4521942138671875, -0.43027496337890625, -0.408355712890625, -0.38643646240234375, -0.3645172119140625, -0.34259796142578125, -0.3206787109375, -0.29875946044921875, -0.2768402099609375, -0.25492095947265625, -0.233001708984375, -0.21108245849609375, -0.1891632080078125, -0.16724395751953125, -0.14532470703125, -0.12340545654296875, -0.1014862060546875, -0.07956695556640625, -0.057647705078125, -0.03572845458984375, -0.0138092041015625, 0.00811004638671875, 0.030029296875, 0.05194854736328125, 0.0738677978515625, 0.09578704833984375, 0.117706298828125, 0.13962554931640625, 0.1615447998046875, 0.18346405029296875, 0.20538330078125, 0.22730255126953125, 0.2492218017578125, 0.27114105224609375, 0.293060302734375, 0.31497955322265625, 0.3368988037109375, 0.35881805419921875, 0.3807373046875, 0.40265655517578125, 0.4245758056640625, 0.44649505615234375, 0.468414306640625, 0.49033355712890625, 0.5122528076171875, 0.5341720581054688, 0.55609130859375, 0.5780105590820312, 0.5999298095703125, 0.6218490600585938, 0.643768310546875, 0.6656875610351562, 0.6876068115234375, 0.7095260620117188, 0.7314453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 8.0, 9.0, 6.0, 14.0, 12.0, 19.0, 33.0, 27.0, 41.0, 75.0, 85.0, 134.0, 240.0, 370.0, 776.0, 1475.0, 3444.0, 9309.0, 30766.0, 136483.0, 525602.0, 262705.0, 52882.0, 14559.0, 5064.0, 2133.0, 942.0, 493.0, 313.0, 171.0, 90.0, 70.0, 52.0, 30.0, 25.0, 21.0, 18.0, 17.0, 7.0, 8.0, 5.0, 5.0, 4.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.332763671875, -0.32317352294921875, -0.3135833740234375, -0.30399322509765625, -0.294403076171875, -0.28481292724609375, -0.2752227783203125, -0.26563262939453125, -0.25604248046875, -0.24645233154296875, -0.2368621826171875, -0.22727203369140625, -0.217681884765625, -0.20809173583984375, -0.1985015869140625, -0.18891143798828125, -0.1793212890625, -0.16973114013671875, -0.1601409912109375, -0.15055084228515625, -0.140960693359375, -0.13137054443359375, -0.1217803955078125, -0.11219024658203125, -0.10260009765625, -0.09300994873046875, -0.0834197998046875, -0.07382965087890625, -0.064239501953125, -0.05464935302734375, -0.0450592041015625, -0.03546905517578125, -0.02587890625, -0.01628875732421875, -0.0066986083984375, 0.00289154052734375, 0.012481689453125, 0.02207183837890625, 0.0316619873046875, 0.04125213623046875, 0.05084228515625, 0.06043243408203125, 0.0700225830078125, 0.07961273193359375, 0.089202880859375, 0.09879302978515625, 0.1083831787109375, 0.11797332763671875, 0.1275634765625, 0.13715362548828125, 0.1467437744140625, 0.15633392333984375, 0.165924072265625, 0.17551422119140625, 0.1851043701171875, 0.19469451904296875, 0.20428466796875, 0.21387481689453125, 0.2234649658203125, 0.23305511474609375, 0.242645263671875, 0.25223541259765625, 0.2618255615234375, 0.27141571044921875, 0.281005859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 7.0, 9.0, 5.0, 9.0, 5.0, 13.0, 12.0, 14.0, 19.0, 24.0, 22.0, 23.0, 28.0, 40.0, 41.0, 47.0, 48.0, 40.0, 51.0, 42.0, 53.0, 41.0, 49.0, 47.0, 45.0, 47.0, 31.0, 22.0, 28.0, 30.0, 20.0, 21.0, 15.0, 9.0, 10.0, 7.0, 8.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0859375, -1.0514068603515625, -1.016876220703125, -0.9823455810546875, -0.94781494140625, -0.9132843017578125, -0.878753662109375, -0.8442230224609375, -0.8096923828125, -0.7751617431640625, -0.740631103515625, -0.7061004638671875, -0.67156982421875, -0.6370391845703125, -0.602508544921875, -0.5679779052734375, -0.533447265625, -0.4989166259765625, -0.464385986328125, -0.4298553466796875, -0.39532470703125, -0.3607940673828125, -0.326263427734375, -0.2917327880859375, -0.2572021484375, -0.2226715087890625, -0.188140869140625, -0.1536102294921875, -0.11907958984375, -0.0845489501953125, -0.050018310546875, -0.0154876708984375, 0.01904296875, 0.0535736083984375, 0.088104248046875, 0.1226348876953125, 0.15716552734375, 0.1916961669921875, 0.226226806640625, 0.2607574462890625, 0.2952880859375, 0.3298187255859375, 0.364349365234375, 0.3988800048828125, 0.43341064453125, 0.4679412841796875, 0.502471923828125, 0.5370025634765625, 0.571533203125, 0.6060638427734375, 0.640594482421875, 0.6751251220703125, 0.70965576171875, 0.7441864013671875, 0.778717041015625, 0.8132476806640625, 0.8477783203125, 0.8823089599609375, 0.916839599609375, 0.9513702392578125, 0.98590087890625, 1.0204315185546875, 1.054962158203125, 1.0894927978515625, 1.1240234375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 19.0, 19.0, 19.0, 42.0, 60.0, 122.0, 179.0, 324.0, 674.0, 1400.0, 3212.0, 8001.0, 25025.0, 106891.0, 527531.0, 295913.0, 54459.0, 14919.0, 5424.0, 2157.0, 1045.0, 472.0, 257.0, 141.0, 75.0, 47.0, 34.0, 19.0, 16.0, 10.0, 13.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.136474609375, -0.1325511932373047, -0.12862777709960938, -0.12470436096191406, -0.12078094482421875, -0.11685752868652344, -0.11293411254882812, -0.10901069641113281, -0.1050872802734375, -0.10116386413574219, -0.09724044799804688, -0.09331703186035156, -0.08939361572265625, -0.08547019958496094, -0.08154678344726562, -0.07762336730957031, -0.073699951171875, -0.06977653503417969, -0.06585311889648438, -0.06192970275878906, -0.05800628662109375, -0.05408287048339844, -0.050159454345703125, -0.04623603820800781, -0.0423126220703125, -0.03838920593261719, -0.034465789794921875, -0.030542373657226562, -0.02661895751953125, -0.022695541381835938, -0.018772125244140625, -0.014848709106445312, -0.01092529296875, -0.0070018768310546875, -0.003078460693359375, 0.0008449554443359375, 0.00476837158203125, 0.008691787719726562, 0.012615203857421875, 0.016538619995117188, 0.0204620361328125, 0.024385452270507812, 0.028308868408203125, 0.03223228454589844, 0.03615570068359375, 0.04007911682128906, 0.044002532958984375, 0.04792594909667969, 0.051849365234375, 0.05577278137207031, 0.059696197509765625, 0.06361961364746094, 0.06754302978515625, 0.07146644592285156, 0.07538986206054688, 0.07931327819824219, 0.0832366943359375, 0.08716011047363281, 0.09108352661132812, 0.09500694274902344, 0.09893035888671875, 0.10285377502441406, 0.10677719116210938, 0.11070060729980469, 0.1146240234375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 9.0, 9.0, 13.0, 17.0, 20.0, 23.0, 29.0, 33.0, 45.0, 72.0, 76.0, 82.0, 76.0, 101.0, 82.0, 73.0, 52.0, 43.0, 32.0, 18.0, 16.0, 11.0, 13.0, 7.0, 10.0, 9.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.186962127685547e-05, -5.9845857322216034e-05, -5.78220933675766e-05, -5.5798329412937164e-05, -5.377456545829773e-05, -5.1750801503658295e-05, -4.972703754901886e-05, -4.7703273594379425e-05, -4.567950963973999e-05, -4.3655745685100555e-05, -4.163198173046112e-05, -3.9608217775821686e-05, -3.758445382118225e-05, -3.5560689866542816e-05, -3.353692591190338e-05, -3.1513161957263947e-05, -2.9489398002624512e-05, -2.7465634047985077e-05, -2.5441870093345642e-05, -2.3418106138706207e-05, -2.1394342184066772e-05, -1.9370578229427338e-05, -1.7346814274787903e-05, -1.5323050320148468e-05, -1.3299286365509033e-05, -1.1275522410869598e-05, -9.251758456230164e-06, -7.227994501590729e-06, -5.204230546951294e-06, -3.180466592311859e-06, -1.1567026376724243e-06, 8.670613169670105e-07, 2.8908252716064453e-06, 4.91458922624588e-06, 6.938353180885315e-06, 8.96211713552475e-06, 1.0985881090164185e-05, 1.300964504480362e-05, 1.5033408999443054e-05, 1.705717295408249e-05, 1.9080936908721924e-05, 2.110470086336136e-05, 2.3128464818000793e-05, 2.5152228772640228e-05, 2.7175992727279663e-05, 2.9199756681919098e-05, 3.122352063655853e-05, 3.324728459119797e-05, 3.52710485458374e-05, 3.729481250047684e-05, 3.931857645511627e-05, 4.134234040975571e-05, 4.336610436439514e-05, 4.5389868319034576e-05, 4.741363227367401e-05, 4.9437396228313446e-05, 5.146116018295288e-05, 5.3484924137592316e-05, 5.550868809223175e-05, 5.7532452046871185e-05, 5.955621600151062e-05, 6.157997995615005e-05, 6.360374391078949e-05, 6.562750786542892e-05, 6.765127182006836e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 7.0, 3.0, 10.0, 12.0, 19.0, 27.0, 63.0, 88.0, 162.0, 242.0, 511.0, 927.0, 2050.0, 5140.0, 15086.0, 68406.0, 533510.0, 357795.0, 45417.0, 11498.0, 4150.0, 1711.0, 810.0, 371.0, 205.0, 115.0, 88.0, 36.0, 34.0, 22.0, 11.0, 11.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.1591625213623047, -0.15365219116210938, -0.14814186096191406, -0.14263153076171875, -0.13712120056152344, -0.13161087036132812, -0.1261005401611328, -0.1205902099609375, -0.11507987976074219, -0.10956954956054688, -0.10405921936035156, -0.09854888916015625, -0.09303855895996094, -0.08752822875976562, -0.08201789855957031, -0.076507568359375, -0.07099723815917969, -0.06548690795898438, -0.05997657775878906, -0.05446624755859375, -0.04895591735839844, -0.043445587158203125, -0.03793525695800781, -0.0324249267578125, -0.026914596557617188, -0.021404266357421875, -0.015893936157226562, -0.01038360595703125, -0.0048732757568359375, 0.000637054443359375, 0.0061473846435546875, 0.01165771484375, 0.017168045043945312, 0.022678375244140625, 0.028188705444335938, 0.03369903564453125, 0.03920936584472656, 0.044719696044921875, 0.05023002624511719, 0.0557403564453125, 0.06125068664550781, 0.06676101684570312, 0.07227134704589844, 0.07778167724609375, 0.08329200744628906, 0.08880233764648438, 0.09431266784667969, 0.099822998046875, 0.10533332824707031, 0.11084365844726562, 0.11635398864746094, 0.12186431884765625, 0.12737464904785156, 0.13288497924804688, 0.1383953094482422, 0.1439056396484375, 0.1494159698486328, 0.15492630004882812, 0.16043663024902344, 0.16594696044921875, 0.17145729064941406, 0.17696762084960938, 0.1824779510498047, 0.18798828125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 8.0, 6.0, 8.0, 12.0, 16.0, 35.0, 48.0, 85.0, 100.0, 123.0, 121.0, 112.0, 103.0, 58.0, 50.0, 38.0, 19.0, 13.0, 15.0, 3.0, 8.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04144287109375, -0.040164947509765625, -0.03888702392578125, -0.037609100341796875, -0.0363311767578125, -0.035053253173828125, -0.03377532958984375, -0.032497406005859375, -0.031219482421875, -0.029941558837890625, -0.02866363525390625, -0.027385711669921875, -0.0261077880859375, -0.024829864501953125, -0.02355194091796875, -0.022274017333984375, -0.02099609375, -0.019718170166015625, -0.01844024658203125, -0.017162322998046875, -0.0158843994140625, -0.014606475830078125, -0.01332855224609375, -0.012050628662109375, -0.010772705078125, -0.009494781494140625, -0.00821685791015625, -0.006938934326171875, -0.0056610107421875, -0.004383087158203125, -0.00310516357421875, -0.001827239990234375, -0.00054931640625, 0.000728607177734375, 0.00200653076171875, 0.003284454345703125, 0.0045623779296875, 0.005840301513671875, 0.00711822509765625, 0.008396148681640625, 0.009674072265625, 0.010951995849609375, 0.01222991943359375, 0.013507843017578125, 0.0147857666015625, 0.016063690185546875, 0.01734161376953125, 0.018619537353515625, 0.0198974609375, 0.021175384521484375, 0.02245330810546875, 0.023731231689453125, 0.0250091552734375, 0.026287078857421875, 0.02756500244140625, 0.028842926025390625, 0.030120849609375, 0.031398773193359375, 0.03267669677734375, 0.033954620361328125, 0.0352325439453125, 0.036510467529296875, 0.03778839111328125, 0.039066314697265625, 0.04034423828125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 15.0, 13.0, 32.0, 53.0, 112.0, 139.0, 173.0, 186.0, 104.0, 53.0, 36.0, 25.0, 15.0, 8.0, 5.0, 3.0, 1.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4070826768875122, -1.3561787605285645, -1.3052749633789062, -1.2543710470199585, -1.2034671306610107, -1.1525633335113525, -1.1016594171524048, -1.050755500793457, -0.9998517036437988, -0.9489478468894958, -0.8980439901351929, -0.8471400737762451, -0.7962362170219421, -0.7453323602676392, -0.6944284439086914, -0.6435245871543884, -0.5926207304000854, -0.5417168736457825, -0.4908129870891571, -0.43990910053253174, -0.38900524377822876, -0.3381013870239258, -0.2871975004673004, -0.23629361391067505, -0.18538975715637207, -0.1344858855009079, -0.08358201384544373, -0.03267814218997955, 0.01822572946548462, 0.0691295862197876, 0.12003347277641296, 0.17093735933303833, 0.22184133529663086, 0.27274519205093384, 0.3236490786075592, 0.37455296516418457, 0.42545682191848755, 0.4763606786727905, 0.5272645950317383, 0.5781684517860413, 0.6290723085403442, 0.6799761652946472, 0.7308800220489502, 0.781783938407898, 0.8326877951622009, 0.8835916519165039, 0.9344955682754517, 0.9853994250297546, 1.0363032817840576, 1.0872071981430054, 1.1381109952926636, 1.1890149116516113, 1.2399187088012695, 1.2908226251602173, 1.341726541519165, 1.3926303386688232, 1.443534255027771, 1.4944381713867188, 1.545341968536377, 1.5962458848953247, 1.6471498012542725, 1.6980535984039307, 1.7489575147628784, 1.7998614311218262, 1.8507652282714844]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 9.0, 7.0, 13.0, 12.0, 18.0, 20.0, 23.0, 27.0, 28.0, 53.0, 51.0, 43.0, 50.0, 44.0, 50.0, 57.0, 50.0, 61.0, 56.0, 63.0, 49.0, 38.0, 24.0, 26.0, 22.0, 26.0, 16.0, 13.0, 13.0, 8.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6505870223045349, -0.6298807263374329, -0.6091744899749756, -0.5884681940078735, -0.5677618980407715, -0.5470556020736694, -0.5263493657112122, -0.5056430697441101, -0.48493680357933044, -0.4642305374145508, -0.44352424144744873, -0.42281797528266907, -0.4021117091178894, -0.38140541315078735, -0.3606991469860077, -0.339992880821228, -0.319286584854126, -0.2985803186893463, -0.27787402272224426, -0.2571677565574646, -0.23646147549152374, -0.21575519442558289, -0.19504892826080322, -0.17434264719486237, -0.1536363661289215, -0.13293008506298065, -0.11222381144762039, -0.09151753783226013, -0.07081125676631927, -0.05010497570037842, -0.029398702085018158, -0.008692428469657898, 0.012013852596282959, 0.03272012993693352, 0.053426407277584076, 0.07413268089294434, 0.09483896195888519, 0.11554524302482605, 0.1362515091896057, 0.15695779025554657, 0.17766407132148743, 0.19837035238742828, 0.21907663345336914, 0.2397828996181488, 0.26048916578292847, 0.2811954617500305, 0.3019017279148102, 0.32260799407958984, 0.3433142900466919, 0.36402055621147156, 0.3847268521785736, 0.40543311834335327, 0.4261394143104553, 0.446845680475235, 0.46755194664001465, 0.4882582426071167, 0.5089645385742188, 0.5296708345413208, 0.5503770709037781, 0.5710833668708801, 0.5917896628379822, 0.6124958992004395, 0.6332021951675415, 0.6539084911346436, 0.6746147274971008]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 12.0, 21.0, 22.0, 28.0, 41.0, 90.0, 179.0, 321.0, 668.0, 1451.0, 3527.0, 8746.0, 25669.0, 87845.0, 384227.0, 400730.0, 92547.0, 26648.0, 9258.0, 3556.0, 1528.0, 674.0, 353.0, 157.0, 89.0, 58.0, 32.0, 16.0, 12.0, 9.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88330078125, -0.8538742065429688, -0.8244476318359375, -0.7950210571289062, -0.765594482421875, -0.7361679077148438, -0.7067413330078125, -0.6773147583007812, -0.64788818359375, -0.6184616088867188, -0.5890350341796875, -0.5596084594726562, -0.530181884765625, -0.5007553100585938, -0.4713287353515625, -0.44190216064453125, -0.4124755859375, -0.38304901123046875, -0.3536224365234375, -0.32419586181640625, -0.294769287109375, -0.26534271240234375, -0.2359161376953125, -0.20648956298828125, -0.17706298828125, -0.14763641357421875, -0.1182098388671875, -0.08878326416015625, -0.059356689453125, -0.02993011474609375, -0.0005035400390625, 0.02892303466796875, 0.058349609375, 0.08777618408203125, 0.1172027587890625, 0.14662933349609375, 0.176055908203125, 0.20548248291015625, 0.2349090576171875, 0.26433563232421875, 0.29376220703125, 0.32318878173828125, 0.3526153564453125, 0.38204193115234375, 0.411468505859375, 0.44089508056640625, 0.4703216552734375, 0.49974822998046875, 0.5291748046875, 0.5586013793945312, 0.5880279541015625, 0.6174545288085938, 0.646881103515625, 0.6763076782226562, 0.7057342529296875, 0.7351608276367188, 0.76458740234375, 0.7940139770507812, 0.8234405517578125, 0.8528671264648438, 0.882293701171875, 0.9117202758789062, 0.9411468505859375, 0.9705734252929688, 1.0]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 3.0, 6.0, 7.0, 10.0, 4.0, 14.0, 16.0, 30.0, 27.0, 26.0, 40.0, 47.0, 37.0, 47.0, 57.0, 60.0, 50.0, 60.0, 58.0, 76.0, 54.0, 50.0, 45.0, 35.0, 29.0, 26.0, 23.0, 15.0, 12.0, 9.0, 10.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3828125, -1.33514404296875, -1.2874755859375, -1.23980712890625, -1.192138671875, -1.14447021484375, -1.0968017578125, -1.04913330078125, -1.00146484375, -0.95379638671875, -0.9061279296875, -0.85845947265625, -0.810791015625, -0.76312255859375, -0.7154541015625, -0.66778564453125, -0.6201171875, -0.57244873046875, -0.5247802734375, -0.47711181640625, -0.429443359375, -0.38177490234375, -0.3341064453125, -0.28643798828125, -0.23876953125, -0.19110107421875, -0.1434326171875, -0.09576416015625, -0.048095703125, -0.00042724609375, 0.0472412109375, 0.09490966796875, 0.142578125, 0.19024658203125, 0.2379150390625, 0.28558349609375, 0.333251953125, 0.38092041015625, 0.4285888671875, 0.47625732421875, 0.52392578125, 0.57159423828125, 0.6192626953125, 0.66693115234375, 0.714599609375, 0.76226806640625, 0.8099365234375, 0.85760498046875, 0.9052734375, 0.95294189453125, 1.0006103515625, 1.04827880859375, 1.095947265625, 1.14361572265625, 1.1912841796875, 1.23895263671875, 1.28662109375, 1.33428955078125, 1.3819580078125, 1.42962646484375, 1.477294921875, 1.52496337890625, 1.5726318359375, 1.62030029296875, 1.66796875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 10.0, 17.0, 10.0, 11.0, 13.0, 20.0, 23.0, 22.0, 29.0, 26.0, 28.0, 45.0, 44.0, 67.0, 124.0, 772.0, 51773.0, 985085.0, 9582.0, 360.0, 99.0, 67.0, 42.0, 31.0, 38.0, 18.0, 29.0, 18.0, 26.0, 16.0, 20.0, 14.0, 10.0, 11.0, 12.0, 9.0, 4.0, 2.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.12109375, -3.997467041015625, -3.87384033203125, -3.750213623046875, -3.6265869140625, -3.502960205078125, -3.37933349609375, -3.255706787109375, -3.132080078125, -3.008453369140625, -2.88482666015625, -2.761199951171875, -2.6375732421875, -2.513946533203125, -2.39031982421875, -2.266693115234375, -2.14306640625, -2.019439697265625, -1.89581298828125, -1.772186279296875, -1.6485595703125, -1.524932861328125, -1.40130615234375, -1.277679443359375, -1.154052734375, -1.030426025390625, -0.90679931640625, -0.783172607421875, -0.6595458984375, -0.535919189453125, -0.41229248046875, -0.288665771484375, -0.1650390625, -0.041412353515625, 0.08221435546875, 0.205841064453125, 0.3294677734375, 0.453094482421875, 0.57672119140625, 0.700347900390625, 0.823974609375, 0.947601318359375, 1.07122802734375, 1.194854736328125, 1.3184814453125, 1.442108154296875, 1.56573486328125, 1.689361572265625, 1.81298828125, 1.936614990234375, 2.06024169921875, 2.183868408203125, 2.3074951171875, 2.431121826171875, 2.55474853515625, 2.678375244140625, 2.802001953125, 2.925628662109375, 3.04925537109375, 3.172882080078125, 3.2965087890625, 3.420135498046875, 3.54376220703125, 3.667388916015625, 3.791015625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 3.0, 6.0, 7.0, 6.0, 18.0, 12.0, 12.0, 18.0, 13.0, 17.0, 33.0, 20.0, 30.0, 44.0, 33.0, 25.0, 40.0, 44.0, 41.0, 40.0, 51.0, 53.0, 49.0, 41.0, 32.0, 24.0, 34.0, 40.0, 23.0, 16.0, 28.0, 20.0, 12.0, 20.0, 23.0, 13.0, 7.0, 9.0, 9.0, 8.0, 7.0, 2.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2431640625, -1.2056427001953125, -1.168121337890625, -1.1305999755859375, -1.09307861328125, -1.0555572509765625, -1.018035888671875, -0.9805145263671875, -0.9429931640625, -0.9054718017578125, -0.867950439453125, -0.8304290771484375, -0.79290771484375, -0.7553863525390625, -0.717864990234375, -0.6803436279296875, -0.642822265625, -0.6053009033203125, -0.567779541015625, -0.5302581787109375, -0.49273681640625, -0.4552154541015625, -0.417694091796875, -0.3801727294921875, -0.3426513671875, -0.3051300048828125, -0.267608642578125, -0.2300872802734375, -0.19256591796875, -0.1550445556640625, -0.117523193359375, -0.0800018310546875, -0.04248046875, -0.0049591064453125, 0.032562255859375, 0.0700836181640625, 0.10760498046875, 0.1451263427734375, 0.182647705078125, 0.2201690673828125, 0.2576904296875, 0.2952117919921875, 0.332733154296875, 0.3702545166015625, 0.40777587890625, 0.4452972412109375, 0.482818603515625, 0.5203399658203125, 0.557861328125, 0.5953826904296875, 0.632904052734375, 0.6704254150390625, 0.70794677734375, 0.7454681396484375, 0.782989501953125, 0.8205108642578125, 0.8580322265625, 0.8955535888671875, 0.933074951171875, 0.9705963134765625, 1.00811767578125, 1.0456390380859375, 1.083160400390625, 1.1206817626953125, 1.158203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 7.0, 8.0, 11.0, 14.0, 27.0, 31.0, 39.0, 60.0, 103.0, 176.0, 319.0, 611.0, 1312.0, 3042.0, 7735.0, 22004.0, 80348.0, 391556.0, 417685.0, 86257.0, 23390.0, 7898.0, 3124.0, 1308.0, 663.0, 327.0, 175.0, 113.0, 67.0, 38.0, 31.0, 23.0, 17.0, 11.0, 9.0, 4.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2098388671875, -0.2020740509033203, -0.19430923461914062, -0.18654441833496094, -0.17877960205078125, -0.17101478576660156, -0.16324996948242188, -0.1554851531982422, -0.1477203369140625, -0.1399555206298828, -0.13219070434570312, -0.12442588806152344, -0.11666107177734375, -0.10889625549316406, -0.10113143920898438, -0.09336662292480469, -0.085601806640625, -0.07783699035644531, -0.07007217407226562, -0.06230735778808594, -0.05454254150390625, -0.04677772521972656, -0.039012908935546875, -0.031248092651367188, -0.0234832763671875, -0.015718460083007812, -0.007953643798828125, -0.0001888275146484375, 0.00757598876953125, 0.015340805053710938, 0.023105621337890625, 0.030870437622070312, 0.03863525390625, 0.04640007019042969, 0.054164886474609375, 0.06192970275878906, 0.06969451904296875, 0.07745933532714844, 0.08522415161132812, 0.09298896789550781, 0.1007537841796875, 0.10851860046386719, 0.11628341674804688, 0.12404823303222656, 0.13181304931640625, 0.13957786560058594, 0.14734268188476562, 0.1551074981689453, 0.162872314453125, 0.1706371307373047, 0.17840194702148438, 0.18616676330566406, 0.19393157958984375, 0.20169639587402344, 0.20946121215820312, 0.2172260284423828, 0.2249908447265625, 0.2327556610107422, 0.24052047729492188, 0.24828529357910156, 0.25605010986328125, 0.26381492614746094, 0.2715797424316406, 0.2793445587158203, 0.287109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 11.0, 11.0, 8.0, 15.0, 11.0, 25.0, 29.0, 24.0, 46.0, 49.0, 77.0, 98.0, 121.0, 106.0, 90.0, 75.0, 47.0, 40.0, 26.0, 27.0, 22.0, 5.0, 9.0, 8.0, 8.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8743019104003906e-05, -3.735162317752838e-05, -3.5960227251052856e-05, -3.456883132457733e-05, -3.317743539810181e-05, -3.178603947162628e-05, -3.0394643545150757e-05, -2.9003247618675232e-05, -2.7611851692199707e-05, -2.6220455765724182e-05, -2.4829059839248657e-05, -2.3437663912773132e-05, -2.2046267986297607e-05, -2.0654872059822083e-05, -1.9263476133346558e-05, -1.7872080206871033e-05, -1.6480684280395508e-05, -1.5089288353919983e-05, -1.3697892427444458e-05, -1.2306496500968933e-05, -1.0915100574493408e-05, -9.523704648017883e-06, -8.132308721542358e-06, -6.7409127950668335e-06, -5.349516868591309e-06, -3.958120942115784e-06, -2.566725015640259e-06, -1.1753290891647339e-06, 2.1606683731079102e-07, 1.607462763786316e-06, 2.998858690261841e-06, 4.390254616737366e-06, 5.781650543212891e-06, 7.1730464696884155e-06, 8.56444239616394e-06, 9.955838322639465e-06, 1.134723424911499e-05, 1.2738630175590515e-05, 1.413002610206604e-05, 1.5521422028541565e-05, 1.691281795501709e-05, 1.8304213881492615e-05, 1.969560980796814e-05, 2.1087005734443665e-05, 2.247840166091919e-05, 2.3869797587394714e-05, 2.526119351387024e-05, 2.6652589440345764e-05, 2.804398536682129e-05, 2.9435381293296814e-05, 3.082677721977234e-05, 3.2218173146247864e-05, 3.360956907272339e-05, 3.5000964999198914e-05, 3.639236092567444e-05, 3.778375685214996e-05, 3.917515277862549e-05, 4.056654870510101e-05, 4.195794463157654e-05, 4.334934055805206e-05, 4.474073648452759e-05, 4.613213241100311e-05, 4.752352833747864e-05, 4.891492426395416e-05, 5.030632019042969e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 13.0, 7.0, 26.0, 22.0, 49.0, 60.0, 90.0, 167.0, 262.0, 451.0, 755.0, 1453.0, 2513.0, 5018.0, 10446.0, 24759.0, 67236.0, 211693.0, 421580.0, 195873.0, 62421.0, 23242.0, 10015.0, 4747.0, 2480.0, 1318.0, 720.0, 428.0, 237.0, 159.0, 119.0, 48.0, 47.0, 18.0, 20.0, 8.0, 15.0, 11.0, 5.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1763916015625, -0.17078590393066406, -0.16518020629882812, -0.1595745086669922, -0.15396881103515625, -0.1483631134033203, -0.14275741577148438, -0.13715171813964844, -0.1315460205078125, -0.12594032287597656, -0.12033462524414062, -0.11472892761230469, -0.10912322998046875, -0.10351753234863281, -0.09791183471679688, -0.09230613708496094, -0.086700439453125, -0.08109474182128906, -0.07548904418945312, -0.06988334655761719, -0.06427764892578125, -0.05867195129394531, -0.053066253662109375, -0.04746055603027344, -0.0418548583984375, -0.03624916076660156, -0.030643463134765625, -0.025037765502929688, -0.01943206787109375, -0.013826370239257812, -0.008220672607421875, -0.0026149749755859375, 0.00299072265625, 0.008596420288085938, 0.014202117919921875, 0.019807815551757812, 0.02541351318359375, 0.031019210815429688, 0.036624908447265625, 0.04223060607910156, 0.0478363037109375, 0.05344200134277344, 0.059047698974609375, 0.06465339660644531, 0.07025909423828125, 0.07586479187011719, 0.08147048950195312, 0.08707618713378906, 0.092681884765625, 0.09828758239746094, 0.10389328002929688, 0.10949897766113281, 0.11510467529296875, 0.12071037292480469, 0.12631607055664062, 0.13192176818847656, 0.1375274658203125, 0.14313316345214844, 0.14873886108398438, 0.1543445587158203, 0.15995025634765625, 0.1655559539794922, 0.17116165161132812, 0.17676734924316406, 0.182373046875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 7.0, 9.0, 9.0, 20.0, 15.0, 23.0, 26.0, 41.0, 38.0, 48.0, 47.0, 49.0, 71.0, 74.0, 59.0, 74.0, 63.0, 45.0, 52.0, 44.0, 37.0, 33.0, 10.0, 23.0, 11.0, 12.0, 9.0, 9.0, 10.0, 6.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1019287109375, -0.09894657135009766, -0.09596443176269531, -0.09298229217529297, -0.09000015258789062, -0.08701801300048828, -0.08403587341308594, -0.0810537338256836, -0.07807159423828125, -0.0750894546508789, -0.07210731506347656, -0.06912517547607422, -0.06614303588867188, -0.06316089630126953, -0.06017875671386719, -0.057196617126464844, -0.0542144775390625, -0.051232337951660156, -0.04825019836425781, -0.04526805877685547, -0.042285919189453125, -0.03930377960205078, -0.03632164001464844, -0.033339500427246094, -0.03035736083984375, -0.027375221252441406, -0.024393081665039062, -0.02141094207763672, -0.018428802490234375, -0.015446662902832031, -0.012464523315429688, -0.009482383728027344, -0.006500244140625, -0.0035181045532226562, -0.0005359649658203125, 0.0024461746215820312, 0.005428314208984375, 0.008410453796386719, 0.011392593383789062, 0.014374732971191406, 0.01735687255859375, 0.020339012145996094, 0.023321151733398438, 0.02630329132080078, 0.029285430908203125, 0.03226757049560547, 0.03524971008300781, 0.038231849670410156, 0.0412139892578125, 0.044196128845214844, 0.04717826843261719, 0.05016040802001953, 0.053142547607421875, 0.05612468719482422, 0.05910682678222656, 0.062088966369628906, 0.06507110595703125, 0.0680532455444336, 0.07103538513183594, 0.07401752471923828, 0.07699966430664062, 0.07998180389404297, 0.08296394348144531, 0.08594608306884766, 0.08892822265625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 13.0, 33.0, 79.0, 190.0, 281.0, 213.0, 112.0, 37.0, 16.0, 8.0, 9.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.725197792053223, -8.552907943725586, -8.38061809539795, -8.208327293395996, -8.03603744506836, -7.863747596740723, -7.691457748413086, -7.519167900085449, -7.346877574920654, -7.174587726593018, -7.002297401428223, -6.830007553100586, -6.657717704772949, -6.485427379608154, -6.313137531280518, -6.140847206115723, -5.968557357788086, -5.796267509460449, -5.623977184295654, -5.451687335968018, -5.279397010803223, -5.107107162475586, -4.934817314147949, -4.7625274658203125, -4.590237140655518, -4.417947292327881, -4.245656967163086, -4.073367118835449, -3.9010770320892334, -3.7287869453430176, -3.556497097015381, -3.384207010269165, -3.2119174003601074, -3.0396273136138916, -2.867337226867676, -2.695047378540039, -2.5227572917938232, -2.3504672050476074, -2.1781773567199707, -2.005887269973755, -1.833597183227539, -1.6613070964813232, -1.489017128944397, -1.3167271614074707, -1.1444370746612549, -0.9721470475196838, -0.7998570203781128, -0.6275670528411865, -0.4552769660949707, -0.28298693895339966, -0.11069691181182861, 0.06159311532974243, 0.23388314247131348, 0.4061731696128845, 0.5784631967544556, 0.7507531642913818, 0.9230432510375977, 1.0953333377838135, 1.2676233053207397, 1.439913272857666, 1.6122033596038818, 1.7844934463500977, 1.956783413887024, 2.12907338142395, 2.301363468170166]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 6.0, 4.0, 6.0, 9.0, 9.0, 11.0, 17.0, 24.0, 24.0, 32.0, 40.0, 41.0, 37.0, 46.0, 44.0, 48.0, 44.0, 44.0, 59.0, 48.0, 46.0, 37.0, 52.0, 47.0, 44.0, 31.0, 31.0, 17.0, 23.0, 15.0, 10.0, 14.0, 7.0, 10.0, 5.0, 5.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.600468158721924, -2.5228521823883057, -2.4452362060546875, -2.3676204681396484, -2.2900044918060303, -2.212388515472412, -2.134772539138794, -2.057156562805176, -1.9795407056808472, -1.901924729347229, -1.8243088722229004, -1.7466928958892822, -1.669076919555664, -1.5914610624313354, -1.5138450860977173, -1.4362292289733887, -1.3586132526397705, -1.2809972763061523, -1.2033814191818237, -1.1257654428482056, -1.048149585723877, -0.9705336093902588, -0.8929176330566406, -0.8153017163276672, -0.7376857995986938, -0.6600698828697205, -0.5824539661407471, -0.5048379898071289, -0.4272220730781555, -0.34960615634918213, -0.27199020981788635, -0.19437426328659058, -0.11675810813903809, -0.0391421765089035, 0.03847375512123108, 0.11608968675136566, 0.19370561838150024, 0.27132153511047363, 0.3489374816417694, 0.4265534281730652, 0.5041693449020386, 0.581785261631012, 0.6594011783599854, 0.7370171546936035, 0.8146330714225769, 0.8922489881515503, 0.9698649644851685, 1.047480821609497, 1.1250967979431152, 1.2027127742767334, 1.280328631401062, 1.3579446077346802, 1.4355604648590088, 1.513176441192627, 1.5907924175262451, 1.6684083938598633, 1.746024250984192, 1.82364022731781, 1.9012560844421387, 1.9788720607757568, 2.056488037109375, 2.134103775024414, 2.2117197513580322, 2.2893357276916504, 2.3669517040252686]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 3.0, 4.0, 2.0, 10.0, 10.0, 11.0, 22.0, 20.0, 36.0, 45.0, 60.0, 113.0, 154.0, 244.0, 357.0, 664.0, 1129.0, 2348.0, 5138.0, 12818.0, 39934.0, 214741.0, 2133801.0, 1567919.0, 161427.0, 33212.0, 10985.0, 4273.0, 2108.0, 1122.0, 615.0, 348.0, 169.0, 123.0, 90.0, 54.0, 38.0, 39.0, 18.0, 16.0, 16.0, 8.0, 14.0, 12.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.2900390625, -1.25201416015625, -1.2139892578125, -1.17596435546875, -1.137939453125, -1.09991455078125, -1.0618896484375, -1.02386474609375, -0.98583984375, -0.94781494140625, -0.9097900390625, -0.87176513671875, -0.833740234375, -0.79571533203125, -0.7576904296875, -0.71966552734375, -0.681640625, -0.64361572265625, -0.6055908203125, -0.56756591796875, -0.529541015625, -0.49151611328125, -0.4534912109375, -0.41546630859375, -0.37744140625, -0.33941650390625, -0.3013916015625, -0.26336669921875, -0.225341796875, -0.18731689453125, -0.1492919921875, -0.11126708984375, -0.0732421875, -0.03521728515625, 0.0028076171875, 0.04083251953125, 0.078857421875, 0.11688232421875, 0.1549072265625, 0.19293212890625, 0.23095703125, 0.26898193359375, 0.3070068359375, 0.34503173828125, 0.383056640625, 0.42108154296875, 0.4591064453125, 0.49713134765625, 0.53515625, 0.57318115234375, 0.6112060546875, 0.64923095703125, 0.687255859375, 0.72528076171875, 0.7633056640625, 0.80133056640625, 0.83935546875, 0.87738037109375, 0.9154052734375, 0.95343017578125, 0.991455078125, 1.02947998046875, 1.0675048828125, 1.10552978515625, 1.1435546875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 6.0, 3.0, 6.0, 13.0, 19.0, 13.0, 25.0, 28.0, 31.0, 38.0, 45.0, 46.0, 53.0, 48.0, 68.0, 65.0, 80.0, 56.0, 58.0, 39.0, 54.0, 36.0, 34.0, 27.0, 20.0, 18.0, 15.0, 15.0, 12.0, 9.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9349517822265625, -0.904571533203125, -0.8741912841796875, -0.84381103515625, -0.8134307861328125, -0.783050537109375, -0.7526702880859375, -0.7222900390625, -0.6919097900390625, -0.661529541015625, -0.6311492919921875, -0.60076904296875, -0.5703887939453125, -0.540008544921875, -0.5096282958984375, -0.479248046875, -0.4488677978515625, -0.418487548828125, -0.3881072998046875, -0.35772705078125, -0.3273468017578125, -0.296966552734375, -0.2665863037109375, -0.2362060546875, -0.2058258056640625, -0.175445556640625, -0.1450653076171875, -0.11468505859375, -0.0843048095703125, -0.053924560546875, -0.0235443115234375, 0.0068359375, 0.0372161865234375, 0.067596435546875, 0.0979766845703125, 0.12835693359375, 0.1587371826171875, 0.189117431640625, 0.2194976806640625, 0.2498779296875, 0.2802581787109375, 0.310638427734375, 0.3410186767578125, 0.37139892578125, 0.4017791748046875, 0.432159423828125, 0.4625396728515625, 0.492919921875, 0.5233001708984375, 0.553680419921875, 0.5840606689453125, 0.61444091796875, 0.6448211669921875, 0.675201416015625, 0.7055816650390625, 0.7359619140625, 0.7663421630859375, 0.796722412109375, 0.8271026611328125, 0.85748291015625, 0.8878631591796875, 0.918243408203125, 0.9486236572265625, 0.97900390625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 6.0, 6.0, 9.0, 20.0, 27.0, 49.0, 77.0, 154.0, 502.0, 3732.0, 283853.0, 3894110.0, 10368.0, 868.0, 232.0, 94.0, 55.0, 39.0, 21.0, 12.0, 8.0, 11.0, 8.0, 6.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9765625, -4.8265380859375, -4.676513671875, -4.5264892578125, -4.37646484375, -4.2264404296875, -4.076416015625, -3.9263916015625, -3.7763671875, -3.6263427734375, -3.476318359375, -3.3262939453125, -3.17626953125, -3.0262451171875, -2.876220703125, -2.7261962890625, -2.576171875, -2.4261474609375, -2.276123046875, -2.1260986328125, -1.97607421875, -1.8260498046875, -1.676025390625, -1.5260009765625, -1.3759765625, -1.2259521484375, -1.075927734375, -0.9259033203125, -0.77587890625, -0.6258544921875, -0.475830078125, -0.3258056640625, -0.17578125, -0.0257568359375, 0.124267578125, 0.2742919921875, 0.42431640625, 0.5743408203125, 0.724365234375, 0.8743896484375, 1.0244140625, 1.1744384765625, 1.324462890625, 1.4744873046875, 1.62451171875, 1.7745361328125, 1.924560546875, 2.0745849609375, 2.224609375, 2.3746337890625, 2.524658203125, 2.6746826171875, 2.82470703125, 2.9747314453125, 3.124755859375, 3.2747802734375, 3.4248046875, 3.5748291015625, 3.724853515625, 3.8748779296875, 4.02490234375, 4.1749267578125, 4.324951171875, 4.4749755859375, 4.625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 8.0, 9.0, 8.0, 19.0, 25.0, 21.0, 34.0, 38.0, 53.0, 79.0, 114.0, 171.0, 308.0, 497.0, 739.0, 746.0, 460.0, 244.0, 156.0, 105.0, 61.0, 39.0, 34.0, 21.0, 16.0, 17.0, 15.0, 10.0, 8.0, 0.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.433837890625, -0.4223823547363281, -0.41092681884765625, -0.3994712829589844, -0.3880157470703125, -0.3765602111816406, -0.36510467529296875, -0.3536491394042969, -0.342193603515625, -0.3307380676269531, -0.31928253173828125, -0.3078269958496094, -0.2963714599609375, -0.2849159240722656, -0.27346038818359375, -0.2620048522949219, -0.25054931640625, -0.23909378051757812, -0.22763824462890625, -0.21618270874023438, -0.2047271728515625, -0.19327163696289062, -0.18181610107421875, -0.17036056518554688, -0.158905029296875, -0.14744949340820312, -0.13599395751953125, -0.12453842163085938, -0.1130828857421875, -0.10162734985351562, -0.09017181396484375, -0.07871627807617188, -0.0672607421875, -0.055805206298828125, -0.04434967041015625, -0.032894134521484375, -0.0214385986328125, -0.009983062744140625, 0.00147247314453125, 0.012928009033203125, 0.024383544921875, 0.035839080810546875, 0.04729461669921875, 0.058750152587890625, 0.0702056884765625, 0.08166122436523438, 0.09311676025390625, 0.10457229614257812, 0.11602783203125, 0.12748336791992188, 0.13893890380859375, 0.15039443969726562, 0.1618499755859375, 0.17330551147460938, 0.18476104736328125, 0.19621658325195312, 0.207672119140625, 0.21912765502929688, 0.23058319091796875, 0.24203872680664062, 0.2534942626953125, 0.2649497985839844, 0.27640533447265625, 0.2878608703613281, 0.29931640625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 7.0, 6.0, 12.0, 12.0, 30.0, 35.0, 59.0, 76.0, 111.0, 119.0, 128.0, 107.0, 97.0, 74.0, 43.0, 28.0, 15.0, 13.0, 7.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7254536151885986, -1.6646838188171387, -1.6039140224456787, -1.5431443452835083, -1.4823745489120483, -1.4216047525405884, -1.360835075378418, -1.300065279006958, -1.239295482635498, -1.178525686264038, -1.1177558898925781, -1.0569862127304077, -0.9962164163589478, -0.9354466199874878, -0.8746768832206726, -0.8139071464538574, -0.7531373500823975, -0.6923675537109375, -0.6315978169441223, -0.5708280801773071, -0.5100582838058472, -0.4492885172367096, -0.388518750667572, -0.32774898409843445, -0.2669792175292969, -0.2062094509601593, -0.14543968439102173, -0.08466991782188416, -0.023900151252746582, 0.03686961531639099, 0.09763938188552856, 0.15840914845466614, 0.2191789150238037, 0.2799486815929413, 0.34071844816207886, 0.40148821473121643, 0.462257981300354, 0.523027777671814, 0.5837975144386292, 0.6445672512054443, 0.7053370475769043, 0.7661068439483643, 0.8268765807151794, 0.8876463174819946, 0.9484161138534546, 1.0091859102249146, 1.069955587387085, 1.130725383758545, 1.1914951801300049, 1.2522649765014648, 1.3130347728729248, 1.3738044500350952, 1.4345742464065552, 1.4953440427780151, 1.5561137199401855, 1.6168835163116455, 1.6776533126831055, 1.7384231090545654, 1.7991929054260254, 1.8599625825881958, 1.9207323789596558, 1.9815021753311157, 2.042271852493286, 2.103041648864746, 2.163811445236206]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 8.0, 6.0, 7.0, 9.0, 12.0, 21.0, 24.0, 35.0, 37.0, 46.0, 40.0, 53.0, 71.0, 64.0, 59.0, 64.0, 56.0, 65.0, 60.0, 57.0, 33.0, 29.0, 36.0, 37.0, 16.0, 17.0, 11.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.300908088684082, -1.2635077238082886, -1.2261073589324951, -1.1887069940567017, -1.1513066291809082, -1.1139062643051147, -1.0765058994293213, -1.0391055345535278, -1.0017051696777344, -0.9643048048019409, -0.9269044399261475, -0.889504075050354, -0.8521037101745605, -0.8147033452987671, -0.7773029804229736, -0.7399026155471802, -0.7025023102760315, -0.665101945400238, -0.6277015805244446, -0.5903012156486511, -0.5529008507728577, -0.5155004858970642, -0.47810015082359314, -0.4406997859477997, -0.4032994210720062, -0.36589905619621277, -0.3284986913204193, -0.29109835624694824, -0.2536979913711548, -0.21629761159420013, -0.17889726161956787, -0.14149689674377441, -0.10409653186798096, -0.0666961669921875, -0.02929580956697464, 0.00810454785823822, 0.04550491273403168, 0.08290527760982513, 0.1203056275844574, 0.15770599246025085, 0.1951063573360443, 0.23250672221183777, 0.2699070870876312, 0.3073074221611023, 0.34470778703689575, 0.3821081519126892, 0.41950851678848267, 0.4569088816642761, 0.4943092465400696, 0.531709611415863, 0.5691099762916565, 0.60651034116745, 0.6439107060432434, 0.6813110709190369, 0.7187113761901855, 0.756111741065979, 0.7935121059417725, 0.8309124708175659, 0.8683128356933594, 0.9057132005691528, 0.9431135654449463, 0.9805139303207397, 1.0179142951965332, 1.0553146600723267, 1.0927150249481201]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 10.0, 10.0, 16.0, 22.0, 20.0, 22.0, 41.0, 75.0, 107.0, 208.0, 446.0, 1102.0, 2996.0, 10084.0, 43213.0, 269484.0, 584490.0, 106678.0, 20852.0, 5399.0, 1836.0, 719.0, 285.0, 148.0, 107.0, 56.0, 35.0, 24.0, 12.0, 5.0, 10.0, 6.0, 3.0, 1.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.364013671875, -0.3530693054199219, -0.34212493896484375, -0.3311805725097656, -0.3202362060546875, -0.3092918395996094, -0.29834747314453125, -0.2874031066894531, -0.276458740234375, -0.2655143737792969, -0.25457000732421875, -0.24362564086914062, -0.2326812744140625, -0.22173690795898438, -0.21079254150390625, -0.19984817504882812, -0.18890380859375, -0.17795944213867188, -0.16701507568359375, -0.15607070922851562, -0.1451263427734375, -0.13418197631835938, -0.12323760986328125, -0.11229324340820312, -0.101348876953125, -0.09040451049804688, -0.07946014404296875, -0.06851577758789062, -0.0575714111328125, -0.046627044677734375, -0.03568267822265625, -0.024738311767578125, -0.0137939453125, -0.002849578857421875, 0.00809478759765625, 0.019039154052734375, 0.0299835205078125, 0.040927886962890625, 0.05187225341796875, 0.06281661987304688, 0.073760986328125, 0.08470535278320312, 0.09564971923828125, 0.10659408569335938, 0.1175384521484375, 0.12848281860351562, 0.13942718505859375, 0.15037155151367188, 0.16131591796875, 0.17226028442382812, 0.18320465087890625, 0.19414901733398438, 0.2050933837890625, 0.21603775024414062, 0.22698211669921875, 0.23792648315429688, 0.248870849609375, 0.2598152160644531, 0.27075958251953125, 0.2817039489746094, 0.2926483154296875, 0.3035926818847656, 0.31453704833984375, 0.3254814147949219, 0.33642578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 13.0, 14.0, 25.0, 29.0, 38.0, 44.0, 56.0, 65.0, 80.0, 70.0, 86.0, 69.0, 81.0, 54.0, 60.0, 50.0, 37.0, 31.0, 27.0, 11.0, 15.0, 12.0, 4.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.90869140625, -0.880035400390625, -0.85137939453125, -0.822723388671875, -0.7940673828125, -0.765411376953125, -0.73675537109375, -0.708099365234375, -0.679443359375, -0.650787353515625, -0.62213134765625, -0.593475341796875, -0.5648193359375, -0.536163330078125, -0.50750732421875, -0.478851318359375, -0.4501953125, -0.421539306640625, -0.39288330078125, -0.364227294921875, -0.3355712890625, -0.306915283203125, -0.27825927734375, -0.249603271484375, -0.220947265625, -0.192291259765625, -0.16363525390625, -0.134979248046875, -0.1063232421875, -0.077667236328125, -0.04901123046875, -0.020355224609375, 0.00830078125, 0.036956787109375, 0.06561279296875, 0.094268798828125, 0.1229248046875, 0.151580810546875, 0.18023681640625, 0.208892822265625, 0.237548828125, 0.266204833984375, 0.29486083984375, 0.323516845703125, 0.3521728515625, 0.380828857421875, 0.40948486328125, 0.438140869140625, 0.466796875, 0.495452880859375, 0.52410888671875, 0.552764892578125, 0.5814208984375, 0.610076904296875, 0.63873291015625, 0.667388916015625, 0.696044921875, 0.724700927734375, 0.75335693359375, 0.782012939453125, 0.8106689453125, 0.839324951171875, 0.86798095703125, 0.896636962890625, 0.92529296875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 6.0, 5.0, 5.0, 4.0, 11.0, 13.0, 22.0, 25.0, 57.0, 58.0, 123.0, 212.0, 459.0, 1029.0, 2662.0, 10168.0, 57776.0, 462114.0, 445046.0, 54624.0, 9538.0, 2681.0, 957.0, 409.0, 215.0, 129.0, 75.0, 39.0, 29.0, 14.0, 12.0, 14.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.314208984375, -0.3043861389160156, -0.29456329345703125, -0.2847404479980469, -0.2749176025390625, -0.2650947570800781, -0.25527191162109375, -0.24544906616210938, -0.235626220703125, -0.22580337524414062, -0.21598052978515625, -0.20615768432617188, -0.1963348388671875, -0.18651199340820312, -0.17668914794921875, -0.16686630249023438, -0.15704345703125, -0.14722061157226562, -0.13739776611328125, -0.12757492065429688, -0.1177520751953125, -0.10792922973632812, -0.09810638427734375, -0.08828353881835938, -0.078460693359375, -0.06863784790039062, -0.05881500244140625, -0.048992156982421875, -0.0391693115234375, -0.029346466064453125, -0.01952362060546875, -0.009700775146484375, 0.0001220703125, 0.009944915771484375, 0.01976776123046875, 0.029590606689453125, 0.0394134521484375, 0.049236297607421875, 0.05905914306640625, 0.06888198852539062, 0.078704833984375, 0.08852767944335938, 0.09835052490234375, 0.10817337036132812, 0.1179962158203125, 0.12781906127929688, 0.13764190673828125, 0.14746475219726562, 0.15728759765625, 0.16711044311523438, 0.17693328857421875, 0.18675613403320312, 0.1965789794921875, 0.20640182495117188, 0.21622467041015625, 0.22604751586914062, 0.235870361328125, 0.24569320678710938, 0.25551605224609375, 0.2653388977050781, 0.2751617431640625, 0.2849845886230469, 0.29480743408203125, 0.3046302795410156, 0.314453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 9.0, 4.0, 5.0, 8.0, 10.0, 11.0, 16.0, 15.0, 17.0, 18.0, 24.0, 36.0, 35.0, 31.0, 32.0, 31.0, 35.0, 51.0, 49.0, 45.0, 46.0, 50.0, 39.0, 34.0, 46.0, 40.0, 34.0, 26.0, 23.0, 30.0, 22.0, 14.0, 22.0, 12.0, 12.0, 16.0, 8.0, 11.0, 13.0, 10.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98779296875, -0.9526596069335938, -0.9175262451171875, -0.8823928833007812, -0.847259521484375, -0.8121261596679688, -0.7769927978515625, -0.7418594360351562, -0.70672607421875, -0.6715927124023438, -0.6364593505859375, -0.6013259887695312, -0.566192626953125, -0.5310592651367188, -0.4959259033203125, -0.46079254150390625, -0.4256591796875, -0.39052581787109375, -0.3553924560546875, -0.32025909423828125, -0.285125732421875, -0.24999237060546875, -0.2148590087890625, -0.17972564697265625, -0.14459228515625, -0.10945892333984375, -0.0743255615234375, -0.03919219970703125, -0.004058837890625, 0.03107452392578125, 0.0662078857421875, 0.10134124755859375, 0.136474609375, 0.17160797119140625, 0.2067413330078125, 0.24187469482421875, 0.277008056640625, 0.31214141845703125, 0.3472747802734375, 0.38240814208984375, 0.41754150390625, 0.45267486572265625, 0.4878082275390625, 0.5229415893554688, 0.558074951171875, 0.5932083129882812, 0.6283416748046875, 0.6634750366210938, 0.6986083984375, 0.7337417602539062, 0.7688751220703125, 0.8040084838867188, 0.839141845703125, 0.8742752075195312, 0.9094085693359375, 0.9445419311523438, 0.97967529296875, 1.0148086547851562, 1.0499420166015625, 1.0850753784179688, 1.120208740234375, 1.1553421020507812, 1.1904754638671875, 1.2256088256835938, 1.2607421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 5.0, 3.0, 3.0, 5.0, 12.0, 12.0, 25.0, 16.0, 33.0, 57.0, 89.0, 128.0, 195.0, 281.0, 607.0, 1173.0, 2419.0, 6139.0, 17958.0, 67813.0, 324715.0, 475126.0, 109919.0, 26647.0, 8500.0, 3301.0, 1497.0, 739.0, 425.0, 268.0, 151.0, 85.0, 61.0, 36.0, 30.0, 24.0, 15.0, 10.0, 8.0, 6.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07855224609375, -0.07576274871826172, -0.07297325134277344, -0.07018375396728516, -0.06739425659179688, -0.0646047592163086, -0.06181526184082031, -0.05902576446533203, -0.05623626708984375, -0.05344676971435547, -0.05065727233886719, -0.047867774963378906, -0.045078277587890625, -0.042288780212402344, -0.03949928283691406, -0.03670978546142578, -0.0339202880859375, -0.03113079071044922, -0.028341293334960938, -0.025551795959472656, -0.022762298583984375, -0.019972801208496094, -0.017183303833007812, -0.014393806457519531, -0.01160430908203125, -0.008814811706542969, -0.0060253143310546875, -0.0032358169555664062, -0.000446319580078125, 0.0023431777954101562, 0.0051326751708984375, 0.007922172546386719, 0.010711669921875, 0.013501167297363281, 0.016290664672851562, 0.019080162048339844, 0.021869659423828125, 0.024659156799316406, 0.027448654174804688, 0.03023815155029297, 0.03302764892578125, 0.03581714630126953, 0.03860664367675781, 0.041396141052246094, 0.044185638427734375, 0.046975135803222656, 0.04976463317871094, 0.05255413055419922, 0.0553436279296875, 0.05813312530517578, 0.06092262268066406, 0.06371212005615234, 0.06650161743164062, 0.0692911148071289, 0.07208061218261719, 0.07487010955810547, 0.07765960693359375, 0.08044910430908203, 0.08323860168457031, 0.0860280990600586, 0.08881759643554688, 0.09160709381103516, 0.09439659118652344, 0.09718608856201172, 0.0999755859375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 5.0, 4.0, 4.0, 7.0, 8.0, 21.0, 16.0, 32.0, 39.0, 21.0, 37.0, 59.0, 56.0, 71.0, 86.0, 61.0, 70.0, 69.0, 56.0, 51.0, 42.0, 43.0, 19.0, 23.0, 18.0, 16.0, 17.0, 10.0, 6.0, 7.0, 3.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.2319297790527344e-05, -4.085153341293335e-05, -3.9383769035339355e-05, -3.791600465774536e-05, -3.644824028015137e-05, -3.498047590255737e-05, -3.351271152496338e-05, -3.2044947147369385e-05, -3.057718276977539e-05, -2.9109418392181396e-05, -2.7641654014587402e-05, -2.6173889636993408e-05, -2.4706125259399414e-05, -2.323836088180542e-05, -2.1770596504211426e-05, -2.030283212661743e-05, -1.8835067749023438e-05, -1.7367303371429443e-05, -1.589953899383545e-05, -1.4431774616241455e-05, -1.2964010238647461e-05, -1.1496245861053467e-05, -1.0028481483459473e-05, -8.560717105865479e-06, -7.092952728271484e-06, -5.62518835067749e-06, -4.157423973083496e-06, -2.689659595489502e-06, -1.2218952178955078e-06, 2.4586915969848633e-07, 1.7136335372924805e-06, 3.1813979148864746e-06, 4.649162292480469e-06, 6.116926670074463e-06, 7.584691047668457e-06, 9.052455425262451e-06, 1.0520219802856445e-05, 1.198798418045044e-05, 1.3455748558044434e-05, 1.4923512935638428e-05, 1.6391277313232422e-05, 1.7859041690826416e-05, 1.932680606842041e-05, 2.0794570446014404e-05, 2.22623348236084e-05, 2.3730099201202393e-05, 2.5197863578796387e-05, 2.666562795639038e-05, 2.8133392333984375e-05, 2.960115671157837e-05, 3.106892108917236e-05, 3.253668546676636e-05, 3.400444984436035e-05, 3.5472214221954346e-05, 3.693997859954834e-05, 3.8407742977142334e-05, 3.987550735473633e-05, 4.134327173233032e-05, 4.2811036109924316e-05, 4.427880048751831e-05, 4.5746564865112305e-05, 4.72143292427063e-05, 4.868209362030029e-05, 5.014985799789429e-05, 5.161762237548828e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 5.0, 13.0, 18.0, 31.0, 40.0, 97.0, 243.0, 451.0, 1345.0, 4670.0, 23677.0, 187258.0, 677822.0, 129830.0, 17370.0, 3716.0, 1074.0, 420.0, 190.0, 91.0, 56.0, 35.0, 20.0, 15.0, 16.0, 13.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1494140625, -0.1449432373046875, -0.140472412109375, -0.1360015869140625, -0.13153076171875, -0.1270599365234375, -0.122589111328125, -0.1181182861328125, -0.1136474609375, -0.1091766357421875, -0.104705810546875, -0.1002349853515625, -0.09576416015625, -0.0912933349609375, -0.086822509765625, -0.0823516845703125, -0.077880859375, -0.0734100341796875, -0.068939208984375, -0.0644683837890625, -0.05999755859375, -0.0555267333984375, -0.051055908203125, -0.0465850830078125, -0.0421142578125, -0.0376434326171875, -0.033172607421875, -0.0287017822265625, -0.02423095703125, -0.0197601318359375, -0.015289306640625, -0.0108184814453125, -0.00634765625, -0.0018768310546875, 0.002593994140625, 0.0070648193359375, 0.01153564453125, 0.0160064697265625, 0.020477294921875, 0.0249481201171875, 0.0294189453125, 0.0338897705078125, 0.038360595703125, 0.0428314208984375, 0.04730224609375, 0.0517730712890625, 0.056243896484375, 0.0607147216796875, 0.065185546875, 0.0696563720703125, 0.074127197265625, 0.0785980224609375, 0.08306884765625, 0.0875396728515625, 0.092010498046875, 0.0964813232421875, 0.1009521484375, 0.1054229736328125, 0.109893798828125, 0.1143646240234375, 0.11883544921875, 0.1233062744140625, 0.127777099609375, 0.1322479248046875, 0.13671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 2.0, 9.0, 10.0, 5.0, 11.0, 13.0, 15.0, 34.0, 22.0, 19.0, 31.0, 37.0, 39.0, 41.0, 36.0, 66.0, 45.0, 54.0, 68.0, 73.0, 55.0, 46.0, 39.0, 33.0, 28.0, 33.0, 20.0, 23.0, 15.0, 8.0, 14.0, 9.0, 8.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0177764892578125, -0.01723480224609375, -0.016693115234375, -0.01615142822265625, -0.0156097412109375, -0.01506805419921875, -0.0145263671875, -0.01398468017578125, -0.0134429931640625, -0.01290130615234375, -0.012359619140625, -0.01181793212890625, -0.0112762451171875, -0.01073455810546875, -0.01019287109375, -0.00965118408203125, -0.0091094970703125, -0.00856781005859375, -0.008026123046875, -0.00748443603515625, -0.0069427490234375, -0.00640106201171875, -0.005859375, -0.00531768798828125, -0.0047760009765625, -0.00423431396484375, -0.003692626953125, -0.00315093994140625, -0.0026092529296875, -0.00206756591796875, -0.00152587890625, -0.00098419189453125, -0.0004425048828125, 9.918212890625e-05, 0.000640869140625, 0.00118255615234375, 0.0017242431640625, 0.00226593017578125, 0.0028076171875, 0.00334930419921875, 0.0038909912109375, 0.00443267822265625, 0.004974365234375, 0.00551605224609375, 0.0060577392578125, 0.00659942626953125, 0.00714111328125, 0.00768280029296875, 0.0082244873046875, 0.00876617431640625, 0.009307861328125, 0.00984954833984375, 0.0103912353515625, 0.01093292236328125, 0.011474609375, 0.01201629638671875, 0.0125579833984375, 0.01309967041015625, 0.013641357421875, 0.01418304443359375, 0.0147247314453125, 0.01526641845703125, 0.01580810546875, 0.01634979248046875, 0.0168914794921875]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 5.0, 6.0, 13.0, 22.0, 21.0, 70.0, 95.0, 150.0, 195.0, 169.0, 113.0, 62.0, 35.0, 14.0, 13.0, 6.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5946288108825684, -1.5408854484558105, -1.4871422052383423, -1.4333988428115845, -1.3796554803848267, -1.3259122371673584, -1.2721688747406006, -1.2184255123138428, -1.164682149887085, -1.1109387874603271, -1.0571955442428589, -1.003452181816101, -0.9497088193893433, -0.8959655165672302, -0.8422222137451172, -0.7884788513183594, -0.7347355484962463, -0.6809922456741333, -0.6272488832473755, -0.5735055804252625, -0.5197622179985046, -0.4660189151763916, -0.4122755825519562, -0.35853224992752075, -0.3047889173030853, -0.2510455846786499, -0.19730225205421448, -0.14355893433094025, -0.08981560170650482, -0.03607228398323059, 0.017671048641204834, 0.07141438126564026, 0.12515771389007568, 0.1789010465145111, 0.23264437913894653, 0.28638768196105957, 0.3401310443878174, 0.3938743472099304, 0.44761767983436584, 0.5013610124588013, 0.5551043748855591, 0.6088476777076721, 0.6625910401344299, 0.716334342956543, 0.7700777053833008, 0.8238210082054138, 0.8775643110275269, 0.9313076734542847, 0.9850509762763977, 1.0387942790985107, 1.0925376415252686, 1.1462810039520264, 1.2000242471694946, 1.2537676095962524, 1.3075109720230103, 1.3612542152404785, 1.4149975776672363, 1.4687409400939941, 1.5224841833114624, 1.5762275457382202, 1.629970908164978, 1.6837141513824463, 1.737457513809204, 1.791200876235962, 1.8449442386627197]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 1.0, 8.0, 4.0, 14.0, 9.0, 16.0, 26.0, 30.0, 33.0, 55.0, 55.0, 58.0, 55.0, 82.0, 74.0, 71.0, 66.0, 62.0, 57.0, 53.0, 31.0, 39.0, 21.0, 29.0, 11.0, 5.0, 11.0, 7.0, 3.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.8604404330253601, -0.8348312377929688, -0.8092220425605774, -0.783612847328186, -0.7580037117004395, -0.7323944568634033, -0.7067853212356567, -0.6811761260032654, -0.655566930770874, -0.6299577355384827, -0.6043485403060913, -0.5787393450737, -0.5531301498413086, -0.527521014213562, -0.5019118189811707, -0.4763026237487793, -0.45069342851638794, -0.4250842332839966, -0.3994750380516052, -0.37386587262153625, -0.3482566773891449, -0.32264748215675354, -0.29703831672668457, -0.2714291214942932, -0.24581992626190186, -0.2202107310295105, -0.19460155069828033, -0.16899237036705017, -0.1433831751346588, -0.11777397990226746, -0.09216479957103729, -0.06655561923980713, -0.040946364402770996, -0.015337176620960236, 0.010272011160850525, 0.035881198942661285, 0.061490386724472046, 0.0870995819568634, 0.11270876228809357, 0.13831794261932373, 0.1639271378517151, 0.18953633308410645, 0.2151455134153366, 0.24075469374656677, 0.26636388897895813, 0.2919730842113495, 0.31758224964141846, 0.3431914448738098, 0.36880064010620117, 0.39440983533859253, 0.4200190305709839, 0.44562819600105286, 0.4712373912334442, 0.49684658646583557, 0.5224557518959045, 0.5480649471282959, 0.5736741423606873, 0.5992833375930786, 0.62489253282547, 0.6505017280578613, 0.6761108636856079, 0.701720118522644, 0.7273292541503906, 0.752938449382782, 0.7785476446151733]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 9.0, 6.0, 3.0, 5.0, 8.0, 13.0, 15.0, 20.0, 36.0, 71.0, 214.0, 1052.0, 15688.0, 978914.0, 50117.0, 1868.0, 284.0, 73.0, 42.0, 32.0, 19.0, 12.0, 9.0, 4.0, 7.0, 5.0, 3.0, 11.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.849609375, -3.719696044921875, -3.58978271484375, -3.459869384765625, -3.3299560546875, -3.200042724609375, -3.07012939453125, -2.940216064453125, -2.810302734375, -2.680389404296875, -2.55047607421875, -2.420562744140625, -2.2906494140625, -2.160736083984375, -2.03082275390625, -1.900909423828125, -1.77099609375, -1.641082763671875, -1.51116943359375, -1.381256103515625, -1.2513427734375, -1.121429443359375, -0.99151611328125, -0.861602783203125, -0.731689453125, -0.601776123046875, -0.47186279296875, -0.341949462890625, -0.2120361328125, -0.082122802734375, 0.04779052734375, 0.177703857421875, 0.3076171875, 0.437530517578125, 0.56744384765625, 0.697357177734375, 0.8272705078125, 0.957183837890625, 1.08709716796875, 1.217010498046875, 1.346923828125, 1.476837158203125, 1.60675048828125, 1.736663818359375, 1.8665771484375, 1.996490478515625, 2.12640380859375, 2.256317138671875, 2.38623046875, 2.516143798828125, 2.64605712890625, 2.775970458984375, 2.9058837890625, 3.035797119140625, 3.16571044921875, 3.295623779296875, 3.425537109375, 3.555450439453125, 3.68536376953125, 3.815277099609375, 3.9451904296875, 4.075103759765625, 4.20501708984375, 4.334930419921875, 4.46484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 10.0, 31.0, 32.0, 38.0, 53.0, 61.0, 77.0, 89.0, 108.0, 99.0, 94.0, 76.0, 60.0, 45.0, 46.0, 26.0, 13.0, 11.0, 5.0, 7.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03515625, -1.962249755859375, -1.88934326171875, -1.816436767578125, -1.7435302734375, -1.670623779296875, -1.59771728515625, -1.524810791015625, -1.451904296875, -1.378997802734375, -1.30609130859375, -1.233184814453125, -1.1602783203125, -1.087371826171875, -1.01446533203125, -0.941558837890625, -0.86865234375, -0.795745849609375, -0.72283935546875, -0.649932861328125, -0.5770263671875, -0.504119873046875, -0.43121337890625, -0.358306884765625, -0.285400390625, -0.212493896484375, -0.13958740234375, -0.066680908203125, 0.0062255859375, 0.079132080078125, 0.15203857421875, 0.224945068359375, 0.2978515625, 0.370758056640625, 0.44366455078125, 0.516571044921875, 0.5894775390625, 0.662384033203125, 0.73529052734375, 0.808197021484375, 0.881103515625, 0.954010009765625, 1.02691650390625, 1.099822998046875, 1.1727294921875, 1.245635986328125, 1.31854248046875, 1.391448974609375, 1.46435546875, 1.537261962890625, 1.61016845703125, 1.683074951171875, 1.7559814453125, 1.828887939453125, 1.90179443359375, 1.974700927734375, 2.047607421875, 2.120513916015625, 2.19342041015625, 2.266326904296875, 2.3392333984375, 2.412139892578125, 2.48504638671875, 2.557952880859375, 2.630859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 6.0, 7.0, 10.0, 21.0, 19.0, 23.0, 33.0, 57.0, 66.0, 76.0, 135.0, 280.0, 784.0, 4431.0, 81017.0, 924355.0, 33392.0, 2623.0, 549.0, 235.0, 123.0, 94.0, 68.0, 43.0, 30.0, 22.0, 15.0, 10.0, 10.0, 7.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.251953125, -2.177825927734375, -2.10369873046875, -2.029571533203125, -1.9554443359375, -1.881317138671875, -1.80718994140625, -1.733062744140625, -1.658935546875, -1.584808349609375, -1.51068115234375, -1.436553955078125, -1.3624267578125, -1.288299560546875, -1.21417236328125, -1.140045166015625, -1.06591796875, -0.991790771484375, -0.91766357421875, -0.843536376953125, -0.7694091796875, -0.695281982421875, -0.62115478515625, -0.547027587890625, -0.472900390625, -0.398773193359375, -0.32464599609375, -0.250518798828125, -0.1763916015625, -0.102264404296875, -0.02813720703125, 0.045989990234375, 0.1201171875, 0.194244384765625, 0.26837158203125, 0.342498779296875, 0.4166259765625, 0.490753173828125, 0.56488037109375, 0.639007568359375, 0.713134765625, 0.787261962890625, 0.86138916015625, 0.935516357421875, 1.0096435546875, 1.083770751953125, 1.15789794921875, 1.232025146484375, 1.30615234375, 1.380279541015625, 1.45440673828125, 1.528533935546875, 1.6026611328125, 1.676788330078125, 1.75091552734375, 1.825042724609375, 1.899169921875, 1.973297119140625, 2.04742431640625, 2.121551513671875, 2.1956787109375, 2.269805908203125, 2.34393310546875, 2.418060302734375, 2.4921875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 4.0, 6.0, 12.0, 15.0, 20.0, 21.0, 31.0, 34.0, 38.0, 34.0, 47.0, 55.0, 60.0, 60.0, 67.0, 60.0, 48.0, 49.0, 50.0, 45.0, 48.0, 47.0, 33.0, 31.0, 27.0, 12.0, 16.0, 8.0, 7.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.724609375, -1.6712493896484375, -1.617889404296875, -1.5645294189453125, -1.51116943359375, -1.4578094482421875, -1.404449462890625, -1.3510894775390625, -1.2977294921875, -1.2443695068359375, -1.191009521484375, -1.1376495361328125, -1.08428955078125, -1.0309295654296875, -0.977569580078125, -0.9242095947265625, -0.870849609375, -0.8174896240234375, -0.764129638671875, -0.7107696533203125, -0.65740966796875, -0.6040496826171875, -0.550689697265625, -0.4973297119140625, -0.4439697265625, -0.3906097412109375, -0.337249755859375, -0.2838897705078125, -0.23052978515625, -0.1771697998046875, -0.123809814453125, -0.0704498291015625, -0.01708984375, 0.0362701416015625, 0.089630126953125, 0.1429901123046875, 0.19635009765625, 0.2497100830078125, 0.303070068359375, 0.3564300537109375, 0.4097900390625, 0.4631500244140625, 0.516510009765625, 0.5698699951171875, 0.62322998046875, 0.6765899658203125, 0.729949951171875, 0.7833099365234375, 0.836669921875, 0.8900299072265625, 0.943389892578125, 0.9967498779296875, 1.05010986328125, 1.1034698486328125, 1.156829833984375, 1.2101898193359375, 1.2635498046875, 1.3169097900390625, 1.370269775390625, 1.4236297607421875, 1.47698974609375, 1.5303497314453125, 1.583709716796875, 1.6370697021484375, 1.6904296875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 10.0, 9.0, 4.0, 10.0, 13.0, 19.0, 24.0, 38.0, 42.0, 82.0, 125.0, 180.0, 305.0, 508.0, 833.0, 1397.0, 2625.0, 4983.0, 9919.0, 22937.0, 59180.0, 190853.0, 471934.0, 182960.0, 56778.0, 22286.0, 9693.0, 4766.0, 2478.0, 1382.0, 777.0, 494.0, 310.0, 170.0, 130.0, 90.0, 65.0, 50.0, 32.0, 24.0, 14.0, 6.0, 8.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22021484375, -0.2136383056640625, -0.207061767578125, -0.2004852294921875, -0.19390869140625, -0.1873321533203125, -0.180755615234375, -0.1741790771484375, -0.1676025390625, -0.1610260009765625, -0.154449462890625, -0.1478729248046875, -0.14129638671875, -0.1347198486328125, -0.128143310546875, -0.1215667724609375, -0.114990234375, -0.1084136962890625, -0.101837158203125, -0.0952606201171875, -0.08868408203125, -0.0821075439453125, -0.075531005859375, -0.0689544677734375, -0.0623779296875, -0.0558013916015625, -0.049224853515625, -0.0426483154296875, -0.03607177734375, -0.0294952392578125, -0.022918701171875, -0.0163421630859375, -0.009765625, -0.0031890869140625, 0.003387451171875, 0.0099639892578125, 0.01654052734375, 0.0231170654296875, 0.029693603515625, 0.0362701416015625, 0.0428466796875, 0.0494232177734375, 0.055999755859375, 0.0625762939453125, 0.06915283203125, 0.0757293701171875, 0.082305908203125, 0.0888824462890625, 0.095458984375, 0.1020355224609375, 0.108612060546875, 0.1151885986328125, 0.12176513671875, 0.1283416748046875, 0.134918212890625, 0.1414947509765625, 0.1480712890625, 0.1546478271484375, 0.161224365234375, 0.1678009033203125, 0.17437744140625, 0.1809539794921875, 0.187530517578125, 0.1941070556640625, 0.20068359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 9.0, 13.0, 8.0, 14.0, 15.0, 32.0, 34.0, 45.0, 78.0, 89.0, 103.0, 138.0, 105.0, 80.0, 52.0, 38.0, 36.0, 21.0, 23.0, 14.0, 9.0, 11.0, 6.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.762411117553711e-05, -4.599429666996002e-05, -4.4364482164382935e-05, -4.273466765880585e-05, -4.110485315322876e-05, -3.947503864765167e-05, -3.7845224142074585e-05, -3.62154096364975e-05, -3.458559513092041e-05, -3.295578062534332e-05, -3.1325966119766235e-05, -2.9696151614189148e-05, -2.806633710861206e-05, -2.6436522603034973e-05, -2.4806708097457886e-05, -2.31768935918808e-05, -2.154707908630371e-05, -1.9917264580726624e-05, -1.8287450075149536e-05, -1.665763556957245e-05, -1.5027821063995361e-05, -1.3398006558418274e-05, -1.1768192052841187e-05, -1.0138377547264099e-05, -8.508563041687012e-06, -6.878748536109924e-06, -5.248934030532837e-06, -3.6191195249557495e-06, -1.989305019378662e-06, -3.594905138015747e-07, 1.2703239917755127e-06, 2.9001384973526e-06, 4.5299530029296875e-06, 6.159767508506775e-06, 7.789582014083862e-06, 9.41939651966095e-06, 1.1049211025238037e-05, 1.2679025530815125e-05, 1.4308840036392212e-05, 1.59386545419693e-05, 1.7568469047546387e-05, 1.9198283553123474e-05, 2.082809805870056e-05, 2.245791256427765e-05, 2.4087727069854736e-05, 2.5717541575431824e-05, 2.734735608100891e-05, 2.8977170586586e-05, 3.0606985092163086e-05, 3.223679959774017e-05, 3.386661410331726e-05, 3.549642860889435e-05, 3.7126243114471436e-05, 3.875605762004852e-05, 4.038587212562561e-05, 4.20156866312027e-05, 4.3645501136779785e-05, 4.527531564235687e-05, 4.690513014793396e-05, 4.853494465351105e-05, 5.0164759159088135e-05, 5.179457366466522e-05, 5.342438817024231e-05, 5.50542026758194e-05, 5.6684017181396484e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 10.0, 7.0, 18.0, 28.0, 28.0, 56.0, 77.0, 120.0, 184.0, 263.0, 499.0, 834.0, 1563.0, 3031.0, 6067.0, 13620.0, 34154.0, 98778.0, 355348.0, 369235.0, 102248.0, 35050.0, 14157.0, 6189.0, 3088.0, 1620.0, 870.0, 502.0, 307.0, 206.0, 123.0, 73.0, 58.0, 32.0, 24.0, 15.0, 18.0, 9.0, 13.0, 5.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.2310791015625, -0.2238616943359375, -0.216644287109375, -0.2094268798828125, -0.20220947265625, -0.1949920654296875, -0.187774658203125, -0.1805572509765625, -0.17333984375, -0.1661224365234375, -0.158905029296875, -0.1516876220703125, -0.14447021484375, -0.1372528076171875, -0.130035400390625, -0.1228179931640625, -0.1156005859375, -0.1083831787109375, -0.101165771484375, -0.0939483642578125, -0.08673095703125, -0.0795135498046875, -0.072296142578125, -0.0650787353515625, -0.057861328125, -0.0506439208984375, -0.043426513671875, -0.0362091064453125, -0.02899169921875, -0.0217742919921875, -0.014556884765625, -0.0073394775390625, -0.0001220703125, 0.0070953369140625, 0.014312744140625, 0.0215301513671875, 0.02874755859375, 0.0359649658203125, 0.043182373046875, 0.0503997802734375, 0.0576171875, 0.0648345947265625, 0.072052001953125, 0.0792694091796875, 0.08648681640625, 0.0937042236328125, 0.100921630859375, 0.1081390380859375, 0.1153564453125, 0.1225738525390625, 0.129791259765625, 0.1370086669921875, 0.14422607421875, 0.1514434814453125, 0.158660888671875, 0.1658782958984375, 0.173095703125, 0.1803131103515625, 0.187530517578125, 0.1947479248046875, 0.20196533203125, 0.2091827392578125, 0.216400146484375, 0.2236175537109375, 0.2308349609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 2.0, 6.0, 9.0, 12.0, 16.0, 22.0, 19.0, 26.0, 25.0, 27.0, 27.0, 41.0, 50.0, 59.0, 76.0, 101.0, 74.0, 59.0, 59.0, 59.0, 44.0, 22.0, 22.0, 20.0, 23.0, 19.0, 9.0, 11.0, 10.0, 12.0, 10.0, 5.0, 5.0, 5.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1337890625, -0.12996292114257812, -0.12613677978515625, -0.12231063842773438, -0.1184844970703125, -0.11465835571289062, -0.11083221435546875, -0.10700607299804688, -0.103179931640625, -0.09935379028320312, -0.09552764892578125, -0.09170150756835938, -0.0878753662109375, -0.08404922485351562, -0.08022308349609375, -0.07639694213867188, -0.07257080078125, -0.06874465942382812, -0.06491851806640625, -0.061092376708984375, -0.0572662353515625, -0.053440093994140625, -0.04961395263671875, -0.045787811279296875, -0.041961669921875, -0.038135528564453125, -0.03430938720703125, -0.030483245849609375, -0.0266571044921875, -0.022830963134765625, -0.01900482177734375, -0.015178680419921875, -0.0113525390625, -0.007526397705078125, -0.00370025634765625, 0.000125885009765625, 0.0039520263671875, 0.007778167724609375, 0.01160430908203125, 0.015430450439453125, 0.019256591796875, 0.023082733154296875, 0.02690887451171875, 0.030735015869140625, 0.0345611572265625, 0.038387298583984375, 0.04221343994140625, 0.046039581298828125, 0.04986572265625, 0.053691864013671875, 0.05751800537109375, 0.061344146728515625, 0.0651702880859375, 0.06899642944335938, 0.07282257080078125, 0.07664871215820312, 0.080474853515625, 0.08430099487304688, 0.08812713623046875, 0.09195327758789062, 0.0957794189453125, 0.09960556030273438, 0.10343170166015625, 0.10725784301757812, 0.111083984375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 13.0, 33.0, 98.0, 234.0, 305.0, 181.0, 73.0, 34.0, 10.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.625051975250244, -3.4474427700042725, -3.269833564758301, -3.092224597930908, -2.9146153926849365, -2.737006187438965, -2.5593972206115723, -2.3817880153656006, -2.204178810119629, -2.0265696048736572, -1.848960518836975, -1.671351432800293, -1.4937422275543213, -1.3161330223083496, -1.1385239362716675, -0.9609148502349854, -0.7833056449890137, -0.6056964993476868, -0.42808735370635986, -0.25047820806503296, -0.07286906242370605, 0.10474008321762085, 0.28234922885894775, 0.4599583148956299, 0.6375675201416016, 0.8151766657829285, 0.9927858114242554, 1.1703948974609375, 1.3480041027069092, 1.5256133079528809, 1.703222393989563, 1.8808314800262451, 2.058440685272217, 2.2360498905181885, 2.41365909576416, 2.5912680625915527, 2.7688772678375244, 2.946486473083496, 3.1240954399108887, 3.3017046451568604, 3.479313850402832, 3.6569230556488037, 3.8345322608947754, 4.012141227722168, 4.189750671386719, 4.367359638214111, 4.544968605041504, 4.722578048706055, 4.900187015533447, 5.07779598236084, 5.255405426025391, 5.433014392852783, 5.610623359680176, 5.788232803344727, 5.965841770172119, 6.143450736999512, 6.3210601806640625, 6.498669147491455, 6.676278591156006, 6.853887557983398, 7.031497001647949, 7.209105968475342, 7.386714935302734, 7.564324378967285, 7.741933345794678]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 4.0, 12.0, 9.0, 17.0, 15.0, 27.0, 22.0, 30.0, 38.0, 49.0, 41.0, 48.0, 54.0, 46.0, 51.0, 58.0, 48.0, 51.0, 41.0, 43.0, 39.0, 31.0, 43.0, 37.0, 21.0, 31.0, 20.0, 9.0, 7.0, 10.0, 8.0, 14.0, 1.0, 4.0, 1.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.414971351623535, -2.3306961059570312, -2.2464206218719482, -2.1621453762054443, -2.0778698921203613, -1.9935946464538574, -1.9093194007873535, -1.82504403591156, -1.7407686710357666, -1.6564933061599731, -1.5722179412841797, -1.4879426956176758, -1.4036673307418823, -1.3193919658660889, -1.235116720199585, -1.1508413553237915, -1.066565990447998, -0.9822906255722046, -0.8980153203010559, -0.8137400150299072, -0.7294646501541138, -0.6451892852783203, -0.5609139800071716, -0.47663867473602295, -0.3923633098602295, -0.3080879747867584, -0.22381263971328735, -0.13953730463981628, -0.055261969566345215, 0.029013365507125854, 0.11328870058059692, 0.1975640058517456, 0.28183913230895996, 0.36611446738243103, 0.4503898024559021, 0.5346651077270508, 0.6189404726028442, 0.7032158374786377, 0.7874911427497864, 0.8717664480209351, 0.9560418128967285, 1.040317177772522, 1.1245925426483154, 1.2088677883148193, 1.2931431531906128, 1.3774185180664062, 1.4616937637329102, 1.5459691286087036, 1.630244493484497, 1.7145198583602905, 1.798795223236084, 1.883070468902588, 1.9673458337783813, 2.051621198654175, 2.1358964443206787, 2.2201719284057617, 2.3044471740722656, 2.3887224197387695, 2.4729979038238525, 2.5572731494903564, 2.6415486335754395, 2.7258238792419434, 2.8100991249084473, 2.894374370574951, 2.978649854660034]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 7.0, 4.0, 7.0, 8.0, 13.0, 19.0, 38.0, 57.0, 92.0, 177.0, 380.0, 843.0, 2249.0, 7975.0, 56966.0, 2339029.0, 1730722.0, 44920.0, 7086.0, 2114.0, 764.0, 362.0, 190.0, 105.0, 49.0, 22.0, 31.0, 10.0, 10.0, 16.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.072265625, -2.005340576171875, -1.93841552734375, -1.871490478515625, -1.8045654296875, -1.737640380859375, -1.67071533203125, -1.603790283203125, -1.536865234375, -1.469940185546875, -1.40301513671875, -1.336090087890625, -1.2691650390625, -1.202239990234375, -1.13531494140625, -1.068389892578125, -1.00146484375, -0.934539794921875, -0.86761474609375, -0.800689697265625, -0.7337646484375, -0.666839599609375, -0.59991455078125, -0.532989501953125, -0.466064453125, -0.399139404296875, -0.33221435546875, -0.265289306640625, -0.1983642578125, -0.131439208984375, -0.06451416015625, 0.002410888671875, 0.0693359375, 0.136260986328125, 0.20318603515625, 0.270111083984375, 0.3370361328125, 0.403961181640625, 0.47088623046875, 0.537811279296875, 0.604736328125, 0.671661376953125, 0.73858642578125, 0.805511474609375, 0.8724365234375, 0.939361572265625, 1.00628662109375, 1.073211669921875, 1.14013671875, 1.207061767578125, 1.27398681640625, 1.340911865234375, 1.4078369140625, 1.474761962890625, 1.54168701171875, 1.608612060546875, 1.675537109375, 1.742462158203125, 1.80938720703125, 1.876312255859375, 1.9432373046875, 2.010162353515625, 2.07708740234375, 2.144012451171875, 2.2109375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 2.0, 2.0, 6.0, 11.0, 8.0, 11.0, 11.0, 27.0, 18.0, 17.0, 38.0, 37.0, 45.0, 53.0, 65.0, 48.0, 60.0, 77.0, 76.0, 68.0, 43.0, 48.0, 48.0, 29.0, 31.0, 21.0, 30.0, 16.0, 11.0, 11.0, 6.0, 7.0, 9.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.94091796875, -0.9110565185546875, -0.881195068359375, -0.8513336181640625, -0.82147216796875, -0.7916107177734375, -0.761749267578125, -0.7318878173828125, -0.7020263671875, -0.6721649169921875, -0.642303466796875, -0.6124420166015625, -0.58258056640625, -0.5527191162109375, -0.522857666015625, -0.4929962158203125, -0.463134765625, -0.4332733154296875, -0.403411865234375, -0.3735504150390625, -0.34368896484375, -0.3138275146484375, -0.283966064453125, -0.2541046142578125, -0.2242431640625, -0.1943817138671875, -0.164520263671875, -0.1346588134765625, -0.10479736328125, -0.0749359130859375, -0.045074462890625, -0.0152130126953125, 0.0146484375, 0.0445098876953125, 0.074371337890625, 0.1042327880859375, 0.13409423828125, 0.1639556884765625, 0.193817138671875, 0.2236785888671875, 0.2535400390625, 0.2834014892578125, 0.313262939453125, 0.3431243896484375, 0.37298583984375, 0.4028472900390625, 0.432708740234375, 0.4625701904296875, 0.492431640625, 0.5222930908203125, 0.552154541015625, 0.5820159912109375, 0.61187744140625, 0.6417388916015625, 0.671600341796875, 0.7014617919921875, 0.7313232421875, 0.7611846923828125, 0.791046142578125, 0.8209075927734375, 0.85076904296875, 0.8806304931640625, 0.910491943359375, 0.9403533935546875, 0.97021484375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 7.0, 11.0, 4.0, 9.0, 14.0, 17.0, 25.0, 28.0, 84.0, 95.0, 188.0, 456.0, 1397.0, 6729.0, 69586.0, 3824092.0, 273936.0, 13857.0, 2444.0, 690.0, 239.0, 130.0, 67.0, 55.0, 34.0, 18.0, 17.0, 14.0, 12.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.232421875, -2.15966796875, -2.0869140625, -2.01416015625, -1.94140625, -1.86865234375, -1.7958984375, -1.72314453125, -1.650390625, -1.57763671875, -1.5048828125, -1.43212890625, -1.359375, -1.28662109375, -1.2138671875, -1.14111328125, -1.068359375, -0.99560546875, -0.9228515625, -0.85009765625, -0.77734375, -0.70458984375, -0.6318359375, -0.55908203125, -0.486328125, -0.41357421875, -0.3408203125, -0.26806640625, -0.1953125, -0.12255859375, -0.0498046875, 0.02294921875, 0.095703125, 0.16845703125, 0.2412109375, 0.31396484375, 0.38671875, 0.45947265625, 0.5322265625, 0.60498046875, 0.677734375, 0.75048828125, 0.8232421875, 0.89599609375, 0.96875, 1.04150390625, 1.1142578125, 1.18701171875, 1.259765625, 1.33251953125, 1.4052734375, 1.47802734375, 1.55078125, 1.62353515625, 1.6962890625, 1.76904296875, 1.841796875, 1.91455078125, 1.9873046875, 2.06005859375, 2.1328125, 2.20556640625, 2.2783203125, 2.35107421875, 2.423828125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 5.0, 6.0, 10.0, 15.0, 19.0, 11.0, 28.0, 35.0, 43.0, 60.0, 94.0, 134.0, 176.0, 330.0, 496.0, 750.0, 630.0, 435.0, 254.0, 158.0, 89.0, 64.0, 62.0, 21.0, 30.0, 28.0, 23.0, 10.0, 11.0, 5.0, 11.0, 4.0, 3.0, 5.0, 1.0, 0.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.31787109375, -0.3084449768066406, -0.29901885986328125, -0.2895927429199219, -0.2801666259765625, -0.2707405090332031, -0.26131439208984375, -0.2518882751464844, -0.242462158203125, -0.23303604125976562, -0.22360992431640625, -0.21418380737304688, -0.2047576904296875, -0.19533157348632812, -0.18590545654296875, -0.17647933959960938, -0.16705322265625, -0.15762710571289062, -0.14820098876953125, -0.13877487182617188, -0.1293487548828125, -0.11992263793945312, -0.11049652099609375, -0.10107040405273438, -0.091644287109375, -0.08221817016601562, -0.07279205322265625, -0.06336593627929688, -0.0539398193359375, -0.044513702392578125, -0.03508758544921875, -0.025661468505859375, -0.0162353515625, -0.006809234619140625, 0.00261688232421875, 0.012042999267578125, 0.0214691162109375, 0.030895233154296875, 0.04032135009765625, 0.049747467041015625, 0.059173583984375, 0.06859970092773438, 0.07802581787109375, 0.08745193481445312, 0.0968780517578125, 0.10630416870117188, 0.11573028564453125, 0.12515640258789062, 0.13458251953125, 0.14400863647460938, 0.15343475341796875, 0.16286087036132812, 0.1722869873046875, 0.18171310424804688, 0.19113922119140625, 0.20056533813476562, 0.209991455078125, 0.21941757202148438, 0.22884368896484375, 0.23826980590820312, 0.2476959228515625, 0.2571220397949219, 0.26654815673828125, 0.2759742736816406, 0.285400390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 6.0, 12.0, 12.0, 9.0, 37.0, 52.0, 81.0, 105.0, 124.0, 123.0, 145.0, 106.0, 63.0, 38.0, 25.0, 15.0, 10.0, 13.0, 5.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6911894083023071, -1.6294071674346924, -1.5676249265670776, -1.505842685699463, -1.4440603256225586, -1.3822782039642334, -1.320495843887329, -1.2587136030197144, -1.1969313621520996, -1.1351491212844849, -1.0733668804168701, -1.0115846395492554, -0.9498023390769958, -0.8880200982093811, -0.8262377977371216, -0.7644555568695068, -0.7026733160018921, -0.6408910751342773, -0.5791088342666626, -0.5173265337944031, -0.45554429292678833, -0.3937620520591736, -0.33197978138923645, -0.2701975107192993, -0.20841526985168457, -0.14663301408290863, -0.08485075831413269, -0.02306850254535675, 0.03871375322341919, 0.10049599409103394, 0.16227826476097107, 0.2240605354309082, 0.2858428955078125, 0.34762513637542725, 0.4094074070453644, 0.4711896777153015, 0.5329719185829163, 0.594754159450531, 0.6565364599227905, 0.7183187007904053, 0.78010094165802, 0.8418831825256348, 0.9036654233932495, 0.965447723865509, 1.0272300243377686, 1.0890121459960938, 1.150794506072998, 1.2125767469406128, 1.2743589878082275, 1.3361412286758423, 1.397923469543457, 1.4597057104110718, 1.5214879512786865, 1.5832703113555908, 1.6450525522232056, 1.7068347930908203, 1.768617033958435, 1.8303992748260498, 1.8921815156936646, 1.9539637565612793, 2.0157461166381836, 2.077528238296509, 2.139310598373413, 2.2010927200317383, 2.2628750801086426]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 5.0, 4.0, 5.0, 4.0, 11.0, 12.0, 15.0, 10.0, 34.0, 29.0, 22.0, 40.0, 48.0, 61.0, 62.0, 71.0, 68.0, 63.0, 65.0, 49.0, 61.0, 46.0, 49.0, 41.0, 31.0, 24.0, 18.0, 15.0, 16.0, 5.0, 4.0, 4.0, 4.0, 8.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1286977529525757, -1.0920480489730835, -1.0553984642028809, -1.0187487602233887, -0.9820990562438965, -0.9454493522644043, -0.9087997078895569, -0.8721500635147095, -0.8355003595352173, -0.7988506555557251, -0.7622010111808777, -0.7255513668060303, -0.6889016628265381, -0.6522519588470459, -0.6156023144721985, -0.5789526700973511, -0.5423029661178589, -0.5056532621383667, -0.4690036177635193, -0.4323539435863495, -0.3957042694091797, -0.3590545952320099, -0.3224049210548401, -0.2857552468776703, -0.2491055727005005, -0.2124558985233307, -0.1758062243461609, -0.1391565501689911, -0.10250687599182129, -0.06585720181465149, -0.02920752763748169, 0.00744214653968811, 0.04409193992614746, 0.08074161410331726, 0.11739128828048706, 0.15404096245765686, 0.19069063663482666, 0.22734031081199646, 0.26398998498916626, 0.30063965916633606, 0.33728933334350586, 0.37393900752067566, 0.41058868169784546, 0.44723835587501526, 0.48388803005218506, 0.5205377340316772, 0.5571873784065247, 0.5938370227813721, 0.6304867267608643, 0.6671364307403564, 0.7037860751152039, 0.7404357194900513, 0.7770854234695435, 0.8137351274490356, 0.8503847718238831, 0.8870344161987305, 0.9236841201782227, 0.9603338241577148, 0.9969834685325623, 1.0336331129074097, 1.0702828168869019, 1.106932520866394, 1.1435821056365967, 1.1802318096160889, 1.216881513595581]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 13.0, 6.0, 10.0, 17.0, 29.0, 28.0, 51.0, 56.0, 69.0, 111.0, 167.0, 257.0, 356.0, 581.0, 990.0, 1766.0, 3257.0, 6613.0, 16040.0, 56002.0, 364875.0, 487654.0, 74155.0, 19234.0, 7690.0, 3615.0, 1938.0, 1081.0, 629.0, 404.0, 267.0, 170.0, 110.0, 80.0, 66.0, 48.0, 25.0, 30.0, 13.0, 16.0, 10.0, 8.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.287109375, -0.2786865234375, -0.270263671875, -0.2618408203125, -0.25341796875, -0.2449951171875, -0.236572265625, -0.2281494140625, -0.2197265625, -0.2113037109375, -0.202880859375, -0.1944580078125, -0.18603515625, -0.1776123046875, -0.169189453125, -0.1607666015625, -0.15234375, -0.1439208984375, -0.135498046875, -0.1270751953125, -0.11865234375, -0.1102294921875, -0.101806640625, -0.0933837890625, -0.0849609375, -0.0765380859375, -0.068115234375, -0.0596923828125, -0.05126953125, -0.0428466796875, -0.034423828125, -0.0260009765625, -0.017578125, -0.0091552734375, -0.000732421875, 0.0076904296875, 0.01611328125, 0.0245361328125, 0.032958984375, 0.0413818359375, 0.0498046875, 0.0582275390625, 0.066650390625, 0.0750732421875, 0.08349609375, 0.0919189453125, 0.100341796875, 0.1087646484375, 0.1171875, 0.1256103515625, 0.134033203125, 0.1424560546875, 0.15087890625, 0.1593017578125, 0.167724609375, 0.1761474609375, 0.1845703125, 0.1929931640625, 0.201416015625, 0.2098388671875, 0.21826171875, 0.2266845703125, 0.235107421875, 0.2435302734375, 0.251953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 7.0, 11.0, 10.0, 11.0, 15.0, 17.0, 22.0, 39.0, 34.0, 43.0, 63.0, 76.0, 81.0, 80.0, 77.0, 43.0, 56.0, 63.0, 54.0, 43.0, 34.0, 28.0, 16.0, 21.0, 17.0, 5.0, 7.0, 3.0, 3.0, 7.0, 3.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.794921875, -0.7684326171875, -0.741943359375, -0.7154541015625, -0.68896484375, -0.6624755859375, -0.635986328125, -0.6094970703125, -0.5830078125, -0.5565185546875, -0.530029296875, -0.5035400390625, -0.47705078125, -0.4505615234375, -0.424072265625, -0.3975830078125, -0.37109375, -0.3446044921875, -0.318115234375, -0.2916259765625, -0.26513671875, -0.2386474609375, -0.212158203125, -0.1856689453125, -0.1591796875, -0.1326904296875, -0.106201171875, -0.0797119140625, -0.05322265625, -0.0267333984375, -0.000244140625, 0.0262451171875, 0.052734375, 0.0792236328125, 0.105712890625, 0.1322021484375, 0.15869140625, 0.1851806640625, 0.211669921875, 0.2381591796875, 0.2646484375, 0.2911376953125, 0.317626953125, 0.3441162109375, 0.37060546875, 0.3970947265625, 0.423583984375, 0.4500732421875, 0.4765625, 0.5030517578125, 0.529541015625, 0.5560302734375, 0.58251953125, 0.6090087890625, 0.635498046875, 0.6619873046875, 0.6884765625, 0.7149658203125, 0.741455078125, 0.7679443359375, 0.79443359375, 0.8209228515625, 0.847412109375, 0.8739013671875, 0.900390625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 7.0, 2.0, 4.0, 9.0, 11.0, 10.0, 15.0, 28.0, 24.0, 29.0, 43.0, 85.0, 125.0, 246.0, 516.0, 1190.0, 2814.0, 8204.0, 37926.0, 404072.0, 528294.0, 49234.0, 9726.0, 3283.0, 1367.0, 583.0, 281.0, 141.0, 91.0, 55.0, 40.0, 36.0, 13.0, 10.0, 9.0, 6.0, 6.0, 4.0, 5.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.326171875, -0.31687164306640625, -0.3075714111328125, -0.29827117919921875, -0.288970947265625, -0.27967071533203125, -0.2703704833984375, -0.26107025146484375, -0.25177001953125, -0.24246978759765625, -0.2331695556640625, -0.22386932373046875, -0.214569091796875, -0.20526885986328125, -0.1959686279296875, -0.18666839599609375, -0.1773681640625, -0.16806793212890625, -0.1587677001953125, -0.14946746826171875, -0.140167236328125, -0.13086700439453125, -0.1215667724609375, -0.11226654052734375, -0.10296630859375, -0.09366607666015625, -0.0843658447265625, -0.07506561279296875, -0.065765380859375, -0.05646514892578125, -0.0471649169921875, -0.03786468505859375, -0.028564453125, -0.01926422119140625, -0.0099639892578125, -0.00066375732421875, 0.008636474609375, 0.01793670654296875, 0.0272369384765625, 0.03653717041015625, 0.04583740234375, 0.05513763427734375, 0.0644378662109375, 0.07373809814453125, 0.083038330078125, 0.09233856201171875, 0.1016387939453125, 0.11093902587890625, 0.1202392578125, 0.12953948974609375, 0.1388397216796875, 0.14813995361328125, 0.157440185546875, 0.16674041748046875, 0.1760406494140625, 0.18534088134765625, 0.19464111328125, 0.20394134521484375, 0.2132415771484375, 0.22254180908203125, 0.231842041015625, 0.24114227294921875, 0.2504425048828125, 0.25974273681640625, 0.26904296875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 3.0, 9.0, 5.0, 11.0, 12.0, 8.0, 15.0, 24.0, 16.0, 25.0, 27.0, 26.0, 35.0, 38.0, 58.0, 56.0, 56.0, 57.0, 60.0, 52.0, 49.0, 40.0, 47.0, 27.0, 38.0, 32.0, 30.0, 26.0, 20.0, 15.0, 15.0, 10.0, 10.0, 9.0, 10.0, 4.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2958984375, -1.25579833984375, -1.2156982421875, -1.17559814453125, -1.135498046875, -1.09539794921875, -1.0552978515625, -1.01519775390625, -0.97509765625, -0.93499755859375, -0.8948974609375, -0.85479736328125, -0.814697265625, -0.77459716796875, -0.7344970703125, -0.69439697265625, -0.654296875, -0.61419677734375, -0.5740966796875, -0.53399658203125, -0.493896484375, -0.45379638671875, -0.4136962890625, -0.37359619140625, -0.33349609375, -0.29339599609375, -0.2532958984375, -0.21319580078125, -0.173095703125, -0.13299560546875, -0.0928955078125, -0.05279541015625, -0.0126953125, 0.02740478515625, 0.0675048828125, 0.10760498046875, 0.147705078125, 0.18780517578125, 0.2279052734375, 0.26800537109375, 0.30810546875, 0.34820556640625, 0.3883056640625, 0.42840576171875, 0.468505859375, 0.50860595703125, 0.5487060546875, 0.58880615234375, 0.62890625, 0.66900634765625, 0.7091064453125, 0.74920654296875, 0.789306640625, 0.82940673828125, 0.8695068359375, 0.90960693359375, 0.94970703125, 0.98980712890625, 1.0299072265625, 1.07000732421875, 1.110107421875, 1.15020751953125, 1.1903076171875, 1.23040771484375, 1.2705078125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 18.0, 23.0, 33.0, 35.0, 66.0, 94.0, 161.0, 216.0, 370.0, 627.0, 1071.0, 1947.0, 3942.0, 9352.0, 30814.0, 160008.0, 643552.0, 149434.0, 29332.0, 9118.0, 3893.0, 1768.0, 1002.0, 623.0, 353.0, 203.0, 152.0, 102.0, 62.0, 43.0, 37.0, 18.0, 22.0, 19.0, 7.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.094970703125, -0.09221649169921875, -0.0894622802734375, -0.08670806884765625, -0.083953857421875, -0.08119964599609375, -0.0784454345703125, -0.07569122314453125, -0.07293701171875, -0.07018280029296875, -0.0674285888671875, -0.06467437744140625, -0.061920166015625, -0.05916595458984375, -0.0564117431640625, -0.05365753173828125, -0.0509033203125, -0.04814910888671875, -0.0453948974609375, -0.04264068603515625, -0.039886474609375, -0.03713226318359375, -0.0343780517578125, -0.03162384033203125, -0.02886962890625, -0.02611541748046875, -0.0233612060546875, -0.02060699462890625, -0.017852783203125, -0.01509857177734375, -0.0123443603515625, -0.00959014892578125, -0.0068359375, -0.00408172607421875, -0.0013275146484375, 0.00142669677734375, 0.004180908203125, 0.00693511962890625, 0.0096893310546875, 0.01244354248046875, 0.01519775390625, 0.01795196533203125, 0.0207061767578125, 0.02346038818359375, 0.026214599609375, 0.02896881103515625, 0.0317230224609375, 0.03447723388671875, 0.0372314453125, 0.03998565673828125, 0.0427398681640625, 0.04549407958984375, 0.048248291015625, 0.05100250244140625, 0.0537567138671875, 0.05651092529296875, 0.05926513671875, 0.06201934814453125, 0.0647735595703125, 0.06752777099609375, 0.070281982421875, 0.07303619384765625, 0.0757904052734375, 0.07854461669921875, 0.081298828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0, 8.0, 2.0, 6.0, 7.0, 10.0, 16.0, 24.0, 21.0, 32.0, 36.0, 66.0, 76.0, 109.0, 122.0, 114.0, 79.0, 71.0, 43.0, 29.0, 32.0, 20.0, 14.0, 18.0, 13.0, 4.0, 7.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.0067901611328125e-05, -4.835333675146103e-05, -4.663877189159393e-05, -4.492420703172684e-05, -4.320964217185974e-05, -4.1495077311992645e-05, -3.978051245212555e-05, -3.806594759225845e-05, -3.635138273239136e-05, -3.463681787252426e-05, -3.2922253012657166e-05, -3.120768815279007e-05, -2.9493123292922974e-05, -2.7778558433055878e-05, -2.6063993573188782e-05, -2.4349428713321686e-05, -2.263486385345459e-05, -2.0920298993587494e-05, -1.9205734133720398e-05, -1.7491169273853302e-05, -1.5776604413986206e-05, -1.406203955411911e-05, -1.2347474694252014e-05, -1.0632909834384918e-05, -8.918344974517822e-06, -7.203780114650726e-06, -5.48921525478363e-06, -3.7746503949165344e-06, -2.0600855350494385e-06, -3.4552067518234253e-07, 1.3690441846847534e-06, 3.0836090445518494e-06, 4.798173904418945e-06, 6.512738764286041e-06, 8.227303624153137e-06, 9.941868484020233e-06, 1.1656433343887329e-05, 1.3370998203754425e-05, 1.5085563063621521e-05, 1.6800127923488617e-05, 1.8514692783355713e-05, 2.022925764322281e-05, 2.1943822503089905e-05, 2.3658387362957e-05, 2.5372952222824097e-05, 2.7087517082691193e-05, 2.880208194255829e-05, 3.0516646802425385e-05, 3.223121166229248e-05, 3.3945776522159576e-05, 3.566034138202667e-05, 3.737490624189377e-05, 3.9089471101760864e-05, 4.080403596162796e-05, 4.2518600821495056e-05, 4.423316568136215e-05, 4.594773054122925e-05, 4.7662295401096344e-05, 4.937686026096344e-05, 5.1091425120830536e-05, 5.280598998069763e-05, 5.452055484056473e-05, 5.6235119700431824e-05, 5.794968456029892e-05, 5.9664249420166016e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 9.0, 5.0, 8.0, 14.0, 25.0, 46.0, 48.0, 81.0, 99.0, 163.0, 278.0, 419.0, 703.0, 1310.0, 2426.0, 4910.0, 11585.0, 35045.0, 148610.0, 569166.0, 203196.0, 44467.0, 13972.0, 5669.0, 2766.0, 1485.0, 856.0, 439.0, 262.0, 180.0, 108.0, 60.0, 48.0, 27.0, 19.0, 17.0, 7.0, 11.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07794189453125, -0.07547473907470703, -0.07300758361816406, -0.0705404281616211, -0.06807327270507812, -0.06560611724853516, -0.06313896179199219, -0.06067180633544922, -0.05820465087890625, -0.05573749542236328, -0.05327033996582031, -0.050803184509277344, -0.048336029052734375, -0.045868873596191406, -0.04340171813964844, -0.04093456268310547, -0.0384674072265625, -0.03600025177001953, -0.03353309631347656, -0.031065940856933594, -0.028598785400390625, -0.026131629943847656, -0.023664474487304688, -0.02119731903076172, -0.01873016357421875, -0.01626300811767578, -0.013795852661132812, -0.011328697204589844, -0.008861541748046875, -0.006394386291503906, -0.0039272308349609375, -0.0014600753784179688, 0.001007080078125, 0.0034742355346679688, 0.0059413909912109375, 0.008408546447753906, 0.010875701904296875, 0.013342857360839844, 0.015810012817382812, 0.01827716827392578, 0.02074432373046875, 0.02321147918701172, 0.025678634643554688, 0.028145790100097656, 0.030612945556640625, 0.033080101013183594, 0.03554725646972656, 0.03801441192626953, 0.0404815673828125, 0.04294872283935547, 0.04541587829589844, 0.047883033752441406, 0.050350189208984375, 0.052817344665527344, 0.05528450012207031, 0.05775165557861328, 0.06021881103515625, 0.06268596649169922, 0.06515312194824219, 0.06762027740478516, 0.07008743286132812, 0.0725545883178711, 0.07502174377441406, 0.07748889923095703, 0.0799560546875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 4.0, 4.0, 10.0, 12.0, 10.0, 13.0, 18.0, 25.0, 27.0, 42.0, 58.0, 77.0, 80.0, 103.0, 97.0, 85.0, 77.0, 59.0, 39.0, 33.0, 29.0, 16.0, 15.0, 11.0, 14.0, 9.0, 7.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0165252685546875, -0.01597762107849121, -0.015429973602294922, -0.014882326126098633, -0.014334678649902344, -0.013787031173706055, -0.013239383697509766, -0.012691736221313477, -0.012144088745117188, -0.011596441268920898, -0.01104879379272461, -0.01050114631652832, -0.009953498840332031, -0.009405851364135742, -0.008858203887939453, -0.008310556411743164, -0.007762908935546875, -0.007215261459350586, -0.006667613983154297, -0.006119966506958008, -0.005572319030761719, -0.00502467155456543, -0.004477024078369141, -0.0039293766021728516, -0.0033817291259765625, -0.0028340816497802734, -0.0022864341735839844, -0.0017387866973876953, -0.0011911392211914062, -0.0006434917449951172, -9.584426879882812e-05, 0.00045180320739746094, 0.00099945068359375, 0.001547098159790039, 0.002094745635986328, 0.002642393112182617, 0.0031900405883789062, 0.0037376880645751953, 0.004285335540771484, 0.0048329830169677734, 0.0053806304931640625, 0.0059282779693603516, 0.006475925445556641, 0.00702357292175293, 0.007571220397949219, 0.008118867874145508, 0.008666515350341797, 0.009214162826538086, 0.009761810302734375, 0.010309457778930664, 0.010857105255126953, 0.011404752731323242, 0.011952400207519531, 0.01250004768371582, 0.01304769515991211, 0.013595342636108398, 0.014142990112304688, 0.014690637588500977, 0.015238285064697266, 0.015785932540893555, 0.016333580017089844, 0.016881227493286133, 0.017428874969482422, 0.01797652244567871, 0.018524169921875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 7.0, 13.0, 15.0, 21.0, 66.0, 79.0, 156.0, 187.0, 196.0, 118.0, 56.0, 35.0, 19.0, 13.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.419613003730774, -1.3642818927764893, -1.3089509010314941, -1.2536197900772095, -1.1982886791229248, -1.1429576873779297, -1.087626576423645, -1.0322954654693604, -0.9769644141197205, -0.9216333627700806, -0.8663022518157959, -0.810971200466156, -0.7556401491165161, -0.7003090381622314, -0.6449779868125916, -0.5896469354629517, -0.534315824508667, -0.4789847433567047, -0.42365366220474243, -0.36832261085510254, -0.31299152970314026, -0.257660448551178, -0.20232939720153809, -0.1469983160495758, -0.09166723489761353, -0.03633616119623184, 0.01899491250514984, 0.07432597875595093, 0.1296570599079132, 0.1849881410598755, 0.24031919240951538, 0.29565027356147766, 0.3509814739227295, 0.4063125550746918, 0.46164363622665405, 0.516974687576294, 0.5723057985305786, 0.6276368498802185, 0.6829679012298584, 0.7382990121841431, 0.793630063533783, 0.8489611148834229, 0.9042922258377075, 0.9596232771873474, 1.0149543285369873, 1.070285439491272, 1.1256165504455566, 1.1809475421905518, 1.2362786531448364, 1.291609764099121, 1.3469407558441162, 1.4022718667984009, 1.4576029777526855, 1.5129339694976807, 1.5682650804519653, 1.62359619140625, 1.6789271831512451, 1.7342582941055298, 1.789589285850525, 1.8449203968048096, 1.9002515077590942, 1.955582618713379, 2.010913610458374, 2.066244602203369, 2.1215758323669434]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 1.0, 11.0, 14.0, 9.0, 16.0, 21.0, 32.0, 25.0, 40.0, 51.0, 44.0, 74.0, 74.0, 76.0, 69.0, 65.0, 62.0, 58.0, 50.0, 45.0, 36.0, 28.0, 22.0, 19.0, 17.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7303915023803711, -0.7054252624511719, -0.6804590225219727, -0.6554927825927734, -0.6305265426635742, -0.605560302734375, -0.5805940628051758, -0.5556278228759766, -0.5306615829467773, -0.5056953430175781, -0.4807291030883789, -0.4557628631591797, -0.43079662322998047, -0.40583038330078125, -0.38086414337158203, -0.3558979034423828, -0.3309316635131836, -0.3059654235839844, -0.28099918365478516, -0.25603294372558594, -0.23106670379638672, -0.2061004638671875, -0.18113422393798828, -0.15616798400878906, -0.13120174407958984, -0.10623550415039062, -0.0812692642211914, -0.05630302429199219, -0.03133678436279297, -0.00637054443359375, 0.01859569549560547, 0.04356193542480469, 0.0685281753540039, 0.09349441528320312, 0.11846065521240234, 0.14342689514160156, 0.16839313507080078, 0.193359375, 0.21832561492919922, 0.24329185485839844, 0.26825809478759766, 0.2932243347167969, 0.3181905746459961, 0.3431568145751953, 0.36812305450439453, 0.39308929443359375, 0.41805553436279297, 0.4430217742919922, 0.4679880142211914, 0.4929542541503906, 0.5179204940795898, 0.5428867340087891, 0.5678529739379883, 0.5928192138671875, 0.6177854537963867, 0.6427516937255859, 0.6677179336547852, 0.6926841735839844, 0.7176504135131836, 0.7426166534423828, 0.767582893371582, 0.7925491333007812, 0.8175153732299805, 0.8424816131591797, 0.8674478530883789]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 0.0, 3.0, 2.0, 6.0, 6.0, 5.0, 10.0, 10.0, 20.0, 44.0, 134.0, 664.0, 5771.0, 378684.0, 654830.0, 7300.0, 766.0, 157.0, 59.0, 25.0, 13.0, 9.0, 7.0, 5.0, 2.0, 5.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.29296875, -3.17120361328125, -3.0494384765625, -2.92767333984375, -2.805908203125, -2.68414306640625, -2.5623779296875, -2.44061279296875, -2.31884765625, -2.19708251953125, -2.0753173828125, -1.95355224609375, -1.831787109375, -1.71002197265625, -1.5882568359375, -1.46649169921875, -1.3447265625, -1.22296142578125, -1.1011962890625, -0.97943115234375, -0.857666015625, -0.73590087890625, -0.6141357421875, -0.49237060546875, -0.37060546875, -0.24884033203125, -0.1270751953125, -0.00531005859375, 0.116455078125, 0.23822021484375, 0.3599853515625, 0.48175048828125, 0.603515625, 0.72528076171875, 0.8470458984375, 0.96881103515625, 1.090576171875, 1.21234130859375, 1.3341064453125, 1.45587158203125, 1.57763671875, 1.69940185546875, 1.8211669921875, 1.94293212890625, 2.064697265625, 2.18646240234375, 2.3082275390625, 2.42999267578125, 2.5517578125, 2.67352294921875, 2.7952880859375, 2.91705322265625, 3.038818359375, 3.16058349609375, 3.2823486328125, 3.40411376953125, 3.52587890625, 3.64764404296875, 3.7694091796875, 3.89117431640625, 4.012939453125, 4.13470458984375, 4.2564697265625, 4.37823486328125, 4.5]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 1.0, 7.0, 5.0, 11.0, 21.0, 17.0, 21.0, 19.0, 33.0, 38.0, 51.0, 75.0, 78.0, 79.0, 79.0, 77.0, 61.0, 56.0, 59.0, 51.0, 39.0, 29.0, 25.0, 10.0, 11.0, 15.0, 7.0, 7.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6416015625, -1.5864410400390625, -1.531280517578125, -1.4761199951171875, -1.42095947265625, -1.3657989501953125, -1.310638427734375, -1.2554779052734375, -1.2003173828125, -1.1451568603515625, -1.089996337890625, -1.0348358154296875, -0.97967529296875, -0.9245147705078125, -0.869354248046875, -0.8141937255859375, -0.759033203125, -0.7038726806640625, -0.648712158203125, -0.5935516357421875, -0.53839111328125, -0.4832305908203125, -0.428070068359375, -0.3729095458984375, -0.3177490234375, -0.2625885009765625, -0.207427978515625, -0.1522674560546875, -0.09710693359375, -0.0419464111328125, 0.013214111328125, 0.0683746337890625, 0.12353515625, 0.1786956787109375, 0.233856201171875, 0.2890167236328125, 0.34417724609375, 0.3993377685546875, 0.454498291015625, 0.5096588134765625, 0.5648193359375, 0.6199798583984375, 0.675140380859375, 0.7303009033203125, 0.78546142578125, 0.8406219482421875, 0.895782470703125, 0.9509429931640625, 1.006103515625, 1.0612640380859375, 1.116424560546875, 1.1715850830078125, 1.22674560546875, 1.2819061279296875, 1.337066650390625, 1.3922271728515625, 1.4473876953125, 1.5025482177734375, 1.557708740234375, 1.6128692626953125, 1.66802978515625, 1.7231903076171875, 1.778350830078125, 1.8335113525390625, 1.888671875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 3.0, 7.0, 13.0, 15.0, 27.0, 28.0, 62.0, 76.0, 89.0, 172.0, 309.0, 547.0, 1022.0, 2267.0, 5458.0, 15946.0, 63600.0, 444023.0, 428564.0, 60811.0, 15556.0, 5307.0, 2208.0, 1060.0, 566.0, 306.0, 172.0, 124.0, 64.0, 37.0, 32.0, 27.0, 12.0, 12.0, 8.0, 7.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.845703125, -0.8184127807617188, -0.7911224365234375, -0.7638320922851562, -0.736541748046875, -0.7092514038085938, -0.6819610595703125, -0.6546707153320312, -0.62738037109375, -0.6000900268554688, -0.5727996826171875, -0.5455093383789062, -0.518218994140625, -0.49092864990234375, -0.4636383056640625, -0.43634796142578125, -0.4090576171875, -0.38176727294921875, -0.3544769287109375, -0.32718658447265625, -0.299896240234375, -0.27260589599609375, -0.2453155517578125, -0.21802520751953125, -0.19073486328125, -0.16344451904296875, -0.1361541748046875, -0.10886383056640625, -0.081573486328125, -0.05428314208984375, -0.0269927978515625, 0.00029754638671875, 0.027587890625, 0.05487823486328125, 0.0821685791015625, 0.10945892333984375, 0.136749267578125, 0.16403961181640625, 0.1913299560546875, 0.21862030029296875, 0.24591064453125, 0.27320098876953125, 0.3004913330078125, 0.32778167724609375, 0.355072021484375, 0.38236236572265625, 0.4096527099609375, 0.43694305419921875, 0.4642333984375, 0.49152374267578125, 0.5188140869140625, 0.5461044311523438, 0.573394775390625, 0.6006851196289062, 0.6279754638671875, 0.6552658081054688, 0.68255615234375, 0.7098464965820312, 0.7371368408203125, 0.7644271850585938, 0.791717529296875, 0.8190078735351562, 0.8462982177734375, 0.8735885620117188, 0.90087890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 9.0, 6.0, 5.0, 6.0, 16.0, 8.0, 7.0, 17.0, 20.0, 31.0, 31.0, 39.0, 51.0, 41.0, 34.0, 40.0, 40.0, 44.0, 46.0, 46.0, 42.0, 42.0, 43.0, 48.0, 35.0, 27.0, 31.0, 19.0, 33.0, 22.0, 22.0, 14.0, 18.0, 10.0, 17.0, 7.0, 7.0, 2.0, 5.0, 3.0, 8.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-1.599609375, -1.5549774169921875, -1.510345458984375, -1.4657135009765625, -1.42108154296875, -1.3764495849609375, -1.331817626953125, -1.2871856689453125, -1.2425537109375, -1.1979217529296875, -1.153289794921875, -1.1086578369140625, -1.06402587890625, -1.0193939208984375, -0.974761962890625, -0.9301300048828125, -0.885498046875, -0.8408660888671875, -0.796234130859375, -0.7516021728515625, -0.70697021484375, -0.6623382568359375, -0.617706298828125, -0.5730743408203125, -0.5284423828125, -0.4838104248046875, -0.439178466796875, -0.3945465087890625, -0.34991455078125, -0.3052825927734375, -0.260650634765625, -0.2160186767578125, -0.17138671875, -0.1267547607421875, -0.082122802734375, -0.0374908447265625, 0.00714111328125, 0.0517730712890625, 0.096405029296875, 0.1410369873046875, 0.1856689453125, 0.2303009033203125, 0.274932861328125, 0.3195648193359375, 0.36419677734375, 0.4088287353515625, 0.453460693359375, 0.4980926513671875, 0.542724609375, 0.5873565673828125, 0.631988525390625, 0.6766204833984375, 0.72125244140625, 0.7658843994140625, 0.810516357421875, 0.8551483154296875, 0.8997802734375, 0.9444122314453125, 0.989044189453125, 1.0336761474609375, 1.07830810546875, 1.1229400634765625, 1.167572021484375, 1.2122039794921875, 1.2568359375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 8.0, 8.0, 12.0, 20.0, 27.0, 42.0, 73.0, 102.0, 168.0, 272.0, 497.0, 992.0, 1917.0, 4460.0, 12023.0, 40854.0, 229793.0, 619738.0, 100863.0, 23182.0, 7423.0, 3033.0, 1366.0, 664.0, 414.0, 201.0, 123.0, 78.0, 67.0, 35.0, 28.0, 16.0, 6.0, 10.0, 11.0, 6.0, 4.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310546875, -0.30062103271484375, -0.2906951904296875, -0.28076934814453125, -0.270843505859375, -0.26091766357421875, -0.2509918212890625, -0.24106597900390625, -0.23114013671875, -0.22121429443359375, -0.2112884521484375, -0.20136260986328125, -0.191436767578125, -0.18151092529296875, -0.1715850830078125, -0.16165924072265625, -0.1517333984375, -0.14180755615234375, -0.1318817138671875, -0.12195587158203125, -0.112030029296875, -0.10210418701171875, -0.0921783447265625, -0.08225250244140625, -0.07232666015625, -0.06240081787109375, -0.0524749755859375, -0.04254913330078125, -0.032623291015625, -0.02269744873046875, -0.0127716064453125, -0.00284576416015625, 0.007080078125, 0.01700592041015625, 0.0269317626953125, 0.03685760498046875, 0.046783447265625, 0.05670928955078125, 0.0666351318359375, 0.07656097412109375, 0.08648681640625, 0.09641265869140625, 0.1063385009765625, 0.11626434326171875, 0.126190185546875, 0.13611602783203125, 0.1460418701171875, 0.15596771240234375, 0.1658935546875, 0.17581939697265625, 0.1857452392578125, 0.19567108154296875, 0.205596923828125, 0.21552276611328125, 0.2254486083984375, 0.23537445068359375, 0.24530029296875, 0.25522613525390625, 0.2651519775390625, 0.27507781982421875, 0.285003662109375, 0.29492950439453125, 0.3048553466796875, 0.31478118896484375, 0.32470703125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 8.0, 10.0, 11.0, 13.0, 22.0, 31.0, 49.0, 54.0, 64.0, 92.0, 132.0, 111.0, 113.0, 92.0, 53.0, 32.0, 27.0, 26.0, 13.0, 5.0, 9.0, 3.0, 6.0, 11.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7206878662109375e-05, -4.5464374125003815e-05, -4.3721869587898254e-05, -4.1979365050792694e-05, -4.0236860513687134e-05, -3.8494355976581573e-05, -3.675185143947601e-05, -3.500934690237045e-05, -3.326684236526489e-05, -3.152433782815933e-05, -2.9781833291053772e-05, -2.803932875394821e-05, -2.629682421684265e-05, -2.455431967973709e-05, -2.281181514263153e-05, -2.106931060552597e-05, -1.932680606842041e-05, -1.758430153131485e-05, -1.584179699420929e-05, -1.409929245710373e-05, -1.2356787919998169e-05, -1.0614283382892609e-05, -8.871778845787048e-06, -7.129274308681488e-06, -5.386769771575928e-06, -3.6442652344703674e-06, -1.9017606973648071e-06, -1.5925616025924683e-07, 1.5832483768463135e-06, 3.3257529139518738e-06, 5.068257451057434e-06, 6.810761988162994e-06, 8.553266525268555e-06, 1.0295771062374115e-05, 1.2038275599479675e-05, 1.3780780136585236e-05, 1.5523284673690796e-05, 1.7265789210796356e-05, 1.9008293747901917e-05, 2.0750798285007477e-05, 2.2493302822113037e-05, 2.4235807359218597e-05, 2.5978311896324158e-05, 2.7720816433429718e-05, 2.946332097053528e-05, 3.120582550764084e-05, 3.29483300447464e-05, 3.469083458185196e-05, 3.643333911895752e-05, 3.817584365606308e-05, 3.991834819316864e-05, 4.16608527302742e-05, 4.340335726737976e-05, 4.514586180448532e-05, 4.688836634159088e-05, 4.863087087869644e-05, 5.0373375415802e-05, 5.211587995290756e-05, 5.385838449001312e-05, 5.560088902711868e-05, 5.734339356422424e-05, 5.9085898101329803e-05, 6.0828402638435364e-05, 6.257090717554092e-05, 6.431341171264648e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 7.0, 5.0, 9.0, 15.0, 15.0, 30.0, 41.0, 65.0, 102.0, 188.0, 321.0, 758.0, 1655.0, 4206.0, 12759.0, 51236.0, 333707.0, 539229.0, 76560.0, 17909.0, 5733.0, 2107.0, 878.0, 438.0, 227.0, 121.0, 84.0, 46.0, 42.0, 20.0, 15.0, 7.0, 4.0, 4.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27978515625, -0.26947021484375, -0.2591552734375, -0.24884033203125, -0.238525390625, -0.22821044921875, -0.2178955078125, -0.20758056640625, -0.197265625, -0.18695068359375, -0.1766357421875, -0.16632080078125, -0.156005859375, -0.14569091796875, -0.1353759765625, -0.12506103515625, -0.11474609375, -0.10443115234375, -0.0941162109375, -0.08380126953125, -0.073486328125, -0.06317138671875, -0.0528564453125, -0.04254150390625, -0.0322265625, -0.02191162109375, -0.0115966796875, -0.00128173828125, 0.009033203125, 0.01934814453125, 0.0296630859375, 0.03997802734375, 0.05029296875, 0.06060791015625, 0.0709228515625, 0.08123779296875, 0.091552734375, 0.10186767578125, 0.1121826171875, 0.12249755859375, 0.1328125, 0.14312744140625, 0.1534423828125, 0.16375732421875, 0.174072265625, 0.18438720703125, 0.1947021484375, 0.20501708984375, 0.21533203125, 0.22564697265625, 0.2359619140625, 0.24627685546875, 0.256591796875, 0.26690673828125, 0.2772216796875, 0.28753662109375, 0.2978515625, 0.30816650390625, 0.3184814453125, 0.32879638671875, 0.339111328125, 0.34942626953125, 0.3597412109375, 0.37005615234375, 0.38037109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 2.0, 7.0, 9.0, 7.0, 13.0, 16.0, 15.0, 27.0, 20.0, 38.0, 67.0, 98.0, 97.0, 116.0, 107.0, 88.0, 80.0, 45.0, 32.0, 11.0, 25.0, 13.0, 14.0, 5.0, 6.0, 8.0, 2.0, 3.0, 11.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1741943359375, -0.16884803771972656, -0.16350173950195312, -0.1581554412841797, -0.15280914306640625, -0.1474628448486328, -0.14211654663085938, -0.13677024841308594, -0.1314239501953125, -0.12607765197753906, -0.12073135375976562, -0.11538505554199219, -0.11003875732421875, -0.10469245910644531, -0.09934616088867188, -0.09399986267089844, -0.088653564453125, -0.08330726623535156, -0.07796096801757812, -0.07261466979980469, -0.06726837158203125, -0.06192207336425781, -0.056575775146484375, -0.05122947692871094, -0.0458831787109375, -0.04053688049316406, -0.035190582275390625, -0.029844284057617188, -0.02449798583984375, -0.019151687622070312, -0.013805389404296875, -0.008459091186523438, -0.00311279296875, 0.0022335052490234375, 0.007579803466796875, 0.012926101684570312, 0.01827239990234375, 0.023618698120117188, 0.028964996337890625, 0.03431129455566406, 0.0396575927734375, 0.04500389099121094, 0.050350189208984375, 0.05569648742675781, 0.06104278564453125, 0.06638908386230469, 0.07173538208007812, 0.07708168029785156, 0.082427978515625, 0.08777427673339844, 0.09312057495117188, 0.09846687316894531, 0.10381317138671875, 0.10915946960449219, 0.11450576782226562, 0.11985206604003906, 0.1251983642578125, 0.13054466247558594, 0.13589096069335938, 0.1412372589111328, 0.14658355712890625, 0.1519298553466797, 0.15727615356445312, 0.16262245178222656, 0.16796875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 8.0, 19.0, 37.0, 81.0, 233.0, 338.0, 183.0, 64.0, 24.0, 8.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.351993560791016, -6.166636943817139, -5.981280326843262, -5.795923233032227, -5.61056661605835, -5.425209999084473, -5.239853382110596, -5.054496765136719, -4.869139671325684, -4.683783054351807, -4.49842643737793, -4.3130693435668945, -4.127712726593018, -3.9423561096191406, -3.7569994926452637, -3.5716428756713867, -3.3862862586975098, -3.200929641723633, -3.0155727863311768, -2.8302161693573, -2.6448593139648438, -2.459502696990967, -2.27414608001709, -2.088789463043213, -1.9034326076507568, -1.7180758714675903, -1.5327191352844238, -1.3473625183105469, -1.1620057821273804, -0.9766490459442139, -0.7912924289703369, -0.6059356927871704, -0.4205784797668457, -0.2352217733860016, -0.04986506700515747, 0.13549160957336426, 0.32084834575653076, 0.5062050819396973, 0.6915616989135742, 0.8769184350967407, 1.0622751712799072, 1.2476319074630737, 1.4329886436462402, 1.6183452606201172, 1.8037019968032837, 1.9890587329864502, 2.174415349960327, 2.359772205352783, 2.54512882232666, 2.730485439300537, 2.915842294692993, 3.10119891166687, 3.286555767059326, 3.471912384033203, 3.65726900100708, 3.842625617980957, 4.027982711791992, 4.213339328765869, 4.398695945739746, 4.584053039550781, 4.769409656524658, 4.954766273498535, 5.140122890472412, 5.325479507446289, 5.510836124420166]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 16.0, 10.0, 8.0, 5.0, 20.0, 17.0, 19.0, 20.0, 27.0, 41.0, 38.0, 45.0, 45.0, 39.0, 45.0, 38.0, 50.0, 52.0, 55.0, 48.0, 54.0, 40.0, 43.0, 36.0, 37.0, 31.0, 13.0, 26.0, 16.0, 19.0, 16.0, 7.0, 5.0, 5.0, 2.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.7163403034210205, -2.6242775917053223, -2.532214879989624, -2.440152168273926, -2.3480896949768066, -2.2560269832611084, -2.16396427154541, -2.071901559829712, -1.9798389673233032, -1.887776255607605, -1.7957136631011963, -1.703650951385498, -1.6115882396697998, -1.5195256471633911, -1.4274629354476929, -1.3354003429412842, -1.243337631225586, -1.1512749195098877, -1.059212327003479, -0.9671496152877808, -0.8750869631767273, -0.7830243110656738, -0.6909615993499756, -0.5988989472389221, -0.5068362951278687, -0.4147736430168152, -0.32271096110343933, -0.23064827919006348, -0.13858562707901, -0.04652297496795654, 0.0455397367477417, 0.13760238885879517, 0.22966527938842773, 0.3217279314994812, 0.41379061341285706, 0.5058532953262329, 0.5979159474372864, 0.6899785995483398, 0.7820413112640381, 0.8741039633750916, 0.966166615486145, 1.0582293272018433, 1.150291919708252, 1.2423546314239502, 1.3344173431396484, 1.4264799356460571, 1.5185426473617554, 1.610605239868164, 1.7026679515838623, 1.7947306632995605, 1.8867932558059692, 1.9788559675216675, 2.070918560028076, 2.1629812717437744, 2.2550439834594727, 2.347106695175171, 2.439169406890869, 2.5312321186065674, 2.6232948303222656, 2.7153573036193848, 2.807420015335083, 2.8994827270507812, 2.9915454387664795, 3.0836081504821777, 3.175670623779297]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 8.0, 5.0, 17.0, 23.0, 36.0, 80.0, 167.0, 299.0, 745.0, 1964.0, 7328.0, 51164.0, 2618149.0, 1470043.0, 35725.0, 5708.0, 1614.0, 620.0, 272.0, 133.0, 83.0, 45.0, 30.0, 12.0, 8.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.53125, -1.461456298828125, -1.39166259765625, -1.321868896484375, -1.2520751953125, -1.182281494140625, -1.11248779296875, -1.042694091796875, -0.972900390625, -0.903106689453125, -0.83331298828125, -0.763519287109375, -0.6937255859375, -0.623931884765625, -0.55413818359375, -0.484344482421875, -0.41455078125, -0.344757080078125, -0.27496337890625, -0.205169677734375, -0.1353759765625, -0.065582275390625, 0.00421142578125, 0.074005126953125, 0.143798828125, 0.213592529296875, 0.28338623046875, 0.353179931640625, 0.4229736328125, 0.492767333984375, 0.56256103515625, 0.632354736328125, 0.7021484375, 0.771942138671875, 0.84173583984375, 0.911529541015625, 0.9813232421875, 1.051116943359375, 1.12091064453125, 1.190704345703125, 1.260498046875, 1.330291748046875, 1.40008544921875, 1.469879150390625, 1.5396728515625, 1.609466552734375, 1.67926025390625, 1.749053955078125, 1.81884765625, 1.888641357421875, 1.95843505859375, 2.028228759765625, 2.0980224609375, 2.167816162109375, 2.23760986328125, 2.307403564453125, 2.377197265625, 2.446990966796875, 2.51678466796875, 2.586578369140625, 2.6563720703125, 2.726165771484375, 2.79595947265625, 2.865753173828125, 2.935546875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 10.0, 12.0, 11.0, 14.0, 16.0, 26.0, 23.0, 28.0, 49.0, 41.0, 79.0, 71.0, 62.0, 81.0, 82.0, 58.0, 64.0, 55.0, 53.0, 36.0, 30.0, 27.0, 12.0, 19.0, 12.0, 3.0, 8.0, 5.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.056640625, -1.0222320556640625, -0.987823486328125, -0.9534149169921875, -0.91900634765625, -0.8845977783203125, -0.850189208984375, -0.8157806396484375, -0.7813720703125, -0.7469635009765625, -0.712554931640625, -0.6781463623046875, -0.64373779296875, -0.6093292236328125, -0.574920654296875, -0.5405120849609375, -0.506103515625, -0.4716949462890625, -0.437286376953125, -0.4028778076171875, -0.36846923828125, -0.3340606689453125, -0.299652099609375, -0.2652435302734375, -0.2308349609375, -0.1964263916015625, -0.162017822265625, -0.1276092529296875, -0.09320068359375, -0.0587921142578125, -0.024383544921875, 0.0100250244140625, 0.04443359375, 0.0788421630859375, 0.113250732421875, 0.1476593017578125, 0.18206787109375, 0.2164764404296875, 0.250885009765625, 0.2852935791015625, 0.3197021484375, 0.3541107177734375, 0.388519287109375, 0.4229278564453125, 0.45733642578125, 0.4917449951171875, 0.526153564453125, 0.5605621337890625, 0.594970703125, 0.6293792724609375, 0.663787841796875, 0.6981964111328125, 0.73260498046875, 0.7670135498046875, 0.801422119140625, 0.8358306884765625, 0.8702392578125, 0.9046478271484375, 0.939056396484375, 0.9734649658203125, 1.00787353515625, 1.0422821044921875, 1.076690673828125, 1.1110992431640625, 1.1455078125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 5.0, 16.0, 20.0, 18.0, 38.0, 47.0, 65.0, 112.0, 147.0, 226.0, 440.0, 786.0, 1659.0, 3571.0, 9606.0, 33182.0, 194310.0, 3287601.0, 577608.0, 59910.0, 15059.0, 5233.0, 2229.0, 1022.0, 553.0, 295.0, 156.0, 102.0, 78.0, 56.0, 34.0, 24.0, 16.0, 11.0, 9.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0108795166015625, -0.976837158203125, -0.9427947998046875, -0.90875244140625, -0.8747100830078125, -0.840667724609375, -0.8066253662109375, -0.7725830078125, -0.7385406494140625, -0.704498291015625, -0.6704559326171875, -0.63641357421875, -0.6023712158203125, -0.568328857421875, -0.5342864990234375, -0.500244140625, -0.4662017822265625, -0.432159423828125, -0.3981170654296875, -0.36407470703125, -0.3300323486328125, -0.295989990234375, -0.2619476318359375, -0.2279052734375, -0.1938629150390625, -0.159820556640625, -0.1257781982421875, -0.09173583984375, -0.0576934814453125, -0.023651123046875, 0.0103912353515625, 0.04443359375, 0.0784759521484375, 0.112518310546875, 0.1465606689453125, 0.18060302734375, 0.2146453857421875, 0.248687744140625, 0.2827301025390625, 0.3167724609375, 0.3508148193359375, 0.384857177734375, 0.4188995361328125, 0.45294189453125, 0.4869842529296875, 0.521026611328125, 0.5550689697265625, 0.589111328125, 0.6231536865234375, 0.657196044921875, 0.6912384033203125, 0.72528076171875, 0.7593231201171875, 0.793365478515625, 0.8274078369140625, 0.8614501953125, 0.8954925537109375, 0.929534912109375, 0.9635772705078125, 0.99761962890625, 1.0316619873046875, 1.065704345703125, 1.0997467041015625, 1.1337890625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 4.0, 7.0, 10.0, 8.0, 15.0, 15.0, 14.0, 44.0, 41.0, 59.0, 76.0, 112.0, 178.0, 287.0, 467.0, 685.0, 717.0, 448.0, 289.0, 187.0, 103.0, 69.0, 68.0, 32.0, 34.0, 18.0, 13.0, 12.0, 10.0, 10.0, 10.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.288330078125, -0.2793121337890625, -0.270294189453125, -0.2612762451171875, -0.25225830078125, -0.2432403564453125, -0.234222412109375, -0.2252044677734375, -0.2161865234375, -0.2071685791015625, -0.198150634765625, -0.1891326904296875, -0.18011474609375, -0.1710968017578125, -0.162078857421875, -0.1530609130859375, -0.14404296875, -0.1350250244140625, -0.126007080078125, -0.1169891357421875, -0.10797119140625, -0.0989532470703125, -0.089935302734375, -0.0809173583984375, -0.0718994140625, -0.0628814697265625, -0.053863525390625, -0.0448455810546875, -0.03582763671875, -0.0268096923828125, -0.017791748046875, -0.0087738037109375, 0.000244140625, 0.0092620849609375, 0.018280029296875, 0.0272979736328125, 0.03631591796875, 0.0453338623046875, 0.054351806640625, 0.0633697509765625, 0.0723876953125, 0.0814056396484375, 0.090423583984375, 0.0994415283203125, 0.10845947265625, 0.1174774169921875, 0.126495361328125, 0.1355133056640625, 0.14453125, 0.1535491943359375, 0.162567138671875, 0.1715850830078125, 0.18060302734375, 0.1896209716796875, 0.198638916015625, 0.2076568603515625, 0.2166748046875, 0.2256927490234375, 0.234710693359375, 0.2437286376953125, 0.25274658203125, 0.2617645263671875, 0.270782470703125, 0.2798004150390625, 0.288818359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 0.0, 4.0, 8.0, 8.0, 17.0, 28.0, 39.0, 53.0, 97.0, 152.0, 169.0, 155.0, 139.0, 58.0, 31.0, 15.0, 14.0, 8.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6436997652053833, -1.5736243724822998, -1.5035490989685059, -1.433473825454712, -1.3633984327316284, -1.293323040008545, -1.223247766494751, -1.153172492980957, -1.0830971002578735, -1.01302170753479, -0.9429464340209961, -0.8728711009025574, -0.8027957677841187, -0.7327204346656799, -0.6626451015472412, -0.5925697684288025, -0.5224944353103638, -0.45241910219192505, -0.38234376907348633, -0.3122684359550476, -0.2421931028366089, -0.17211776971817017, -0.10204243659973145, -0.031967103481292725, 0.038108229637145996, 0.10818356275558472, 0.17825889587402344, 0.24833422899246216, 0.3184095621109009, 0.3884848952293396, 0.4585602283477783, 0.528635561466217, 0.5987107753753662, 0.6687861084938049, 0.7388614416122437, 0.8089367747306824, 0.8790121078491211, 0.9490874409675598, 1.0191627740859985, 1.089238166809082, 1.159313440322876, 1.22938871383667, 1.2994641065597534, 1.369539499282837, 1.4396147727966309, 1.5096900463104248, 1.5797654390335083, 1.6498408317565918, 1.7199161052703857, 1.7899913787841797, 1.8600667715072632, 1.9301421642303467, 2.0002174377441406, 2.0702927112579346, 2.1403679847717285, 2.2104434967041016, 2.2805187702178955, 2.3505940437316895, 2.4206695556640625, 2.4907448291778564, 2.5608201026916504, 2.6308953762054443, 2.7009706497192383, 2.7710461616516113, 2.8411214351654053]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 5.0, 6.0, 9.0, 8.0, 17.0, 21.0, 25.0, 25.0, 44.0, 41.0, 44.0, 48.0, 54.0, 63.0, 54.0, 67.0, 51.0, 50.0, 49.0, 49.0, 51.0, 47.0, 26.0, 25.0, 18.0, 19.0, 18.0, 10.0, 10.0, 9.0, 9.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.9853600859642029, -0.9542308449745178, -0.923101544380188, -0.8919723033905029, -0.8608430624008179, -0.8297138214111328, -0.798584520816803, -0.7674552798271179, -0.7363259792327881, -0.705196738243103, -0.6740674376487732, -0.6429381966590881, -0.6118089556694031, -0.5806796550750732, -0.5495504140853882, -0.5184211730957031, -0.48729193210601807, -0.4561626613140106, -0.42503342032432556, -0.3939041495323181, -0.36277490854263306, -0.3316456377506256, -0.30051636695861816, -0.2693871259689331, -0.23825785517692566, -0.2071285992860794, -0.17599934339523315, -0.1448700726032257, -0.11374081671237946, -0.0826115608215332, -0.05148229002952576, -0.020353034138679504, 0.010776281356811523, 0.041905540972948074, 0.07303480058908463, 0.10416406393051147, 0.13529331982135773, 0.16642257571220398, 0.19755184650421143, 0.22868110239505768, 0.25981035828590393, 0.2909396290779114, 0.32206887006759644, 0.3531981408596039, 0.38432741165161133, 0.4154566526412964, 0.44658592343330383, 0.4777151942253113, 0.5088444352149963, 0.5399736762046814, 0.5711029767990112, 0.6022322177886963, 0.6333614587783813, 0.6644906997680664, 0.6956200003623962, 0.7267492413520813, 0.7578785419464111, 0.7890077829360962, 0.820137083530426, 0.8512663245201111, 0.8823955655097961, 0.913524866104126, 0.944654107093811, 0.9757833480834961, 1.0069125890731812]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 10.0, 7.0, 8.0, 15.0, 23.0, 29.0, 39.0, 86.0, 97.0, 164.0, 236.0, 395.0, 729.0, 1299.0, 2455.0, 5139.0, 11581.0, 28350.0, 80274.0, 270019.0, 419662.0, 147123.0, 47355.0, 17896.0, 7856.0, 3547.0, 1779.0, 943.0, 553.0, 313.0, 203.0, 134.0, 76.0, 46.0, 32.0, 24.0, 20.0, 8.0, 9.0, 4.0, 5.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.119140625, -0.11532878875732422, -0.11151695251464844, -0.10770511627197266, -0.10389328002929688, -0.1000814437866211, -0.09626960754394531, -0.09245777130126953, -0.08864593505859375, -0.08483409881591797, -0.08102226257324219, -0.0772104263305664, -0.07339859008789062, -0.06958675384521484, -0.06577491760253906, -0.06196308135986328, -0.0581512451171875, -0.05433940887451172, -0.05052757263183594, -0.046715736389160156, -0.042903900146484375, -0.039092063903808594, -0.03528022766113281, -0.03146839141845703, -0.02765655517578125, -0.02384471893310547, -0.020032882690429688, -0.016221046447753906, -0.012409210205078125, -0.008597373962402344, -0.0047855377197265625, -0.0009737014770507812, 0.002838134765625, 0.006649971008300781, 0.010461807250976562, 0.014273643493652344, 0.018085479736328125, 0.021897315979003906, 0.025709152221679688, 0.02952098846435547, 0.03333282470703125, 0.03714466094970703, 0.04095649719238281, 0.044768333435058594, 0.048580169677734375, 0.052392005920410156, 0.05620384216308594, 0.06001567840576172, 0.0638275146484375, 0.06763935089111328, 0.07145118713378906, 0.07526302337646484, 0.07907485961914062, 0.0828866958618164, 0.08669853210449219, 0.09051036834716797, 0.09432220458984375, 0.09813404083251953, 0.10194587707519531, 0.1057577133178711, 0.10956954956054688, 0.11338138580322266, 0.11719322204589844, 0.12100505828857422, 0.12481689453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 7.0, 6.0, 12.0, 14.0, 18.0, 24.0, 43.0, 56.0, 47.0, 56.0, 53.0, 66.0, 92.0, 66.0, 65.0, 62.0, 61.0, 41.0, 50.0, 32.0, 22.0, 24.0, 13.0, 15.0, 6.0, 9.0, 6.0, 3.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.74853515625, -0.7244033813476562, -0.7002716064453125, -0.6761398315429688, -0.652008056640625, -0.6278762817382812, -0.6037445068359375, -0.5796127319335938, -0.55548095703125, -0.5313491821289062, -0.5072174072265625, -0.48308563232421875, -0.458953857421875, -0.43482208251953125, -0.4106903076171875, -0.38655853271484375, -0.3624267578125, -0.33829498291015625, -0.3141632080078125, -0.29003143310546875, -0.265899658203125, -0.24176788330078125, -0.2176361083984375, -0.19350433349609375, -0.16937255859375, -0.14524078369140625, -0.1211090087890625, -0.09697723388671875, -0.072845458984375, -0.04871368408203125, -0.0245819091796875, -0.00045013427734375, 0.023681640625, 0.04781341552734375, 0.0719451904296875, 0.09607696533203125, 0.120208740234375, 0.14434051513671875, 0.1684722900390625, 0.19260406494140625, 0.21673583984375, 0.24086761474609375, 0.2649993896484375, 0.28913116455078125, 0.313262939453125, 0.33739471435546875, 0.3615264892578125, 0.38565826416015625, 0.4097900390625, 0.43392181396484375, 0.4580535888671875, 0.48218536376953125, 0.506317138671875, 0.5304489135742188, 0.5545806884765625, 0.5787124633789062, 0.60284423828125, 0.6269760131835938, 0.6511077880859375, 0.6752395629882812, 0.699371337890625, 0.7235031127929688, 0.7476348876953125, 0.7717666625976562, 0.7958984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 5.0, 11.0, 12.0, 15.0, 29.0, 17.0, 41.0, 61.0, 82.0, 189.0, 328.0, 664.0, 1657.0, 4659.0, 18509.0, 101906.0, 549199.0, 308338.0, 47663.0, 9982.0, 2907.0, 1135.0, 449.0, 267.0, 150.0, 85.0, 58.0, 33.0, 26.0, 17.0, 12.0, 17.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1824951171875, -0.17724990844726562, -0.17200469970703125, -0.16675949096679688, -0.1615142822265625, -0.15626907348632812, -0.15102386474609375, -0.14577865600585938, -0.140533447265625, -0.13528823852539062, -0.13004302978515625, -0.12479782104492188, -0.1195526123046875, -0.11430740356445312, -0.10906219482421875, -0.10381698608398438, -0.09857177734375, -0.09332656860351562, -0.08808135986328125, -0.08283615112304688, -0.0775909423828125, -0.07234573364257812, -0.06710052490234375, -0.061855316162109375, -0.056610107421875, -0.051364898681640625, -0.04611968994140625, -0.040874481201171875, -0.0356292724609375, -0.030384063720703125, -0.02513885498046875, -0.019893646240234375, -0.0146484375, -0.009403228759765625, -0.00415802001953125, 0.001087188720703125, 0.0063323974609375, 0.011577606201171875, 0.01682281494140625, 0.022068023681640625, 0.027313232421875, 0.032558441162109375, 0.03780364990234375, 0.043048858642578125, 0.0482940673828125, 0.053539276123046875, 0.05878448486328125, 0.06402969360351562, 0.06927490234375, 0.07452011108398438, 0.07976531982421875, 0.08501052856445312, 0.0902557373046875, 0.09550094604492188, 0.10074615478515625, 0.10599136352539062, 0.111236572265625, 0.11648178100585938, 0.12172698974609375, 0.12697219848632812, 0.1322174072265625, 0.13746261596679688, 0.14270782470703125, 0.14795303344726562, 0.1531982421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 3.0, 12.0, 6.0, 12.0, 16.0, 24.0, 23.0, 22.0, 30.0, 43.0, 44.0, 34.0, 45.0, 44.0, 54.0, 44.0, 67.0, 41.0, 57.0, 44.0, 45.0, 37.0, 49.0, 28.0, 24.0, 21.0, 28.0, 16.0, 18.0, 7.0, 13.0, 14.0, 6.0, 4.0, 6.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.333984375, -1.2990951538085938, -1.2642059326171875, -1.2293167114257812, -1.194427490234375, -1.1595382690429688, -1.1246490478515625, -1.0897598266601562, -1.05487060546875, -1.0199813842773438, -0.9850921630859375, -0.9502029418945312, -0.915313720703125, -0.8804244995117188, -0.8455352783203125, -0.8106460571289062, -0.7757568359375, -0.7408676147460938, -0.7059783935546875, -0.6710891723632812, -0.636199951171875, -0.6013107299804688, -0.5664215087890625, -0.5315322875976562, -0.49664306640625, -0.46175384521484375, -0.4268646240234375, -0.39197540283203125, -0.357086181640625, -0.32219696044921875, -0.2873077392578125, -0.25241851806640625, -0.217529296875, -0.18264007568359375, -0.1477508544921875, -0.11286163330078125, -0.077972412109375, -0.04308319091796875, -0.0081939697265625, 0.02669525146484375, 0.06158447265625, 0.09647369384765625, 0.1313629150390625, 0.16625213623046875, 0.201141357421875, 0.23603057861328125, 0.2709197998046875, 0.30580902099609375, 0.3406982421875, 0.37558746337890625, 0.4104766845703125, 0.44536590576171875, 0.480255126953125, 0.5151443481445312, 0.5500335693359375, 0.5849227905273438, 0.61981201171875, 0.6547012329101562, 0.6895904541015625, 0.7244796752929688, 0.759368896484375, 0.7942581176757812, 0.8291473388671875, 0.8640365600585938, 0.89892578125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 7.0, 5.0, 5.0, 17.0, 10.0, 16.0, 25.0, 36.0, 41.0, 109.0, 145.0, 277.0, 641.0, 1292.0, 3260.0, 10539.0, 45466.0, 394649.0, 518339.0, 55039.0, 12147.0, 3687.0, 1405.0, 628.0, 282.0, 195.0, 101.0, 50.0, 38.0, 30.0, 17.0, 18.0, 11.0, 10.0, 10.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06707763671875, -0.06484603881835938, -0.06261444091796875, -0.060382843017578125, -0.0581512451171875, -0.055919647216796875, -0.05368804931640625, -0.051456451416015625, -0.049224853515625, -0.046993255615234375, -0.04476165771484375, -0.042530059814453125, -0.0402984619140625, -0.038066864013671875, -0.03583526611328125, -0.033603668212890625, -0.0313720703125, -0.029140472412109375, -0.02690887451171875, -0.024677276611328125, -0.0224456787109375, -0.020214080810546875, -0.01798248291015625, -0.015750885009765625, -0.013519287109375, -0.011287689208984375, -0.00905609130859375, -0.006824493408203125, -0.0045928955078125, -0.002361297607421875, -0.00012969970703125, 0.002101898193359375, 0.00433349609375, 0.006565093994140625, 0.00879669189453125, 0.011028289794921875, 0.0132598876953125, 0.015491485595703125, 0.01772308349609375, 0.019954681396484375, 0.022186279296875, 0.024417877197265625, 0.02664947509765625, 0.028881072998046875, 0.0311126708984375, 0.033344268798828125, 0.03557586669921875, 0.037807464599609375, 0.0400390625, 0.042270660400390625, 0.04450225830078125, 0.046733856201171875, 0.0489654541015625, 0.051197052001953125, 0.05342864990234375, 0.055660247802734375, 0.057891845703125, 0.060123443603515625, 0.06235504150390625, 0.06458663940429688, 0.0668182373046875, 0.06904983520507812, 0.07128143310546875, 0.07351303100585938, 0.07574462890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 3.0, 9.0, 19.0, 15.0, 12.0, 31.0, 45.0, 42.0, 89.0, 94.0, 106.0, 116.0, 93.0, 82.0, 48.0, 48.0, 33.0, 24.0, 18.0, 13.0, 4.0, 10.0, 13.0, 4.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.193450927734375e-05, -2.0951032638549805e-05, -1.996755599975586e-05, -1.8984079360961914e-05, -1.800060272216797e-05, -1.7017126083374023e-05, -1.6033649444580078e-05, -1.5050172805786133e-05, -1.4066696166992188e-05, -1.3083219528198242e-05, -1.2099742889404297e-05, -1.1116266250610352e-05, -1.0132789611816406e-05, -9.149312973022461e-06, -8.165836334228516e-06, -7.18235969543457e-06, -6.198883056640625e-06, -5.21540641784668e-06, -4.231929779052734e-06, -3.248453140258789e-06, -2.2649765014648438e-06, -1.2814998626708984e-06, -2.980232238769531e-07, 6.854534149169922e-07, 1.6689300537109375e-06, 2.652406692504883e-06, 3.635883331298828e-06, 4.6193599700927734e-06, 5.602836608886719e-06, 6.586313247680664e-06, 7.569789886474609e-06, 8.553266525268555e-06, 9.5367431640625e-06, 1.0520219802856445e-05, 1.150369644165039e-05, 1.2487173080444336e-05, 1.3470649719238281e-05, 1.4454126358032227e-05, 1.5437602996826172e-05, 1.6421079635620117e-05, 1.7404556274414062e-05, 1.8388032913208008e-05, 1.9371509552001953e-05, 2.03549861907959e-05, 2.1338462829589844e-05, 2.232193946838379e-05, 2.3305416107177734e-05, 2.428889274597168e-05, 2.5272369384765625e-05, 2.625584602355957e-05, 2.7239322662353516e-05, 2.822279930114746e-05, 2.9206275939941406e-05, 3.018975257873535e-05, 3.11732292175293e-05, 3.215670585632324e-05, 3.314018249511719e-05, 3.412365913391113e-05, 3.510713577270508e-05, 3.6090612411499023e-05, 3.707408905029297e-05, 3.8057565689086914e-05, 3.904104232788086e-05, 4.0024518966674805e-05, 4.100799560546875e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 5.0, 6.0, 5.0, 3.0, 8.0, 20.0, 22.0, 35.0, 44.0, 67.0, 131.0, 239.0, 459.0, 994.0, 2273.0, 5665.0, 16813.0, 60320.0, 317728.0, 510042.0, 96050.0, 24270.0, 7910.0, 2921.0, 1222.0, 565.0, 305.0, 136.0, 93.0, 49.0, 46.0, 29.0, 17.0, 12.0, 8.0, 6.0, 4.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.05902099609375, -0.057240962982177734, -0.05546092987060547, -0.0536808967590332, -0.05190086364746094, -0.05012083053588867, -0.048340797424316406, -0.04656076431274414, -0.044780731201171875, -0.04300069808959961, -0.041220664978027344, -0.03944063186645508, -0.03766059875488281, -0.03588056564331055, -0.03410053253173828, -0.032320499420166016, -0.03054046630859375, -0.028760433197021484, -0.02698040008544922, -0.025200366973876953, -0.023420333862304688, -0.021640300750732422, -0.019860267639160156, -0.01808023452758789, -0.016300201416015625, -0.01452016830444336, -0.012740135192871094, -0.010960102081298828, -0.009180068969726562, -0.007400035858154297, -0.005620002746582031, -0.0038399696350097656, -0.0020599365234375, -0.0002799034118652344, 0.0015001296997070312, 0.003280162811279297, 0.0050601959228515625, 0.006840229034423828, 0.008620262145996094, 0.01040029525756836, 0.012180328369140625, 0.01396036148071289, 0.015740394592285156, 0.017520427703857422, 0.019300460815429688, 0.021080493927001953, 0.02286052703857422, 0.024640560150146484, 0.02642059326171875, 0.028200626373291016, 0.02998065948486328, 0.03176069259643555, 0.03354072570800781, 0.03532075881958008, 0.037100791931152344, 0.03888082504272461, 0.040660858154296875, 0.04244089126586914, 0.044220924377441406, 0.04600095748901367, 0.04778099060058594, 0.0495610237121582, 0.05134105682373047, 0.053121089935302734, 0.054901123046875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 6.0, 10.0, 14.0, 10.0, 9.0, 21.0, 13.0, 16.0, 16.0, 36.0, 39.0, 48.0, 61.0, 91.0, 93.0, 99.0, 81.0, 67.0, 58.0, 39.0, 35.0, 18.0, 27.0, 16.0, 9.0, 9.0, 11.0, 8.0, 5.0, 3.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.013336181640625, -0.012967109680175781, -0.012598037719726562, -0.012228965759277344, -0.011859893798828125, -0.011490821838378906, -0.011121749877929688, -0.010752677917480469, -0.01038360595703125, -0.010014533996582031, -0.009645462036132812, -0.009276390075683594, -0.008907318115234375, -0.008538246154785156, -0.008169174194335938, -0.007800102233886719, -0.0074310302734375, -0.007061958312988281, -0.0066928863525390625, -0.006323814392089844, -0.005954742431640625, -0.005585670471191406, -0.0052165985107421875, -0.004847526550292969, -0.00447845458984375, -0.004109382629394531, -0.0037403106689453125, -0.0033712387084960938, -0.003002166748046875, -0.0026330947875976562, -0.0022640228271484375, -0.0018949508666992188, -0.00152587890625, -0.0011568069458007812, -0.0007877349853515625, -0.00041866302490234375, -4.9591064453125e-05, 0.00031948089599609375, 0.0006885528564453125, 0.0010576248168945312, 0.00142669677734375, 0.0017957687377929688, 0.0021648406982421875, 0.0025339126586914062, 0.002902984619140625, 0.0032720565795898438, 0.0036411285400390625, 0.004010200500488281, 0.0043792724609375, 0.004748344421386719, 0.0051174163818359375, 0.005486488342285156, 0.005855560302734375, 0.006224632263183594, 0.0065937042236328125, 0.006962776184082031, 0.00733184814453125, 0.007700920104980469, 0.008069992065429688, 0.008439064025878906, 0.008808135986328125, 0.009177207946777344, 0.009546279907226562, 0.009915351867675781, 0.010284423828125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 10.0, 21.0, 31.0, 58.0, 107.0, 199.0, 232.0, 184.0, 81.0, 30.0, 18.0, 10.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4329123497009277, -1.37594735622406, -1.3189823627471924, -1.2620173692703247, -1.205052375793457, -1.1480873823165894, -1.0911223888397217, -1.034157395362854, -0.9771924018859863, -0.9202274084091187, -0.863262414932251, -0.8062974214553833, -0.7493324279785156, -0.692367434501648, -0.6354024410247803, -0.5784374475479126, -0.5214724540710449, -0.46450746059417725, -0.40754246711730957, -0.3505774736404419, -0.2936124801635742, -0.23664748668670654, -0.17968249320983887, -0.12271749973297119, -0.06575250625610352, -0.00878751277923584, 0.048177480697631836, 0.10514247417449951, 0.1621074676513672, 0.21907246112823486, 0.27603745460510254, 0.3330024480819702, 0.3899674415588379, 0.44693243503570557, 0.5038974285125732, 0.5608624219894409, 0.6178274154663086, 0.6747924089431763, 0.731757402420044, 0.7887223958969116, 0.8456873893737793, 0.902652382850647, 0.9596173763275146, 1.0165823698043823, 1.07354736328125, 1.1305123567581177, 1.1874773502349854, 1.244442343711853, 1.3014073371887207, 1.3583723306655884, 1.415337324142456, 1.4723023176193237, 1.5292673110961914, 1.586232304573059, 1.6431972980499268, 1.7001622915267944, 1.757127285003662, 1.8140922784805298, 1.8710572719573975, 1.9280222654342651, 1.9849872589111328, 2.041952133178711, 2.098917245864868, 2.1558823585510254, 2.2128472328186035]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 9.0, 3.0, 2.0, 10.0, 13.0, 11.0, 11.0, 23.0, 27.0, 40.0, 44.0, 52.0, 49.0, 61.0, 60.0, 77.0, 60.0, 64.0, 56.0, 58.0, 54.0, 44.0, 37.0, 23.0, 18.0, 25.0, 14.0, 12.0, 11.0, 9.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.649139404296875, -0.6276806592941284, -0.6062219142913818, -0.5847631692886353, -0.5633044838905334, -0.5418457388877869, -0.5203869938850403, -0.4989282488822937, -0.4774695336818695, -0.4560107886791229, -0.43455207347869873, -0.41309332847595215, -0.39163458347320557, -0.37017586827278137, -0.3487171232700348, -0.3272584080696106, -0.305799663066864, -0.28434091806411743, -0.26288220286369324, -0.24142345786094666, -0.21996472775936127, -0.19850599765777588, -0.1770472526550293, -0.1555885225534439, -0.13412979245185852, -0.11267106235027313, -0.09121232479810715, -0.06975358724594116, -0.048294857144355774, -0.026836127042770386, -0.005377382040023804, 0.016081348061561584, 0.03754013776779175, 0.058998871594667435, 0.08045760542154312, 0.1019163429737091, 0.1233750730752945, 0.14483380317687988, 0.16629254817962646, 0.18775127828121185, 0.20921000838279724, 0.23066873848438263, 0.252127468585968, 0.2735862135887146, 0.2950449585914612, 0.3165036737918854, 0.33796241879463196, 0.35942113399505615, 0.38087987899780273, 0.4023386240005493, 0.4237973392009735, 0.4452560842037201, 0.4667147994041443, 0.48817354440689087, 0.5096322894096375, 0.531091034412384, 0.5525497198104858, 0.5740084648132324, 0.595467209815979, 0.6169259548187256, 0.6383846402168274, 0.659843385219574, 0.6813021302223206, 0.7027608752250671, 0.7242196202278137]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 6.0, 22.0, 22.0, 26.0, 59.0, 64.0, 111.0, 169.0, 270.0, 397.0, 695.0, 1203.0, 1978.0, 3790.0, 7049.0, 14527.0, 33298.0, 92344.0, 340244.0, 379365.0, 103536.0, 36688.0, 15926.0, 7564.0, 3855.0, 2112.0, 1240.0, 760.0, 428.0, 278.0, 199.0, 113.0, 76.0, 57.0, 23.0, 16.0, 15.0, 9.0, 8.0, 2.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48193359375, -0.464752197265625, -0.44757080078125, -0.430389404296875, -0.4132080078125, -0.396026611328125, -0.37884521484375, -0.361663818359375, -0.344482421875, -0.327301025390625, -0.31011962890625, -0.292938232421875, -0.2757568359375, -0.258575439453125, -0.24139404296875, -0.224212646484375, -0.20703125, -0.189849853515625, -0.17266845703125, -0.155487060546875, -0.1383056640625, -0.121124267578125, -0.10394287109375, -0.086761474609375, -0.069580078125, -0.052398681640625, -0.03521728515625, -0.018035888671875, -0.0008544921875, 0.016326904296875, 0.03350830078125, 0.050689697265625, 0.06787109375, 0.085052490234375, 0.10223388671875, 0.119415283203125, 0.1365966796875, 0.153778076171875, 0.17095947265625, 0.188140869140625, 0.205322265625, 0.222503662109375, 0.23968505859375, 0.256866455078125, 0.2740478515625, 0.291229248046875, 0.30841064453125, 0.325592041015625, 0.3427734375, 0.359954833984375, 0.37713623046875, 0.394317626953125, 0.4114990234375, 0.428680419921875, 0.44586181640625, 0.463043212890625, 0.480224609375, 0.497406005859375, 0.51458740234375, 0.531768798828125, 0.5489501953125, 0.566131591796875, 0.58331298828125, 0.600494384765625, 0.61767578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 5.0, 4.0, 11.0, 15.0, 16.0, 17.0, 30.0, 36.0, 52.0, 52.0, 56.0, 67.0, 87.0, 75.0, 89.0, 60.0, 57.0, 53.0, 56.0, 30.0, 24.0, 28.0, 16.0, 10.0, 15.0, 7.0, 10.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5703125, -1.51556396484375, -1.4608154296875, -1.40606689453125, -1.351318359375, -1.29656982421875, -1.2418212890625, -1.18707275390625, -1.13232421875, -1.07757568359375, -1.0228271484375, -0.96807861328125, -0.913330078125, -0.85858154296875, -0.8038330078125, -0.74908447265625, -0.6943359375, -0.63958740234375, -0.5848388671875, -0.53009033203125, -0.475341796875, -0.42059326171875, -0.3658447265625, -0.31109619140625, -0.25634765625, -0.20159912109375, -0.1468505859375, -0.09210205078125, -0.037353515625, 0.01739501953125, 0.0721435546875, 0.12689208984375, 0.181640625, 0.23638916015625, 0.2911376953125, 0.34588623046875, 0.400634765625, 0.45538330078125, 0.5101318359375, 0.56488037109375, 0.61962890625, 0.67437744140625, 0.7291259765625, 0.78387451171875, 0.838623046875, 0.89337158203125, 0.9481201171875, 1.00286865234375, 1.0576171875, 1.11236572265625, 1.1671142578125, 1.22186279296875, 1.276611328125, 1.33135986328125, 1.3861083984375, 1.44085693359375, 1.49560546875, 1.55035400390625, 1.6051025390625, 1.65985107421875, 1.714599609375, 1.76934814453125, 1.8240966796875, 1.87884521484375, 1.93359375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 5.0, 10.0, 9.0, 18.0, 17.0, 36.0, 51.0, 65.0, 77.0, 109.0, 171.0, 235.0, 449.0, 769.0, 1550.0, 3762.0, 10478.0, 38136.0, 225757.0, 620059.0, 111222.0, 23037.0, 7003.0, 2696.0, 1220.0, 599.0, 306.0, 231.0, 125.0, 102.0, 58.0, 61.0, 33.0, 32.0, 24.0, 16.0, 9.0, 9.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52587890625, -0.5066299438476562, -0.4873809814453125, -0.46813201904296875, -0.448883056640625, -0.42963409423828125, -0.4103851318359375, -0.39113616943359375, -0.37188720703125, -0.35263824462890625, -0.3333892822265625, -0.31414031982421875, -0.294891357421875, -0.27564239501953125, -0.2563934326171875, -0.23714447021484375, -0.2178955078125, -0.19864654541015625, -0.1793975830078125, -0.16014862060546875, -0.140899658203125, -0.12165069580078125, -0.1024017333984375, -0.08315277099609375, -0.06390380859375, -0.04465484619140625, -0.0254058837890625, -0.00615692138671875, 0.013092041015625, 0.03234100341796875, 0.0515899658203125, 0.07083892822265625, 0.090087890625, 0.10933685302734375, 0.1285858154296875, 0.14783477783203125, 0.167083740234375, 0.18633270263671875, 0.2055816650390625, 0.22483062744140625, 0.24407958984375, 0.26332855224609375, 0.2825775146484375, 0.30182647705078125, 0.321075439453125, 0.34032440185546875, 0.3595733642578125, 0.37882232666015625, 0.3980712890625, 0.41732025146484375, 0.4365692138671875, 0.45581817626953125, 0.475067138671875, 0.49431610107421875, 0.5135650634765625, 0.5328140258789062, 0.55206298828125, 0.5713119506835938, 0.5905609130859375, 0.6098098754882812, 0.629058837890625, 0.6483078002929688, 0.6675567626953125, 0.6868057250976562, 0.7060546875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 8.0, 4.0, 10.0, 8.0, 12.0, 13.0, 11.0, 20.0, 21.0, 16.0, 21.0, 18.0, 35.0, 33.0, 29.0, 29.0, 41.0, 44.0, 31.0, 42.0, 48.0, 58.0, 25.0, 55.0, 41.0, 37.0, 33.0, 40.0, 35.0, 28.0, 25.0, 20.0, 9.0, 15.0, 18.0, 17.0, 16.0, 10.0, 5.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.275390625, -1.23309326171875, -1.1907958984375, -1.14849853515625, -1.106201171875, -1.06390380859375, -1.0216064453125, -0.97930908203125, -0.93701171875, -0.89471435546875, -0.8524169921875, -0.81011962890625, -0.767822265625, -0.72552490234375, -0.6832275390625, -0.64093017578125, -0.5986328125, -0.55633544921875, -0.5140380859375, -0.47174072265625, -0.429443359375, -0.38714599609375, -0.3448486328125, -0.30255126953125, -0.26025390625, -0.21795654296875, -0.1756591796875, -0.13336181640625, -0.091064453125, -0.04876708984375, -0.0064697265625, 0.03582763671875, 0.078125, 0.12042236328125, 0.1627197265625, 0.20501708984375, 0.247314453125, 0.28961181640625, 0.3319091796875, 0.37420654296875, 0.41650390625, 0.45880126953125, 0.5010986328125, 0.54339599609375, 0.585693359375, 0.62799072265625, 0.6702880859375, 0.71258544921875, 0.7548828125, 0.79718017578125, 0.8394775390625, 0.88177490234375, 0.924072265625, 0.96636962890625, 1.0086669921875, 1.05096435546875, 1.09326171875, 1.13555908203125, 1.1778564453125, 1.22015380859375, 1.262451171875, 1.30474853515625, 1.3470458984375, 1.38934326171875, 1.431640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 1.0, 6.0, 14.0, 14.0, 23.0, 43.0, 69.0, 147.0, 314.0, 973.0, 3963.0, 29364.0, 678912.0, 313845.0, 16893.0, 2706.0, 759.0, 240.0, 108.0, 65.0, 26.0, 25.0, 11.0, 12.0, 6.0, 7.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4677734375, -0.45574188232421875, -0.4437103271484375, -0.43167877197265625, -0.419647216796875, -0.40761566162109375, -0.3955841064453125, -0.38355255126953125, -0.37152099609375, -0.35948944091796875, -0.3474578857421875, -0.33542633056640625, -0.323394775390625, -0.31136322021484375, -0.2993316650390625, -0.28730010986328125, -0.2752685546875, -0.26323699951171875, -0.2512054443359375, -0.23917388916015625, -0.227142333984375, -0.21511077880859375, -0.2030792236328125, -0.19104766845703125, -0.17901611328125, -0.16698455810546875, -0.1549530029296875, -0.14292144775390625, -0.130889892578125, -0.11885833740234375, -0.1068267822265625, -0.09479522705078125, -0.082763671875, -0.07073211669921875, -0.0587005615234375, -0.04666900634765625, -0.034637451171875, -0.02260589599609375, -0.0105743408203125, 0.00145721435546875, 0.01348876953125, 0.02552032470703125, 0.0375518798828125, 0.04958343505859375, 0.061614990234375, 0.07364654541015625, 0.0856781005859375, 0.09770965576171875, 0.1097412109375, 0.12177276611328125, 0.1338043212890625, 0.14583587646484375, 0.157867431640625, 0.16989898681640625, 0.1819305419921875, 0.19396209716796875, 0.20599365234375, 0.21802520751953125, 0.2300567626953125, 0.24208831787109375, 0.254119873046875, 0.26615142822265625, 0.2781829833984375, 0.29021453857421875, 0.30224609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 10.0, 9.0, 25.0, 17.0, 26.0, 43.0, 50.0, 79.0, 108.0, 115.0, 126.0, 99.0, 80.0, 61.0, 32.0, 30.0, 21.0, 7.0, 17.0, 8.0, 8.0, 11.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.667043685913086e-05, -4.541035741567612e-05, -4.4150277972221375e-05, -4.289019852876663e-05, -4.163011908531189e-05, -4.037003964185715e-05, -3.9109960198402405e-05, -3.784988075494766e-05, -3.658980131149292e-05, -3.532972186803818e-05, -3.4069642424583435e-05, -3.280956298112869e-05, -3.154948353767395e-05, -3.0289404094219208e-05, -2.9029324650764465e-05, -2.7769245207309723e-05, -2.650916576385498e-05, -2.5249086320400238e-05, -2.3989006876945496e-05, -2.2728927433490753e-05, -2.146884799003601e-05, -2.020876854658127e-05, -1.8948689103126526e-05, -1.7688609659671783e-05, -1.642853021621704e-05, -1.5168450772762299e-05, -1.3908371329307556e-05, -1.2648291885852814e-05, -1.1388212442398071e-05, -1.0128132998943329e-05, -8.868053555488586e-06, -7.607974112033844e-06, -6.3478946685791016e-06, -5.087815225124359e-06, -3.827735781669617e-06, -2.5676563382148743e-06, -1.3075768947601318e-06, -4.7497451305389404e-08, 1.212581992149353e-06, 2.4726614356040955e-06, 3.732740879058838e-06, 4.99282032251358e-06, 6.252899765968323e-06, 7.512979209423065e-06, 8.773058652877808e-06, 1.003313809633255e-05, 1.1293217539787292e-05, 1.2553296983242035e-05, 1.3813376426696777e-05, 1.507345587015152e-05, 1.6333535313606262e-05, 1.7593614757061005e-05, 1.8853694200515747e-05, 2.011377364397049e-05, 2.1373853087425232e-05, 2.2633932530879974e-05, 2.3894011974334717e-05, 2.515409141778946e-05, 2.64141708612442e-05, 2.7674250304698944e-05, 2.8934329748153687e-05, 3.019440919160843e-05, 3.145448863506317e-05, 3.2714568078517914e-05, 3.3974647521972656e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 12.0, 19.0, 22.0, 41.0, 65.0, 160.0, 277.0, 747.0, 2101.0, 7615.0, 41751.0, 539244.0, 412549.0, 34117.0, 6601.0, 1938.0, 662.0, 291.0, 126.0, 80.0, 40.0, 27.0, 16.0, 15.0, 1.0, 7.0, 8.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.330810546875, -0.320770263671875, -0.31072998046875, -0.300689697265625, -0.2906494140625, -0.280609130859375, -0.27056884765625, -0.260528564453125, -0.25048828125, -0.240447998046875, -0.23040771484375, -0.220367431640625, -0.2103271484375, -0.200286865234375, -0.19024658203125, -0.180206298828125, -0.170166015625, -0.160125732421875, -0.15008544921875, -0.140045166015625, -0.1300048828125, -0.119964599609375, -0.10992431640625, -0.099884033203125, -0.08984375, -0.079803466796875, -0.06976318359375, -0.059722900390625, -0.0496826171875, -0.039642333984375, -0.02960205078125, -0.019561767578125, -0.009521484375, 0.000518798828125, 0.01055908203125, 0.020599365234375, 0.0306396484375, 0.040679931640625, 0.05072021484375, 0.060760498046875, 0.07080078125, 0.080841064453125, 0.09088134765625, 0.100921630859375, 0.1109619140625, 0.121002197265625, 0.13104248046875, 0.141082763671875, 0.151123046875, 0.161163330078125, 0.17120361328125, 0.181243896484375, 0.1912841796875, 0.201324462890625, 0.21136474609375, 0.221405029296875, 0.2314453125, 0.241485595703125, 0.25152587890625, 0.261566162109375, 0.2716064453125, 0.281646728515625, 0.29168701171875, 0.301727294921875, 0.311767578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 7.0, 7.0, 14.0, 17.0, 25.0, 38.0, 48.0, 89.0, 150.0, 207.0, 145.0, 81.0, 69.0, 37.0, 20.0, 11.0, 16.0, 11.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1806640625, -0.17457199096679688, -0.16847991943359375, -0.16238784790039062, -0.1562957763671875, -0.15020370483398438, -0.14411163330078125, -0.13801956176757812, -0.131927490234375, -0.12583541870117188, -0.11974334716796875, -0.11365127563476562, -0.1075592041015625, -0.10146713256835938, -0.09537506103515625, -0.08928298950195312, -0.08319091796875, -0.07709884643554688, -0.07100677490234375, -0.06491470336914062, -0.0588226318359375, -0.052730560302734375, -0.04663848876953125, -0.040546417236328125, -0.034454345703125, -0.028362274169921875, -0.02227020263671875, -0.016178131103515625, -0.0100860595703125, -0.003993988037109375, 0.00209808349609375, 0.008190155029296875, 0.0142822265625, 0.020374298095703125, 0.02646636962890625, 0.032558441162109375, 0.0386505126953125, 0.044742584228515625, 0.05083465576171875, 0.056926727294921875, 0.063018798828125, 0.06911087036132812, 0.07520294189453125, 0.08129501342773438, 0.0873870849609375, 0.09347915649414062, 0.09957122802734375, 0.10566329956054688, 0.11175537109375, 0.11784744262695312, 0.12393951416015625, 0.13003158569335938, 0.1361236572265625, 0.14221572875976562, 0.14830780029296875, 0.15439987182617188, 0.160491943359375, 0.16658401489257812, 0.17267608642578125, 0.17876815795898438, 0.1848602294921875, 0.19095230102539062, 0.19704437255859375, 0.20313644409179688, 0.209228515625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 15.0, 79.0, 546.0, 328.0, 29.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.42046546936035, -16.036869049072266, -15.653271675109863, -15.269674301147461, -14.886076927185059, -14.502479553222656, -14.11888313293457, -13.735285758972168, -13.351688385009766, -12.968091011047363, -12.584494590759277, -12.200897216796875, -11.817299842834473, -11.43370246887207, -11.050106048583984, -10.666508674621582, -10.28291130065918, -9.899313926696777, -9.515717506408691, -9.132120132446289, -8.748522758483887, -8.364925384521484, -7.981328964233398, -7.597731590270996, -7.21413516998291, -6.830538272857666, -6.446940898895264, -6.0633440017700195, -5.679746627807617, -5.296149730682373, -4.912552833557129, -4.528955459594727, -4.145358085632324, -3.761760950088501, -3.3781638145446777, -2.9945669174194336, -2.6109695434570312, -2.227372646331787, -1.8437755107879639, -1.4601783752441406, -1.0765812397003174, -0.6929841041564941, -0.3093870282173157, 0.07421004772186279, 0.45780718326568604, 0.8414043188095093, 1.225001335144043, 1.6085984706878662, 1.9921956062316895, 2.3757927417755127, 2.759389877319336, 3.14298677444458, 3.5265841484069824, 3.9101810455322266, 4.293778419494629, 4.677375316619873, 5.060972213745117, 5.444569110870361, 5.828166484832764, 6.211763381958008, 6.59536075592041, 6.978957653045654, 7.362554550170898, 7.746151924133301, 8.129749298095703]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 7.0, 12.0, 14.0, 13.0, 13.0, 18.0, 17.0, 20.0, 19.0, 21.0, 22.0, 31.0, 29.0, 41.0, 33.0, 34.0, 33.0, 44.0, 32.0, 55.0, 39.0, 38.0, 56.0, 40.0, 30.0, 26.0, 24.0, 30.0, 30.0, 26.0, 25.0, 18.0, 15.0, 11.0, 16.0, 13.0, 9.0, 11.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0689823627471924, -1.9918403625488281, -1.9146983623504639, -1.8375563621520996, -1.7604142427444458, -1.6832722425460815, -1.6061302423477173, -1.5289881229400635, -1.4518461227416992, -1.374704122543335, -1.2975621223449707, -1.2204201221466064, -1.1432780027389526, -1.0661360025405884, -0.9889940023422241, -0.9118519425392151, -0.8347100019454956, -0.7575680017471313, -0.6804259419441223, -0.6032839417457581, -0.526141881942749, -0.44899988174438477, -0.3718578815460205, -0.2947158217430115, -0.21757382154464722, -0.14043179154396057, -0.06328977644443512, 0.013852238655090332, 0.09099426865577698, 0.16813629865646362, 0.24527829885482788, 0.3224203586578369, 0.39956235885620117, 0.4767043888568878, 0.5538464188575745, 0.6309884190559387, 0.7081304788589478, 0.785272479057312, 0.8624144792556763, 0.9395565390586853, 1.0166985988616943, 1.0938405990600586, 1.1709825992584229, 1.248124599456787, 1.325266718864441, 1.4024087190628052, 1.4795507192611694, 1.5566928386688232, 1.633834719657898, 1.7109767198562622, 1.7881187200546265, 1.8652608394622803, 1.9424028396606445, 2.019544839859009, 2.096686840057373, 2.1738288402557373, 2.2509708404541016, 2.328112840652466, 2.40525484085083, 2.4823968410491943, 2.5595388412475586, 2.636681079864502, 2.713822841644287, 2.7909650802612305, 2.8681070804595947]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 12.0, 13.0, 17.0, 24.0, 49.0, 69.0, 101.0, 149.0, 238.0, 418.0, 705.0, 1372.0, 2789.0, 6349.0, 18186.0, 78595.0, 856899.0, 2967969.0, 210380.0, 32696.0, 9192.0, 3787.0, 1818.0, 989.0, 524.0, 322.0, 211.0, 127.0, 95.0, 54.0, 41.0, 29.0, 14.0, 15.0, 15.0, 7.0, 2.0, 4.0, 6.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98291015625, -0.9468307495117188, -0.9107513427734375, -0.8746719360351562, -0.838592529296875, -0.8025131225585938, -0.7664337158203125, -0.7303543090820312, -0.69427490234375, -0.6581954956054688, -0.6221160888671875, -0.5860366821289062, -0.549957275390625, -0.5138778686523438, -0.4777984619140625, -0.44171905517578125, -0.4056396484375, -0.36956024169921875, -0.3334808349609375, -0.29740142822265625, -0.261322021484375, -0.22524261474609375, -0.1891632080078125, -0.15308380126953125, -0.11700439453125, -0.08092498779296875, -0.0448455810546875, -0.00876617431640625, 0.027313232421875, 0.06339263916015625, 0.0994720458984375, 0.13555145263671875, 0.171630859375, 0.20771026611328125, 0.2437896728515625, 0.27986907958984375, 0.315948486328125, 0.35202789306640625, 0.3881072998046875, 0.42418670654296875, 0.46026611328125, 0.49634552001953125, 0.5324249267578125, 0.5685043334960938, 0.604583740234375, 0.6406631469726562, 0.6767425537109375, 0.7128219604492188, 0.7489013671875, 0.7849807739257812, 0.8210601806640625, 0.8571395874023438, 0.893218994140625, 0.9292984008789062, 0.9653778076171875, 1.0014572143554688, 1.03753662109375, 1.0736160278320312, 1.1096954345703125, 1.1457748413085938, 1.181854248046875, 1.2179336547851562, 1.2540130615234375, 1.2900924682617188, 1.326171875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 5.0, 7.0, 5.0, 10.0, 10.0, 13.0, 22.0, 19.0, 30.0, 56.0, 56.0, 60.0, 87.0, 53.0, 80.0, 87.0, 73.0, 57.0, 65.0, 43.0, 38.0, 30.0, 23.0, 17.0, 16.0, 9.0, 6.0, 7.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84814453125, -0.8165817260742188, -0.7850189208984375, -0.7534561157226562, -0.721893310546875, -0.6903305053710938, -0.6587677001953125, -0.6272048950195312, -0.59564208984375, -0.5640792846679688, -0.5325164794921875, -0.5009536743164062, -0.469390869140625, -0.43782806396484375, -0.4062652587890625, -0.37470245361328125, -0.3431396484375, -0.31157684326171875, -0.2800140380859375, -0.24845123291015625, -0.216888427734375, -0.18532562255859375, -0.1537628173828125, -0.12220001220703125, -0.09063720703125, -0.05907440185546875, -0.0275115966796875, 0.00405120849609375, 0.035614013671875, 0.06717681884765625, 0.0987396240234375, 0.13030242919921875, 0.161865234375, 0.19342803955078125, 0.2249908447265625, 0.25655364990234375, 0.288116455078125, 0.31967926025390625, 0.3512420654296875, 0.38280487060546875, 0.41436767578125, 0.44593048095703125, 0.4774932861328125, 0.5090560913085938, 0.540618896484375, 0.5721817016601562, 0.6037445068359375, 0.6353073120117188, 0.6668701171875, 0.6984329223632812, 0.7299957275390625, 0.7615585327148438, 0.793121337890625, 0.8246841430664062, 0.8562469482421875, 0.8878097534179688, 0.91937255859375, 0.9509353637695312, 0.9824981689453125, 1.0140609741210938, 1.045623779296875, 1.0771865844726562, 1.1087493896484375, 1.1403121948242188, 1.171875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 6.0, 5.0, 9.0, 18.0, 22.0, 42.0, 46.0, 62.0, 84.0, 133.0, 239.0, 410.0, 791.0, 1510.0, 3537.0, 10097.0, 40046.0, 353724.0, 3532304.0, 206696.0, 30159.0, 8313.0, 2979.0, 1355.0, 648.0, 351.0, 249.0, 131.0, 82.0, 57.0, 39.0, 42.0, 27.0, 15.0, 16.0, 5.0, 9.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1640625, -1.1269989013671875, -1.089935302734375, -1.0528717041015625, -1.01580810546875, -0.9787445068359375, -0.941680908203125, -0.9046173095703125, -0.8675537109375, -0.8304901123046875, -0.793426513671875, -0.7563629150390625, -0.71929931640625, -0.6822357177734375, -0.645172119140625, -0.6081085205078125, -0.571044921875, -0.5339813232421875, -0.496917724609375, -0.4598541259765625, -0.42279052734375, -0.3857269287109375, -0.348663330078125, -0.3115997314453125, -0.2745361328125, -0.2374725341796875, -0.200408935546875, -0.1633453369140625, -0.12628173828125, -0.0892181396484375, -0.052154541015625, -0.0150909423828125, 0.02197265625, 0.0590362548828125, 0.096099853515625, 0.1331634521484375, 0.17022705078125, 0.2072906494140625, 0.244354248046875, 0.2814178466796875, 0.3184814453125, 0.3555450439453125, 0.392608642578125, 0.4296722412109375, 0.46673583984375, 0.5037994384765625, 0.540863037109375, 0.5779266357421875, 0.614990234375, 0.6520538330078125, 0.689117431640625, 0.7261810302734375, 0.76324462890625, 0.8003082275390625, 0.837371826171875, 0.8744354248046875, 0.9114990234375, 0.9485626220703125, 0.985626220703125, 1.0226898193359375, 1.05975341796875, 1.0968170166015625, 1.133880615234375, 1.1709442138671875, 1.2080078125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 6.0, 7.0, 13.0, 14.0, 17.0, 27.0, 33.0, 38.0, 53.0, 108.0, 128.0, 258.0, 452.0, 792.0, 813.0, 508.0, 287.0, 179.0, 91.0, 63.0, 41.0, 36.0, 23.0, 17.0, 12.0, 16.0, 7.0, 4.0, 3.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.300537109375, -0.2905387878417969, -0.28054046630859375, -0.2705421447753906, -0.2605438232421875, -0.2505455017089844, -0.24054718017578125, -0.23054885864257812, -0.220550537109375, -0.21055221557617188, -0.20055389404296875, -0.19055557250976562, -0.1805572509765625, -0.17055892944335938, -0.16056060791015625, -0.15056228637695312, -0.14056396484375, -0.13056564331054688, -0.12056732177734375, -0.11056900024414062, -0.1005706787109375, -0.09057235717773438, -0.08057403564453125, -0.07057571411132812, -0.060577392578125, -0.050579071044921875, -0.04058074951171875, -0.030582427978515625, -0.0205841064453125, -0.010585784912109375, -0.00058746337890625, 0.009410858154296875, 0.0194091796875, 0.029407501220703125, 0.03940582275390625, 0.049404144287109375, 0.0594024658203125, 0.06940078735351562, 0.07939910888671875, 0.08939743041992188, 0.099395751953125, 0.10939407348632812, 0.11939239501953125, 0.12939071655273438, 0.1393890380859375, 0.14938735961914062, 0.15938568115234375, 0.16938400268554688, 0.17938232421875, 0.18938064575195312, 0.19937896728515625, 0.20937728881835938, 0.2193756103515625, 0.22937393188476562, 0.23937225341796875, 0.24937057495117188, 0.259368896484375, 0.2693672180175781, 0.27936553955078125, 0.2893638610839844, 0.2993621826171875, 0.3093605041503906, 0.31935882568359375, 0.3293571472167969, 0.33935546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 6.0, 10.0, 15.0, 36.0, 47.0, 88.0, 153.0, 189.0, 187.0, 141.0, 61.0, 30.0, 20.0, 4.0, 8.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.561295986175537, -1.4857509136199951, -1.4102059602737427, -1.3346608877182007, -1.2591159343719482, -1.1835708618164062, -1.1080257892608643, -1.0324807167053223, -0.9569357633590698, -0.8813907504081726, -0.8058457374572754, -0.7303006649017334, -0.6547556519508362, -0.579210638999939, -0.503665566444397, -0.42812055349349976, -0.35257554054260254, -0.2770305275917053, -0.20148548483848572, -0.1259404569864273, -0.050395429134368896, 0.02514958381652832, 0.10069462656974792, 0.17623966932296753, 0.25178468227386475, 0.32732969522476196, 0.40287473797798157, 0.47841978073120117, 0.5539647936820984, 0.6295098066329956, 0.7050548791885376, 0.7805998921394348, 0.856144905090332, 0.9316899180412292, 1.0072349309921265, 1.0827800035476685, 1.158324956893921, 1.233870029449463, 1.3094151020050049, 1.3849601745605469, 1.4605051279067993, 1.5360502004623413, 1.6115951538085938, 1.6871402263641357, 1.7626852989196777, 1.8382302522659302, 1.9137753248214722, 1.9893202781677246, 2.0648653507232666, 2.1404104232788086, 2.2159554958343506, 2.2915003299713135, 2.3670454025268555, 2.4425904750823975, 2.5181355476379395, 2.5936806201934814, 2.6692256927490234, 2.7447707653045654, 2.8203158378601074, 2.8958606719970703, 2.9714057445526123, 3.0469508171081543, 3.1224958896636963, 3.1980409622192383, 3.273585796356201]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 2.0, 4.0, 11.0, 13.0, 7.0, 21.0, 20.0, 24.0, 29.0, 35.0, 29.0, 46.0, 54.0, 53.0, 62.0, 70.0, 63.0, 66.0, 59.0, 54.0, 43.0, 45.0, 34.0, 29.0, 23.0, 18.0, 28.0, 13.0, 10.0, 10.0, 3.0, 6.0, 4.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7976272702217102, -0.7679049968719482, -0.7381827235221863, -0.7084604501724243, -0.6787381768226624, -0.6490159034729004, -0.6192936301231384, -0.5895713567733765, -0.5598490834236145, -0.5301268100738525, -0.5004045367240906, -0.4706822633743286, -0.44095999002456665, -0.4112377166748047, -0.3815154433250427, -0.35179316997528076, -0.3220708966255188, -0.29234862327575684, -0.2626263499259949, -0.2329040765762329, -0.20318180322647095, -0.17345952987670898, -0.14373725652694702, -0.11401498317718506, -0.0842927098274231, -0.05457043647766113, -0.02484816312789917, 0.004874110221862793, 0.034596383571624756, 0.06431865692138672, 0.09404093027114868, 0.12376320362091064, 0.15348541736602783, 0.1832076907157898, 0.21292996406555176, 0.24265223741531372, 0.2723745107650757, 0.30209678411483765, 0.3318190574645996, 0.3615413308143616, 0.39126360416412354, 0.4209858775138855, 0.45070815086364746, 0.4804304242134094, 0.5101526975631714, 0.5398749709129333, 0.5695972442626953, 0.5993195176124573, 0.6290417909622192, 0.6587640643119812, 0.6884863376617432, 0.7182086110115051, 0.7479308843612671, 0.777653157711029, 0.807375431060791, 0.837097704410553, 0.8668199777603149, 0.8965422511100769, 0.9262645244598389, 0.9559867978096008, 0.9857090711593628, 1.0154314041137695, 1.0451536178588867, 1.074875831604004, 1.1045981645584106]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 6.0, 5.0, 2.0, 11.0, 18.0, 23.0, 18.0, 42.0, 63.0, 79.0, 124.0, 191.0, 318.0, 581.0, 1136.0, 2195.0, 4808.0, 12682.0, 40908.0, 173885.0, 501504.0, 230991.0, 52189.0, 15415.0, 5847.0, 2618.0, 1288.0, 650.0, 336.0, 203.0, 157.0, 75.0, 50.0, 30.0, 31.0, 23.0, 18.0, 9.0, 10.0, 1.0, 7.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1314697265625, -0.12717247009277344, -0.12287521362304688, -0.11857795715332031, -0.11428070068359375, -0.10998344421386719, -0.10568618774414062, -0.10138893127441406, -0.0970916748046875, -0.09279441833496094, -0.08849716186523438, -0.08419990539550781, -0.07990264892578125, -0.07560539245605469, -0.07130813598632812, -0.06701087951660156, -0.062713623046875, -0.05841636657714844, -0.054119110107421875, -0.04982185363769531, -0.04552459716796875, -0.04122734069824219, -0.036930084228515625, -0.03263282775878906, -0.0283355712890625, -0.024038314819335938, -0.019741058349609375, -0.015443801879882812, -0.01114654541015625, -0.0068492889404296875, -0.002552032470703125, 0.0017452239990234375, 0.00604248046875, 0.010339736938476562, 0.014636993408203125, 0.018934249877929688, 0.02323150634765625, 0.027528762817382812, 0.031826019287109375, 0.03612327575683594, 0.0404205322265625, 0.04471778869628906, 0.049015045166015625, 0.05331230163574219, 0.05760955810546875, 0.06190681457519531, 0.06620407104492188, 0.07050132751464844, 0.074798583984375, 0.07909584045410156, 0.08339309692382812, 0.08769035339355469, 0.09198760986328125, 0.09628486633300781, 0.10058212280273438, 0.10487937927246094, 0.1091766357421875, 0.11347389221191406, 0.11777114868164062, 0.12206840515136719, 0.12636566162109375, 0.1306629180908203, 0.13496017456054688, 0.13925743103027344, 0.1435546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 4.0, 3.0, 10.0, 8.0, 7.0, 12.0, 18.0, 20.0, 21.0, 39.0, 26.0, 37.0, 46.0, 58.0, 75.0, 60.0, 74.0, 54.0, 57.0, 60.0, 61.0, 44.0, 38.0, 35.0, 28.0, 21.0, 15.0, 19.0, 12.0, 5.0, 9.0, 6.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.6163177490234375, -0.594940185546875, -0.5735626220703125, -0.55218505859375, -0.5308074951171875, -0.509429931640625, -0.4880523681640625, -0.4666748046875, -0.4452972412109375, -0.423919677734375, -0.4025421142578125, -0.38116455078125, -0.3597869873046875, -0.338409423828125, -0.3170318603515625, -0.295654296875, -0.2742767333984375, -0.252899169921875, -0.2315216064453125, -0.21014404296875, -0.1887664794921875, -0.167388916015625, -0.1460113525390625, -0.1246337890625, -0.1032562255859375, -0.081878662109375, -0.0605010986328125, -0.03912353515625, -0.0177459716796875, 0.003631591796875, 0.0250091552734375, 0.04638671875, 0.0677642822265625, 0.089141845703125, 0.1105194091796875, 0.13189697265625, 0.1532745361328125, 0.174652099609375, 0.1960296630859375, 0.2174072265625, 0.2387847900390625, 0.260162353515625, 0.2815399169921875, 0.30291748046875, 0.3242950439453125, 0.345672607421875, 0.3670501708984375, 0.388427734375, 0.4098052978515625, 0.431182861328125, 0.4525604248046875, 0.47393798828125, 0.4953155517578125, 0.516693115234375, 0.5380706787109375, 0.5594482421875, 0.5808258056640625, 0.602203369140625, 0.6235809326171875, 0.64495849609375, 0.6663360595703125, 0.687713623046875, 0.7090911865234375, 0.73046875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 6.0, 6.0, 9.0, 14.0, 26.0, 21.0, 58.0, 83.0, 161.0, 302.0, 652.0, 1492.0, 4153.0, 16195.0, 119246.0, 648013.0, 222932.0, 26196.0, 5469.0, 1849.0, 808.0, 372.0, 199.0, 105.0, 69.0, 34.0, 17.0, 16.0, 6.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.16162109375, -0.15616798400878906, -0.15071487426757812, -0.1452617645263672, -0.13980865478515625, -0.1343555450439453, -0.12890243530273438, -0.12344932556152344, -0.1179962158203125, -0.11254310607910156, -0.10708999633789062, -0.10163688659667969, -0.09618377685546875, -0.09073066711425781, -0.08527755737304688, -0.07982444763183594, -0.074371337890625, -0.06891822814941406, -0.06346511840820312, -0.05801200866699219, -0.05255889892578125, -0.04710578918457031, -0.041652679443359375, -0.03619956970214844, -0.0307464599609375, -0.025293350219726562, -0.019840240478515625, -0.014387130737304688, -0.00893402099609375, -0.0034809112548828125, 0.001972198486328125, 0.0074253082275390625, 0.01287841796875, 0.018331527709960938, 0.023784637451171875, 0.029237747192382812, 0.03469085693359375, 0.04014396667480469, 0.045597076416015625, 0.05105018615722656, 0.0565032958984375, 0.06195640563964844, 0.06740951538085938, 0.07286262512207031, 0.07831573486328125, 0.08376884460449219, 0.08922195434570312, 0.09467506408691406, 0.100128173828125, 0.10558128356933594, 0.11103439331054688, 0.11648750305175781, 0.12194061279296875, 0.1273937225341797, 0.13284683227539062, 0.13829994201660156, 0.1437530517578125, 0.14920616149902344, 0.15465927124023438, 0.1601123809814453, 0.16556549072265625, 0.1710186004638672, 0.17647171020507812, 0.18192481994628906, 0.1873779296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 5.0, 9.0, 8.0, 10.0, 11.0, 8.0, 25.0, 22.0, 28.0, 23.0, 34.0, 32.0, 30.0, 44.0, 48.0, 48.0, 45.0, 58.0, 49.0, 50.0, 44.0, 42.0, 37.0, 31.0, 41.0, 22.0, 30.0, 20.0, 23.0, 20.0, 17.0, 14.0, 11.0, 14.0, 13.0, 4.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.083984375, -1.0517654418945312, -1.0195465087890625, -0.9873275756835938, -0.955108642578125, -0.9228897094726562, -0.8906707763671875, -0.8584518432617188, -0.82623291015625, -0.7940139770507812, -0.7617950439453125, -0.7295761108398438, -0.697357177734375, -0.6651382446289062, -0.6329193115234375, -0.6007003784179688, -0.5684814453125, -0.5362625122070312, -0.5040435791015625, -0.47182464599609375, -0.439605712890625, -0.40738677978515625, -0.3751678466796875, -0.34294891357421875, -0.31072998046875, -0.27851104736328125, -0.2462921142578125, -0.21407318115234375, -0.181854248046875, -0.14963531494140625, -0.1174163818359375, -0.08519744873046875, -0.052978515625, -0.02075958251953125, 0.0114593505859375, 0.04367828369140625, 0.075897216796875, 0.10811614990234375, 0.1403350830078125, 0.17255401611328125, 0.20477294921875, 0.23699188232421875, 0.2692108154296875, 0.30142974853515625, 0.333648681640625, 0.36586761474609375, 0.3980865478515625, 0.43030548095703125, 0.4625244140625, 0.49474334716796875, 0.5269622802734375, 0.5591812133789062, 0.591400146484375, 0.6236190795898438, 0.6558380126953125, 0.6880569458007812, 0.72027587890625, 0.7524948120117188, 0.7847137451171875, 0.8169326782226562, 0.849151611328125, 0.8813705444335938, 0.9135894775390625, 0.9458084106445312, 0.97802734375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 6.0, 9.0, 14.0, 25.0, 44.0, 63.0, 102.0, 226.0, 446.0, 1165.0, 3842.0, 20299.0, 232999.0, 713769.0, 63497.0, 8503.0, 2095.0, 742.0, 308.0, 164.0, 96.0, 52.0, 35.0, 24.0, 13.0, 10.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0673828125, -0.06499862670898438, -0.06261444091796875, -0.060230255126953125, -0.0578460693359375, -0.055461883544921875, -0.05307769775390625, -0.050693511962890625, -0.048309326171875, -0.045925140380859375, -0.04354095458984375, -0.041156768798828125, -0.0387725830078125, -0.036388397216796875, -0.03400421142578125, -0.031620025634765625, -0.02923583984375, -0.026851654052734375, -0.02446746826171875, -0.022083282470703125, -0.0196990966796875, -0.017314910888671875, -0.01493072509765625, -0.012546539306640625, -0.010162353515625, -0.007778167724609375, -0.00539398193359375, -0.003009796142578125, -0.0006256103515625, 0.001758575439453125, 0.00414276123046875, 0.006526947021484375, 0.0089111328125, 0.011295318603515625, 0.01367950439453125, 0.016063690185546875, 0.0184478759765625, 0.020832061767578125, 0.02321624755859375, 0.025600433349609375, 0.027984619140625, 0.030368804931640625, 0.03275299072265625, 0.035137176513671875, 0.0375213623046875, 0.039905548095703125, 0.04228973388671875, 0.044673919677734375, 0.04705810546875, 0.049442291259765625, 0.05182647705078125, 0.054210662841796875, 0.0565948486328125, 0.058979034423828125, 0.06136322021484375, 0.06374740600585938, 0.066131591796875, 0.06851577758789062, 0.07089996337890625, 0.07328414916992188, 0.0756683349609375, 0.07805252075195312, 0.08043670654296875, 0.08282089233398438, 0.085205078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 4.0, 11.0, 10.0, 8.0, 25.0, 27.0, 40.0, 58.0, 81.0, 98.0, 113.0, 107.0, 106.0, 87.0, 57.0, 42.0, 39.0, 25.0, 17.0, 15.0, 14.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0471553802490234e-05, -3.9381906390190125e-05, -3.8292258977890015e-05, -3.7202611565589905e-05, -3.6112964153289795e-05, -3.5023316740989685e-05, -3.3933669328689575e-05, -3.2844021916389465e-05, -3.1754374504089355e-05, -3.0664727091789246e-05, -2.9575079679489136e-05, -2.8485432267189026e-05, -2.7395784854888916e-05, -2.6306137442588806e-05, -2.5216490030288696e-05, -2.4126842617988586e-05, -2.3037195205688477e-05, -2.1947547793388367e-05, -2.0857900381088257e-05, -1.9768252968788147e-05, -1.8678605556488037e-05, -1.7588958144187927e-05, -1.6499310731887817e-05, -1.5409663319587708e-05, -1.4320015907287598e-05, -1.3230368494987488e-05, -1.2140721082687378e-05, -1.1051073670387268e-05, -9.961426258087158e-06, -8.871778845787048e-06, -7.782131433486938e-06, -6.692484021186829e-06, -5.602836608886719e-06, -4.513189196586609e-06, -3.423541784286499e-06, -2.333894371986389e-06, -1.2442469596862793e-06, -1.5459954738616943e-07, 9.350478649139404e-07, 2.0246952772140503e-06, 3.11434268951416e-06, 4.20399010181427e-06, 5.29363751411438e-06, 6.38328492641449e-06, 7.4729323387146e-06, 8.56257975101471e-06, 9.65222716331482e-06, 1.074187457561493e-05, 1.1831521987915039e-05, 1.2921169400215149e-05, 1.4010816812515259e-05, 1.5100464224815369e-05, 1.619011163711548e-05, 1.727975904941559e-05, 1.8369406461715698e-05, 1.9459053874015808e-05, 2.0548701286315918e-05, 2.1638348698616028e-05, 2.2727996110916138e-05, 2.3817643523216248e-05, 2.4907290935516357e-05, 2.5996938347816467e-05, 2.7086585760116577e-05, 2.8176233172416687e-05, 2.9265880584716797e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 9.0, 14.0, 20.0, 40.0, 47.0, 74.0, 102.0, 184.0, 290.0, 423.0, 814.0, 1830.0, 4004.0, 11207.0, 40763.0, 233845.0, 589320.0, 125827.0, 25613.0, 7917.0, 3038.0, 1457.0, 690.0, 386.0, 231.0, 127.0, 76.0, 50.0, 35.0, 26.0, 21.0, 21.0, 8.0, 12.0, 11.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.055511474609375, -0.05384635925292969, -0.052181243896484375, -0.05051612854003906, -0.04885101318359375, -0.04718589782714844, -0.045520782470703125, -0.04385566711425781, -0.0421905517578125, -0.04052543640136719, -0.038860321044921875, -0.03719520568847656, -0.03553009033203125, -0.03386497497558594, -0.032199859619140625, -0.030534744262695312, -0.02886962890625, -0.027204513549804688, -0.025539398193359375, -0.023874282836914062, -0.02220916748046875, -0.020544052124023438, -0.018878936767578125, -0.017213821411132812, -0.0155487060546875, -0.013883590698242188, -0.012218475341796875, -0.010553359985351562, -0.00888824462890625, -0.0072231292724609375, -0.005558013916015625, -0.0038928985595703125, -0.002227783203125, -0.0005626678466796875, 0.001102447509765625, 0.0027675628662109375, 0.00443267822265625, 0.0060977935791015625, 0.007762908935546875, 0.009428024291992188, 0.0110931396484375, 0.012758255004882812, 0.014423370361328125, 0.016088485717773438, 0.01775360107421875, 0.019418716430664062, 0.021083831787109375, 0.022748947143554688, 0.0244140625, 0.026079177856445312, 0.027744293212890625, 0.029409408569335938, 0.03107452392578125, 0.03273963928222656, 0.034404754638671875, 0.03606986999511719, 0.0377349853515625, 0.03940010070800781, 0.041065216064453125, 0.04273033142089844, 0.04439544677734375, 0.04606056213378906, 0.047725677490234375, 0.04939079284667969, 0.051055908203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 9.0, 4.0, 7.0, 4.0, 17.0, 14.0, 29.0, 32.0, 40.0, 43.0, 65.0, 81.0, 88.0, 101.0, 88.0, 91.0, 67.0, 51.0, 40.0, 23.0, 22.0, 23.0, 16.0, 10.0, 4.0, 7.0, 6.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.010650634765625, -0.010300517082214355, -0.009950399398803711, -0.009600281715393066, -0.009250164031982422, -0.008900046348571777, -0.008549928665161133, -0.008199810981750488, -0.007849693298339844, -0.007499575614929199, -0.007149457931518555, -0.00679934024810791, -0.006449222564697266, -0.006099104881286621, -0.0057489871978759766, -0.005398869514465332, -0.0050487518310546875, -0.004698634147644043, -0.0043485164642333984, -0.003998398780822754, -0.0036482810974121094, -0.003298163414001465, -0.0029480457305908203, -0.0025979280471801758, -0.0022478103637695312, -0.0018976926803588867, -0.0015475749969482422, -0.0011974573135375977, -0.0008473396301269531, -0.0004972219467163086, -0.00014710426330566406, 0.00020301342010498047, 0.000553131103515625, 0.0009032487869262695, 0.001253366470336914, 0.0016034841537475586, 0.001953601837158203, 0.0023037195205688477, 0.002653837203979492, 0.0030039548873901367, 0.0033540725708007812, 0.0037041902542114258, 0.00405430793762207, 0.004404425621032715, 0.004754543304443359, 0.005104660987854004, 0.0054547786712646484, 0.005804896354675293, 0.0061550140380859375, 0.006505131721496582, 0.0068552494049072266, 0.007205367088317871, 0.007555484771728516, 0.00790560245513916, 0.008255720138549805, 0.00860583782196045, 0.008955955505371094, 0.009306073188781738, 0.009656190872192383, 0.010006308555603027, 0.010356426239013672, 0.010706543922424316, 0.011056661605834961, 0.011406779289245605, 0.01175689697265625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 10.0, 19.0, 38.0, 57.0, 123.0, 198.0, 232.0, 177.0, 78.0, 37.0, 14.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3662750720977783, -1.3071032762527466, -1.2479315996170044, -1.1887598037719727, -1.1295881271362305, -1.0704163312911987, -1.0112446546554565, -0.9520728588104248, -0.8929011821746826, -0.8337294459342957, -0.7745577096939087, -0.7153859734535217, -0.6562142372131348, -0.597042441368103, -0.5378707647323608, -0.4786989986896515, -0.41952723264694214, -0.3603554964065552, -0.3011837601661682, -0.24201200902462006, -0.1828402727842331, -0.12366852164268494, -0.06449678540229797, -0.005325049161911011, 0.05384668707847595, 0.11301842331886292, 0.17219015955924988, 0.23136191070079803, 0.2905336618423462, 0.34970539808273315, 0.4088771343231201, 0.4680488705635071, 0.527220606803894, 0.586392343044281, 0.645564079284668, 0.7047358155250549, 0.7639075517654419, 0.8230793476104736, 0.8822510242462158, 0.9414228200912476, 1.0005944967269897, 1.0597662925720215, 1.1189379692077637, 1.1781097650527954, 1.2372814416885376, 1.2964532375335693, 1.3556249141693115, 1.4147967100143433, 1.473968505859375, 1.5331403017044067, 1.592311978340149, 1.6514837741851807, 1.7106554508209229, 1.7698272466659546, 1.8289989233016968, 1.8881707191467285, 1.9473423957824707, 2.006514072418213, 2.065685987472534, 2.1248576641082764, 2.1840293407440186, 2.2432010173797607, 2.302372932434082, 2.361544609069824, 2.4207162857055664]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 7.0, 4.0, 9.0, 8.0, 10.0, 14.0, 19.0, 30.0, 23.0, 35.0, 33.0, 52.0, 58.0, 69.0, 65.0, 74.0, 83.0, 69.0, 56.0, 58.0, 46.0, 40.0, 25.0, 28.0, 20.0, 25.0, 10.0, 7.0, 5.0, 9.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5985667705535889, -0.5761913657188416, -0.5538159608840942, -0.5314406156539917, -0.5090652108192444, -0.48668980598449707, -0.46431440114974976, -0.44193899631500244, -0.4195636212825775, -0.3971882164478302, -0.3748128414154053, -0.35243743658065796, -0.33006203174591064, -0.3076866567134857, -0.2853112518787384, -0.2629358768463135, -0.24056047201156616, -0.21818508207798004, -0.19580969214439392, -0.1734342873096466, -0.15105889737606049, -0.12868350744247437, -0.10630810260772705, -0.08393271267414093, -0.06155732274055481, -0.03918192908167839, -0.01680653542280197, 0.005568861961364746, 0.027944251894950867, 0.05031964182853699, 0.0726950466632843, 0.09507043659687042, 0.11744576692581177, 0.1398211568593979, 0.162196546792984, 0.18457195162773132, 0.20694734156131744, 0.22932273149490356, 0.2516981363296509, 0.2740735411643982, 0.2964489161968231, 0.31882432103157043, 0.34119969606399536, 0.3635751008987427, 0.38595050573349, 0.4083258807659149, 0.43070128560066223, 0.45307666063308716, 0.4754520654678345, 0.4978274703025818, 0.5202028751373291, 0.5425782203674316, 0.564953625202179, 0.5873290300369263, 0.6097044348716736, 0.6320798397064209, 0.6544551849365234, 0.6768305897712708, 0.6992059946060181, 0.7215813398361206, 0.7439567446708679, 0.7663321495056152, 0.7887075543403625, 0.8110829591751099, 0.8334583640098572]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 11.0, 10.0, 13.0, 11.0, 13.0, 35.0, 39.0, 51.0, 73.0, 110.0, 148.0, 222.0, 344.0, 471.0, 691.0, 1073.0, 1647.0, 2770.0, 4502.0, 7784.0, 14079.0, 28109.0, 62039.0, 189781.0, 488001.0, 141223.0, 51253.0, 23915.0, 12361.0, 6816.0, 3939.0, 2433.0, 1556.0, 927.0, 632.0, 440.0, 311.0, 220.0, 135.0, 98.0, 73.0, 59.0, 38.0, 28.0, 26.0, 14.0, 9.0, 4.0, 12.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.38134765625, -0.36992645263671875, -0.3585052490234375, -0.34708404541015625, -0.335662841796875, -0.32424163818359375, -0.3128204345703125, -0.30139923095703125, -0.28997802734375, -0.27855682373046875, -0.2671356201171875, -0.25571441650390625, -0.244293212890625, -0.23287200927734375, -0.2214508056640625, -0.21002960205078125, -0.1986083984375, -0.18718719482421875, -0.1757659912109375, -0.16434478759765625, -0.152923583984375, -0.14150238037109375, -0.1300811767578125, -0.11865997314453125, -0.10723876953125, -0.09581756591796875, -0.0843963623046875, -0.07297515869140625, -0.061553955078125, -0.05013275146484375, -0.0387115478515625, -0.02729034423828125, -0.015869140625, -0.00444793701171875, 0.0069732666015625, 0.01839447021484375, 0.029815673828125, 0.04123687744140625, 0.0526580810546875, 0.06407928466796875, 0.07550048828125, 0.08692169189453125, 0.0983428955078125, 0.10976409912109375, 0.121185302734375, 0.13260650634765625, 0.1440277099609375, 0.15544891357421875, 0.1668701171875, 0.17829132080078125, 0.1897125244140625, 0.20113372802734375, 0.212554931640625, 0.22397613525390625, 0.2353973388671875, 0.24681854248046875, 0.25823974609375, 0.26966094970703125, 0.2810821533203125, 0.29250335693359375, 0.303924560546875, 0.31534576416015625, 0.3267669677734375, 0.33818817138671875, 0.349609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 4.0, 7.0, 7.0, 8.0, 9.0, 13.0, 29.0, 36.0, 34.0, 44.0, 57.0, 74.0, 69.0, 84.0, 74.0, 77.0, 81.0, 63.0, 38.0, 43.0, 35.0, 26.0, 23.0, 17.0, 12.0, 11.0, 10.0, 5.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3740234375, -1.3219451904296875, -1.269866943359375, -1.2177886962890625, -1.16571044921875, -1.1136322021484375, -1.061553955078125, -1.0094757080078125, -0.9573974609375, -0.9053192138671875, -0.853240966796875, -0.8011627197265625, -0.74908447265625, -0.6970062255859375, -0.644927978515625, -0.5928497314453125, -0.540771484375, -0.4886932373046875, -0.436614990234375, -0.3845367431640625, -0.33245849609375, -0.2803802490234375, -0.228302001953125, -0.1762237548828125, -0.1241455078125, -0.0720672607421875, -0.019989013671875, 0.0320892333984375, 0.08416748046875, 0.1362457275390625, 0.188323974609375, 0.2404022216796875, 0.29248046875, 0.3445587158203125, 0.396636962890625, 0.4487152099609375, 0.50079345703125, 0.5528717041015625, 0.604949951171875, 0.6570281982421875, 0.7091064453125, 0.7611846923828125, 0.813262939453125, 0.8653411865234375, 0.91741943359375, 0.9694976806640625, 1.021575927734375, 1.0736541748046875, 1.125732421875, 1.1778106689453125, 1.229888916015625, 1.2819671630859375, 1.33404541015625, 1.3861236572265625, 1.438201904296875, 1.4902801513671875, 1.5423583984375, 1.5944366455078125, 1.646514892578125, 1.6985931396484375, 1.75067138671875, 1.8027496337890625, 1.854827880859375, 1.9069061279296875, 1.958984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 9.0, 13.0, 11.0, 25.0, 33.0, 31.0, 54.0, 94.0, 100.0, 138.0, 245.0, 426.0, 903.0, 2437.0, 7269.0, 31462.0, 288701.0, 646878.0, 53252.0, 10729.0, 3216.0, 1204.0, 535.0, 262.0, 144.0, 112.0, 79.0, 56.0, 29.0, 23.0, 16.0, 21.0, 7.0, 11.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71337890625, -0.6911849975585938, -0.6689910888671875, -0.6467971801757812, -0.624603271484375, -0.6024093627929688, -0.5802154541015625, -0.5580215454101562, -0.53582763671875, -0.5136337280273438, -0.4914398193359375, -0.46924591064453125, -0.447052001953125, -0.42485809326171875, -0.4026641845703125, -0.38047027587890625, -0.3582763671875, -0.33608245849609375, -0.3138885498046875, -0.29169464111328125, -0.269500732421875, -0.24730682373046875, -0.2251129150390625, -0.20291900634765625, -0.18072509765625, -0.15853118896484375, -0.1363372802734375, -0.11414337158203125, -0.091949462890625, -0.06975555419921875, -0.0475616455078125, -0.02536773681640625, -0.003173828125, 0.01902008056640625, 0.0412139892578125, 0.06340789794921875, 0.085601806640625, 0.10779571533203125, 0.1299896240234375, 0.15218353271484375, 0.17437744140625, 0.19657135009765625, 0.2187652587890625, 0.24095916748046875, 0.263153076171875, 0.28534698486328125, 0.3075408935546875, 0.32973480224609375, 0.3519287109375, 0.37412261962890625, 0.3963165283203125, 0.41851043701171875, 0.440704345703125, 0.46289825439453125, 0.4850921630859375, 0.5072860717773438, 0.52947998046875, 0.5516738891601562, 0.5738677978515625, 0.5960617065429688, 0.618255615234375, 0.6404495239257812, 0.6626434326171875, 0.6848373413085938, 0.70703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 2.0, 2.0, 10.0, 10.0, 18.0, 10.0, 17.0, 23.0, 28.0, 23.0, 21.0, 32.0, 21.0, 33.0, 42.0, 38.0, 57.0, 39.0, 47.0, 53.0, 49.0, 50.0, 36.0, 66.0, 43.0, 31.0, 35.0, 29.0, 19.0, 24.0, 16.0, 20.0, 19.0, 12.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5048828125, -1.4585723876953125, -1.412261962890625, -1.3659515380859375, -1.31964111328125, -1.2733306884765625, -1.227020263671875, -1.1807098388671875, -1.1343994140625, -1.0880889892578125, -1.041778564453125, -0.9954681396484375, -0.94915771484375, -0.9028472900390625, -0.856536865234375, -0.8102264404296875, -0.763916015625, -0.7176055908203125, -0.671295166015625, -0.6249847412109375, -0.57867431640625, -0.5323638916015625, -0.486053466796875, -0.4397430419921875, -0.3934326171875, -0.3471221923828125, -0.300811767578125, -0.2545013427734375, -0.20819091796875, -0.1618804931640625, -0.115570068359375, -0.0692596435546875, -0.02294921875, 0.0233612060546875, 0.069671630859375, 0.1159820556640625, 0.16229248046875, 0.2086029052734375, 0.254913330078125, 0.3012237548828125, 0.3475341796875, 0.3938446044921875, 0.440155029296875, 0.4864654541015625, 0.53277587890625, 0.5790863037109375, 0.625396728515625, 0.6717071533203125, 0.718017578125, 0.7643280029296875, 0.810638427734375, 0.8569488525390625, 0.90325927734375, 0.9495697021484375, 0.995880126953125, 1.0421905517578125, 1.0885009765625, 1.1348114013671875, 1.181121826171875, 1.2274322509765625, 1.27374267578125, 1.3200531005859375, 1.366363525390625, 1.4126739501953125, 1.458984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 7.0, 12.0, 16.0, 17.0, 26.0, 40.0, 49.0, 135.0, 193.0, 450.0, 1161.0, 3894.0, 18641.0, 259349.0, 724582.0, 31863.0, 5509.0, 1510.0, 535.0, 247.0, 118.0, 72.0, 34.0, 23.0, 16.0, 13.0, 10.0, 5.0, 6.0, 8.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.422119140625, -0.4085578918457031, -0.39499664306640625, -0.3814353942871094, -0.3678741455078125, -0.3543128967285156, -0.34075164794921875, -0.3271903991699219, -0.313629150390625, -0.3000679016113281, -0.28650665283203125, -0.2729454040527344, -0.2593841552734375, -0.24582290649414062, -0.23226165771484375, -0.21870040893554688, -0.20513916015625, -0.19157791137695312, -0.17801666259765625, -0.16445541381835938, -0.1508941650390625, -0.13733291625976562, -0.12377166748046875, -0.11021041870117188, -0.096649169921875, -0.08308792114257812, -0.06952667236328125, -0.055965423583984375, -0.0424041748046875, -0.028842926025390625, -0.01528167724609375, -0.001720428466796875, 0.0118408203125, 0.025402069091796875, 0.03896331787109375, 0.052524566650390625, 0.0660858154296875, 0.07964706420898438, 0.09320831298828125, 0.10676956176757812, 0.120330810546875, 0.13389205932617188, 0.14745330810546875, 0.16101455688476562, 0.1745758056640625, 0.18813705444335938, 0.20169830322265625, 0.21525955200195312, 0.22882080078125, 0.24238204956054688, 0.25594329833984375, 0.2695045471191406, 0.2830657958984375, 0.2966270446777344, 0.31018829345703125, 0.3237495422363281, 0.337310791015625, 0.3508720397949219, 0.36443328857421875, 0.3779945373535156, 0.3915557861328125, 0.4051170349121094, 0.41867828369140625, 0.4322395324707031, 0.44580078125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 3.0, 12.0, 19.0, 27.0, 39.0, 97.0, 150.0, 299.0, 116.0, 92.0, 55.0, 34.0, 13.0, 12.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.987550735473633e-05, -3.7929974496364594e-05, -3.598444163799286e-05, -3.4038908779621124e-05, -3.209337592124939e-05, -3.0147843062877655e-05, -2.820231020450592e-05, -2.6256777346134186e-05, -2.431124448776245e-05, -2.2365711629390717e-05, -2.0420178771018982e-05, -1.8474645912647247e-05, -1.6529113054275513e-05, -1.4583580195903778e-05, -1.2638047337532043e-05, -1.0692514479160309e-05, -8.746981620788574e-06, -6.80144876241684e-06, -4.855915904045105e-06, -2.9103830456733704e-06, -9.648501873016357e-07, 9.806826710700989e-07, 2.9262155294418335e-06, 4.871748387813568e-06, 6.817281246185303e-06, 8.762814104557037e-06, 1.0708346962928772e-05, 1.2653879821300507e-05, 1.4599412679672241e-05, 1.6544945538043976e-05, 1.849047839641571e-05, 2.0436011254787445e-05, 2.238154411315918e-05, 2.4327076971530914e-05, 2.627260982990265e-05, 2.8218142688274384e-05, 3.0163675546646118e-05, 3.210920840501785e-05, 3.405474126338959e-05, 3.600027412176132e-05, 3.794580698013306e-05, 3.989133983850479e-05, 4.1836872696876526e-05, 4.378240555524826e-05, 4.5727938413619995e-05, 4.767347127199173e-05, 4.9619004130363464e-05, 5.15645369887352e-05, 5.3510069847106934e-05, 5.545560270547867e-05, 5.74011355638504e-05, 5.934666842222214e-05, 6.129220128059387e-05, 6.32377341389656e-05, 6.518326699733734e-05, 6.712879985570908e-05, 6.907433271408081e-05, 7.101986557245255e-05, 7.296539843082428e-05, 7.491093128919601e-05, 7.685646414756775e-05, 7.880199700593948e-05, 8.074752986431122e-05, 8.269306272268295e-05, 8.463859558105469e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 10.0, 6.0, 14.0, 17.0, 35.0, 41.0, 76.0, 139.0, 278.0, 685.0, 1809.0, 6173.0, 30615.0, 508290.0, 461470.0, 29805.0, 6141.0, 1678.0, 665.0, 266.0, 132.0, 78.0, 52.0, 30.0, 15.0, 9.0, 13.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271484375, -0.2591400146484375, -0.246795654296875, -0.2344512939453125, -0.22210693359375, -0.2097625732421875, -0.197418212890625, -0.1850738525390625, -0.1727294921875, -0.1603851318359375, -0.148040771484375, -0.1356964111328125, -0.12335205078125, -0.1110076904296875, -0.098663330078125, -0.0863189697265625, -0.073974609375, -0.0616302490234375, -0.049285888671875, -0.0369415283203125, -0.02459716796875, -0.0122528076171875, 9.1552734375e-05, 0.0124359130859375, 0.0247802734375, 0.0371246337890625, 0.049468994140625, 0.0618133544921875, 0.07415771484375, 0.0865020751953125, 0.098846435546875, 0.1111907958984375, 0.12353515625, 0.1358795166015625, 0.148223876953125, 0.1605682373046875, 0.17291259765625, 0.1852569580078125, 0.197601318359375, 0.2099456787109375, 0.2222900390625, 0.2346343994140625, 0.246978759765625, 0.2593231201171875, 0.27166748046875, 0.2840118408203125, 0.296356201171875, 0.3087005615234375, 0.321044921875, 0.3333892822265625, 0.345733642578125, 0.3580780029296875, 0.37042236328125, 0.3827667236328125, 0.395111083984375, 0.4074554443359375, 0.4197998046875, 0.4321441650390625, 0.444488525390625, 0.4568328857421875, 0.46917724609375, 0.4815216064453125, 0.493865966796875, 0.5062103271484375, 0.5185546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 4.0, 8.0, 18.0, 11.0, 17.0, 24.0, 47.0, 74.0, 88.0, 185.0, 179.0, 111.0, 59.0, 46.0, 35.0, 17.0, 14.0, 12.0, 7.0, 7.0, 7.0, 4.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1981201171875, -0.1931629180908203, -0.18820571899414062, -0.18324851989746094, -0.17829132080078125, -0.17333412170410156, -0.16837692260742188, -0.1634197235107422, -0.1584625244140625, -0.1535053253173828, -0.14854812622070312, -0.14359092712402344, -0.13863372802734375, -0.13367652893066406, -0.12871932983398438, -0.12376213073730469, -0.118804931640625, -0.11384773254394531, -0.10889053344726562, -0.10393333435058594, -0.09897613525390625, -0.09401893615722656, -0.08906173706054688, -0.08410453796386719, -0.0791473388671875, -0.07419013977050781, -0.06923294067382812, -0.06427574157714844, -0.05931854248046875, -0.05436134338378906, -0.049404144287109375, -0.04444694519042969, -0.03948974609375, -0.03453254699707031, -0.029575347900390625, -0.024618148803710938, -0.01966094970703125, -0.014703750610351562, -0.009746551513671875, -0.0047893524169921875, 0.0001678466796875, 0.0051250457763671875, 0.010082244873046875, 0.015039443969726562, 0.01999664306640625, 0.024953842163085938, 0.029911041259765625, 0.03486824035644531, 0.039825439453125, 0.04478263854980469, 0.049739837646484375, 0.05469703674316406, 0.05965423583984375, 0.06461143493652344, 0.06956863403320312, 0.07452583312988281, 0.0794830322265625, 0.08444023132324219, 0.08939743041992188, 0.09435462951660156, 0.09931182861328125, 0.10426902770996094, 0.10922622680664062, 0.11418342590332031, 0.119140625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 10.0, 24.0, 43.0, 89.0, 222.0, 272.0, 200.0, 89.0, 31.0, 7.0, 5.0, 3.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.550769567489624, -2.4033043384552, -2.2558391094207764, -2.1083738803863525, -1.9609086513519287, -1.8134434223175049, -1.665978193283081, -1.5185129642486572, -1.3710477352142334, -1.2235825061798096, -1.0761172771453857, -0.9286520481109619, -0.7811868190765381, -0.6337215900421143, -0.48625636100769043, -0.3387911319732666, -0.19132590293884277, -0.043860673904418945, 0.10360455513000488, 0.2510697841644287, 0.39853501319885254, 0.5460002422332764, 0.6934654712677002, 0.840930700302124, 0.9883959293365479, 1.1358611583709717, 1.2833263874053955, 1.4307916164398193, 1.5782568454742432, 1.725722074508667, 1.8731873035430908, 2.0206525325775146, 2.1681175231933594, 2.315582752227783, 2.463047981262207, 2.610513210296631, 2.7579784393310547, 2.9054436683654785, 3.0529088973999023, 3.200374126434326, 3.34783935546875, 3.495304584503174, 3.6427698135375977, 3.7902350425720215, 3.9377002716064453, 4.085165500640869, 4.232630729675293, 4.380095958709717, 4.527561187744141, 4.6750264167785645, 4.822491645812988, 4.969956874847412, 5.117422103881836, 5.26488733291626, 5.412352561950684, 5.559817790985107, 5.707283020019531, 5.854748249053955, 6.002213478088379, 6.149678707122803, 6.297143936157227, 6.44460916519165, 6.592074394226074, 6.739539623260498, 6.887004852294922]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 16.0, 21.0, 21.0, 22.0, 29.0, 23.0, 30.0, 18.0, 25.0, 33.0, 40.0, 27.0, 48.0, 49.0, 59.0, 45.0, 48.0, 45.0, 48.0, 43.0, 31.0, 36.0, 27.0, 25.0, 39.0, 24.0, 19.0, 17.0, 16.0, 8.0, 12.0, 9.0, 9.0, 7.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.2585690021514893, -2.1818594932556152, -2.105149745941162, -2.028440237045288, -1.951730728149414, -1.87502121925354, -1.7983115911483765, -1.721601963043213, -1.6448924541473389, -1.5681829452514648, -1.4914733171463013, -1.4147636890411377, -1.3380541801452637, -1.2613446712493896, -1.184635043144226, -1.1079254150390625, -1.0312159061431885, -0.9545063376426697, -0.8777967691421509, -0.8010872006416321, -0.7243776321411133, -0.6476680636405945, -0.5709584951400757, -0.4942489266395569, -0.4175393581390381, -0.3408297896385193, -0.2641202211380005, -0.1874106526374817, -0.11070108413696289, -0.03399151563644409, 0.04271805286407471, 0.1194276213645935, 0.1961369514465332, 0.272846519947052, 0.3495560884475708, 0.4262656569480896, 0.5029752254486084, 0.5796847939491272, 0.656394362449646, 0.7331039309501648, 0.8098134994506836, 0.8865230679512024, 0.9632326364517212, 1.0399422645568848, 1.1166517734527588, 1.1933612823486328, 1.2700709104537964, 1.34678053855896, 1.423490047454834, 1.500199556350708, 1.5769091844558716, 1.6536188125610352, 1.7303283214569092, 1.8070378303527832, 1.8837474584579468, 1.9604570865631104, 2.0371665954589844, 2.1138761043548584, 2.1905856132507324, 2.2672953605651855, 2.3440048694610596, 2.4207143783569336, 2.4974241256713867, 2.5741336345672607, 2.6508431434631348]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 13.0, 14.0, 16.0, 15.0, 31.0, 47.0, 79.0, 110.0, 154.0, 221.0, 397.0, 655.0, 1391.0, 3043.0, 7577.0, 24408.0, 147014.0, 2965880.0, 950192.0, 70076.0, 14149.0, 4481.0, 1927.0, 984.0, 505.0, 329.0, 182.0, 119.0, 87.0, 54.0, 31.0, 25.0, 26.0, 12.0, 11.0, 10.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.99609375, -0.9559478759765625, -0.915802001953125, -0.8756561279296875, -0.83551025390625, -0.7953643798828125, -0.755218505859375, -0.7150726318359375, -0.6749267578125, -0.6347808837890625, -0.594635009765625, -0.5544891357421875, -0.51434326171875, -0.4741973876953125, -0.434051513671875, -0.3939056396484375, -0.353759765625, -0.3136138916015625, -0.273468017578125, -0.2333221435546875, -0.19317626953125, -0.1530303955078125, -0.112884521484375, -0.0727386474609375, -0.0325927734375, 0.0075531005859375, 0.047698974609375, 0.0878448486328125, 0.12799072265625, 0.1681365966796875, 0.208282470703125, 0.2484283447265625, 0.28857421875, 0.3287200927734375, 0.368865966796875, 0.4090118408203125, 0.44915771484375, 0.4893035888671875, 0.529449462890625, 0.5695953369140625, 0.6097412109375, 0.6498870849609375, 0.690032958984375, 0.7301788330078125, 0.77032470703125, 0.8104705810546875, 0.850616455078125, 0.8907623291015625, 0.930908203125, 0.9710540771484375, 1.011199951171875, 1.0513458251953125, 1.09149169921875, 1.1316375732421875, 1.171783447265625, 1.2119293212890625, 1.2520751953125, 1.2922210693359375, 1.332366943359375, 1.3725128173828125, 1.41265869140625, 1.4528045654296875, 1.492950439453125, 1.5330963134765625, 1.5732421875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 11.0, 15.0, 10.0, 19.0, 26.0, 26.0, 47.0, 65.0, 65.0, 82.0, 107.0, 96.0, 100.0, 80.0, 67.0, 54.0, 44.0, 22.0, 22.0, 16.0, 12.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9326171875, -0.8956756591796875, -0.858734130859375, -0.8217926025390625, -0.78485107421875, -0.7479095458984375, -0.710968017578125, -0.6740264892578125, -0.6370849609375, -0.6001434326171875, -0.563201904296875, -0.5262603759765625, -0.48931884765625, -0.4523773193359375, -0.415435791015625, -0.3784942626953125, -0.341552734375, -0.3046112060546875, -0.267669677734375, -0.2307281494140625, -0.19378662109375, -0.1568450927734375, -0.119903564453125, -0.0829620361328125, -0.0460205078125, -0.0090789794921875, 0.027862548828125, 0.0648040771484375, 0.10174560546875, 0.1386871337890625, 0.175628662109375, 0.2125701904296875, 0.24951171875, 0.2864532470703125, 0.323394775390625, 0.3603363037109375, 0.39727783203125, 0.4342193603515625, 0.471160888671875, 0.5081024169921875, 0.5450439453125, 0.5819854736328125, 0.618927001953125, 0.6558685302734375, 0.69281005859375, 0.7297515869140625, 0.766693115234375, 0.8036346435546875, 0.840576171875, 0.8775177001953125, 0.914459228515625, 0.9514007568359375, 0.98834228515625, 1.0252838134765625, 1.062225341796875, 1.0991668701171875, 1.1361083984375, 1.1730499267578125, 1.209991455078125, 1.2469329833984375, 1.28387451171875, 1.3208160400390625, 1.357757568359375, 1.3946990966796875, 1.431640625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 1.0, 2.0, 6.0, 3.0, 7.0, 10.0, 22.0, 25.0, 40.0, 64.0, 97.0, 205.0, 364.0, 882.0, 2514.0, 9166.0, 60632.0, 3337561.0, 741905.0, 31747.0, 5910.0, 1753.0, 691.0, 315.0, 127.0, 86.0, 52.0, 43.0, 15.0, 17.0, 6.0, 8.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.267578125, -2.2133941650390625, -2.159210205078125, -2.1050262451171875, -2.05084228515625, -1.9966583251953125, -1.942474365234375, -1.8882904052734375, -1.8341064453125, -1.7799224853515625, -1.725738525390625, -1.6715545654296875, -1.61737060546875, -1.5631866455078125, -1.509002685546875, -1.4548187255859375, -1.400634765625, -1.3464508056640625, -1.292266845703125, -1.2380828857421875, -1.18389892578125, -1.1297149658203125, -1.075531005859375, -1.0213470458984375, -0.9671630859375, -0.9129791259765625, -0.858795166015625, -0.8046112060546875, -0.75042724609375, -0.6962432861328125, -0.642059326171875, -0.5878753662109375, -0.53369140625, -0.4795074462890625, -0.425323486328125, -0.3711395263671875, -0.31695556640625, -0.2627716064453125, -0.208587646484375, -0.1544036865234375, -0.1002197265625, -0.0460357666015625, 0.008148193359375, 0.0623321533203125, 0.11651611328125, 0.1707000732421875, 0.224884033203125, 0.2790679931640625, 0.333251953125, 0.3874359130859375, 0.441619873046875, 0.4958038330078125, 0.54998779296875, 0.6041717529296875, 0.658355712890625, 0.7125396728515625, 0.7667236328125, 0.8209075927734375, 0.875091552734375, 0.9292755126953125, 0.98345947265625, 1.0376434326171875, 1.091827392578125, 1.1460113525390625, 1.2001953125]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 4.0, 10.0, 4.0, 18.0, 15.0, 23.0, 49.0, 69.0, 83.0, 143.0, 292.0, 514.0, 940.0, 855.0, 439.0, 248.0, 142.0, 71.0, 49.0, 18.0, 26.0, 16.0, 10.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25927734375, -0.24742889404296875, -0.2355804443359375, -0.22373199462890625, -0.211883544921875, -0.20003509521484375, -0.1881866455078125, -0.17633819580078125, -0.16448974609375, -0.15264129638671875, -0.1407928466796875, -0.12894439697265625, -0.117095947265625, -0.10524749755859375, -0.0933990478515625, -0.08155059814453125, -0.0697021484375, -0.05785369873046875, -0.0460052490234375, -0.03415679931640625, -0.022308349609375, -0.01045989990234375, 0.0013885498046875, 0.01323699951171875, 0.02508544921875, 0.03693389892578125, 0.0487823486328125, 0.06063079833984375, 0.072479248046875, 0.08432769775390625, 0.0961761474609375, 0.10802459716796875, 0.119873046875, 0.13172149658203125, 0.1435699462890625, 0.15541839599609375, 0.167266845703125, 0.17911529541015625, 0.1909637451171875, 0.20281219482421875, 0.21466064453125, 0.22650909423828125, 0.2383575439453125, 0.25020599365234375, 0.262054443359375, 0.27390289306640625, 0.2857513427734375, 0.29759979248046875, 0.3094482421875, 0.32129669189453125, 0.3331451416015625, 0.34499359130859375, 0.356842041015625, 0.36869049072265625, 0.3805389404296875, 0.39238739013671875, 0.40423583984375, 0.41608428955078125, 0.4279327392578125, 0.43978118896484375, 0.451629638671875, 0.46347808837890625, 0.4753265380859375, 0.48717498779296875, 0.4990234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 34.0, 66.0, 112.0, 176.0, 209.0, 184.0, 113.0, 53.0, 22.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0143930912017822, -1.9246292114257812, -1.8348653316497803, -1.7451014518737793, -1.6553376913070679, -1.565573811531067, -1.475809931755066, -1.3860461711883545, -1.2962822914123535, -1.2065184116363525, -1.1167545318603516, -1.0269906520843506, -0.9372268915176392, -0.8474630117416382, -0.7576991319656372, -0.667935311794281, -0.5781713724136353, -0.48840752243995667, -0.3986436724662781, -0.3088797926902771, -0.2191159427165985, -0.12935209274291992, -0.039588212966918945, 0.050175607204437256, 0.13993948698043823, 0.22970333695411682, 0.3194671869277954, 0.4092310667037964, 0.498994916677475, 0.5887587666511536, 0.6785226464271545, 0.7682864665985107, 0.8580503463745117, 0.9478142261505127, 1.0375781059265137, 1.1273419857025146, 1.217105746269226, 1.306869626045227, 1.396633505821228, 1.4863972663879395, 1.5761611461639404, 1.6659250259399414, 1.7556889057159424, 1.8454527854919434, 1.9352165460586548, 2.0249805450439453, 2.114744186401367, 2.204508066177368, 2.294271945953369, 2.38403582572937, 2.473799705505371, 2.563563585281372, 2.653327465057373, 2.743091106414795, 2.832855224609375, 2.922618865966797, 3.012382984161377, 3.102146863937378, 3.191910743713379, 3.28167462348938, 3.371438503265381, 3.4612021446228027, 3.550966262817383, 3.6407299041748047, 3.7304937839508057]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 5.0, 3.0, 15.0, 19.0, 16.0, 30.0, 21.0, 38.0, 32.0, 50.0, 40.0, 29.0, 53.0, 56.0, 46.0, 50.0, 51.0, 53.0, 45.0, 53.0, 48.0, 46.0, 36.0, 30.0, 23.0, 18.0, 19.0, 15.0, 13.0, 9.0, 6.0, 1.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.8203262090682983, -0.7937299609184265, -0.7671337127685547, -0.7405374646186829, -0.713941216468811, -0.6873449683189392, -0.6607487201690674, -0.6341524124145508, -0.6075562238693237, -0.5809599757194519, -0.5543637275695801, -0.5277674794197083, -0.5011712312698364, -0.4745749831199646, -0.4479787051677704, -0.42138245701789856, -0.39478617906570435, -0.3681899309158325, -0.3415936827659607, -0.31499743461608887, -0.28840118646621704, -0.2618049383163452, -0.235208660364151, -0.20861241221427917, -0.18201616406440735, -0.15541991591453552, -0.1288236677646637, -0.10222740471363068, -0.07563115656375885, -0.049034908413887024, -0.022438645362854004, 0.004157602787017822, 0.030753910541534424, 0.05735016241669655, 0.08394641429185867, 0.1105426698923111, 0.13713891804218292, 0.16373516619205475, 0.19033142924308777, 0.2169276773929596, 0.24352392554283142, 0.27012017369270325, 0.2967164218425751, 0.3233126997947693, 0.3499089479446411, 0.37650519609451294, 0.40310144424438477, 0.4296976923942566, 0.4562939405441284, 0.48289018869400024, 0.5094864368438721, 0.5360826849937439, 0.5626789331436157, 0.5892751812934875, 0.6158714294433594, 0.642467737197876, 0.669063925743103, 0.6956601738929749, 0.7222564220428467, 0.7488526701927185, 0.7754489183425903, 0.8020451664924622, 0.828641414642334, 0.8552377223968506, 0.8818339705467224]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 10.0, 2.0, 8.0, 17.0, 29.0, 29.0, 31.0, 44.0, 91.0, 121.0, 171.0, 329.0, 469.0, 841.0, 1564.0, 3132.0, 6821.0, 20004.0, 95922.0, 511608.0, 330761.0, 52532.0, 13311.0, 5080.0, 2348.0, 1352.0, 713.0, 462.0, 237.0, 184.0, 103.0, 53.0, 45.0, 24.0, 28.0, 18.0, 15.0, 9.0, 4.0, 9.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.2012939453125, -0.19551467895507812, -0.18973541259765625, -0.18395614624023438, -0.1781768798828125, -0.17239761352539062, -0.16661834716796875, -0.16083908081054688, -0.155059814453125, -0.14928054809570312, -0.14350128173828125, -0.13772201538085938, -0.1319427490234375, -0.12616348266601562, -0.12038421630859375, -0.11460494995117188, -0.10882568359375, -0.10304641723632812, -0.09726715087890625, -0.09148788452148438, -0.0857086181640625, -0.07992935180664062, -0.07415008544921875, -0.06837081909179688, -0.062591552734375, -0.056812286376953125, -0.05103302001953125, -0.045253753662109375, -0.0394744873046875, -0.033695220947265625, -0.02791595458984375, -0.022136688232421875, -0.016357421875, -0.010578155517578125, -0.00479888916015625, 0.000980377197265625, 0.0067596435546875, 0.012538909912109375, 0.01831817626953125, 0.024097442626953125, 0.029876708984375, 0.035655975341796875, 0.04143524169921875, 0.047214508056640625, 0.0529937744140625, 0.058773040771484375, 0.06455230712890625, 0.07033157348632812, 0.07611083984375, 0.08189010620117188, 0.08766937255859375, 0.09344863891601562, 0.0992279052734375, 0.10500717163085938, 0.11078643798828125, 0.11656570434570312, 0.122344970703125, 0.12812423706054688, 0.13390350341796875, 0.13968276977539062, 0.1454620361328125, 0.15124130249023438, 0.15702056884765625, 0.16279983520507812, 0.1685791015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 5.0, 9.0, 8.0, 11.0, 28.0, 23.0, 30.0, 37.0, 50.0, 63.0, 53.0, 50.0, 57.0, 61.0, 61.0, 75.0, 62.0, 56.0, 59.0, 41.0, 22.0, 26.0, 17.0, 22.0, 14.0, 18.0, 10.0, 4.0, 2.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.7001953125, -0.67950439453125, -0.6588134765625, -0.63812255859375, -0.617431640625, -0.59674072265625, -0.5760498046875, -0.55535888671875, -0.53466796875, -0.51397705078125, -0.4932861328125, -0.47259521484375, -0.451904296875, -0.43121337890625, -0.4105224609375, -0.38983154296875, -0.369140625, -0.34844970703125, -0.3277587890625, -0.30706787109375, -0.286376953125, -0.26568603515625, -0.2449951171875, -0.22430419921875, -0.20361328125, -0.18292236328125, -0.1622314453125, -0.14154052734375, -0.120849609375, -0.10015869140625, -0.0794677734375, -0.05877685546875, -0.0380859375, -0.01739501953125, 0.0032958984375, 0.02398681640625, 0.044677734375, 0.06536865234375, 0.0860595703125, 0.10675048828125, 0.12744140625, 0.14813232421875, 0.1688232421875, 0.18951416015625, 0.210205078125, 0.23089599609375, 0.2515869140625, 0.27227783203125, 0.29296875, 0.31365966796875, 0.3343505859375, 0.35504150390625, 0.375732421875, 0.39642333984375, 0.4171142578125, 0.43780517578125, 0.45849609375, 0.47918701171875, 0.4998779296875, 0.52056884765625, 0.541259765625, 0.56195068359375, 0.5826416015625, 0.60333251953125, 0.6240234375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 8.0, 8.0, 11.0, 9.0, 18.0, 17.0, 25.0, 38.0, 57.0, 93.0, 151.0, 226.0, 356.0, 675.0, 1193.0, 2300.0, 4849.0, 13209.0, 54903.0, 321830.0, 506199.0, 107557.0, 21306.0, 7082.0, 2950.0, 1467.0, 776.0, 452.0, 271.0, 176.0, 106.0, 78.0, 50.0, 30.0, 20.0, 11.0, 16.0, 12.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1282958984375, -0.12404632568359375, -0.1197967529296875, -0.11554718017578125, -0.111297607421875, -0.10704803466796875, -0.1027984619140625, -0.09854888916015625, -0.09429931640625, -0.09004974365234375, -0.0858001708984375, -0.08155059814453125, -0.077301025390625, -0.07305145263671875, -0.0688018798828125, -0.06455230712890625, -0.060302734375, -0.05605316162109375, -0.0518035888671875, -0.04755401611328125, -0.043304443359375, -0.03905487060546875, -0.0348052978515625, -0.03055572509765625, -0.02630615234375, -0.02205657958984375, -0.0178070068359375, -0.01355743408203125, -0.009307861328125, -0.00505828857421875, -0.0008087158203125, 0.00344085693359375, 0.0076904296875, 0.01194000244140625, 0.0161895751953125, 0.02043914794921875, 0.024688720703125, 0.02893829345703125, 0.0331878662109375, 0.03743743896484375, 0.04168701171875, 0.04593658447265625, 0.0501861572265625, 0.05443572998046875, 0.058685302734375, 0.06293487548828125, 0.0671844482421875, 0.07143402099609375, 0.07568359375, 0.07993316650390625, 0.0841827392578125, 0.08843231201171875, 0.092681884765625, 0.09693145751953125, 0.1011810302734375, 0.10543060302734375, 0.10968017578125, 0.11392974853515625, 0.1181793212890625, 0.12242889404296875, 0.126678466796875, 0.13092803955078125, 0.1351776123046875, 0.13942718505859375, 0.1436767578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 6.0, 5.0, 9.0, 11.0, 9.0, 16.0, 17.0, 18.0, 24.0, 26.0, 33.0, 32.0, 42.0, 44.0, 51.0, 50.0, 43.0, 43.0, 43.0, 45.0, 52.0, 41.0, 53.0, 46.0, 35.0, 22.0, 30.0, 23.0, 23.0, 18.0, 19.0, 19.0, 10.0, 14.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.86669921875, -0.8379440307617188, -0.8091888427734375, -0.7804336547851562, -0.751678466796875, -0.7229232788085938, -0.6941680908203125, -0.6654129028320312, -0.63665771484375, -0.6079025268554688, -0.5791473388671875, -0.5503921508789062, -0.521636962890625, -0.49288177490234375, -0.4641265869140625, -0.43537139892578125, -0.4066162109375, -0.37786102294921875, -0.3491058349609375, -0.32035064697265625, -0.291595458984375, -0.26284027099609375, -0.2340850830078125, -0.20532989501953125, -0.17657470703125, -0.14781951904296875, -0.1190643310546875, -0.09030914306640625, -0.061553955078125, -0.03279876708984375, -0.0040435791015625, 0.02471160888671875, 0.053466796875, 0.08222198486328125, 0.1109771728515625, 0.13973236083984375, 0.168487548828125, 0.19724273681640625, 0.2259979248046875, 0.25475311279296875, 0.28350830078125, 0.31226348876953125, 0.3410186767578125, 0.36977386474609375, 0.398529052734375, 0.42728424072265625, 0.4560394287109375, 0.48479461669921875, 0.5135498046875, 0.5423049926757812, 0.5710601806640625, 0.5998153686523438, 0.628570556640625, 0.6573257446289062, 0.6860809326171875, 0.7148361206054688, 0.74359130859375, 0.7723464965820312, 0.8011016845703125, 0.8298568725585938, 0.858612060546875, 0.8873672485351562, 0.9161224365234375, 0.9448776245117188, 0.9736328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 8.0, 16.0, 21.0, 49.0, 105.0, 169.0, 460.0, 1299.0, 6625.0, 112140.0, 894980.0, 27749.0, 3391.0, 873.0, 340.0, 126.0, 69.0, 38.0, 23.0, 18.0, 13.0, 3.0, 9.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12744140625, -0.12219810485839844, -0.11695480346679688, -0.11171150207519531, -0.10646820068359375, -0.10122489929199219, -0.09598159790039062, -0.09073829650878906, -0.0854949951171875, -0.08025169372558594, -0.07500839233398438, -0.06976509094238281, -0.06452178955078125, -0.05927848815917969, -0.054035186767578125, -0.04879188537597656, -0.043548583984375, -0.03830528259277344, -0.033061981201171875, -0.027818679809570312, -0.02257537841796875, -0.017332077026367188, -0.012088775634765625, -0.0068454742431640625, -0.0016021728515625, 0.0036411285400390625, 0.008884429931640625, 0.014127731323242188, 0.01937103271484375, 0.024614334106445312, 0.029857635498046875, 0.03510093688964844, 0.04034423828125, 0.04558753967285156, 0.050830841064453125, 0.05607414245605469, 0.06131744384765625, 0.06656074523925781, 0.07180404663085938, 0.07704734802246094, 0.0822906494140625, 0.08753395080566406, 0.09277725219726562, 0.09802055358886719, 0.10326385498046875, 0.10850715637207031, 0.11375045776367188, 0.11899375915527344, 0.124237060546875, 0.12948036193847656, 0.13472366333007812, 0.1399669647216797, 0.14521026611328125, 0.1504535675048828, 0.15569686889648438, 0.16094017028808594, 0.1661834716796875, 0.17142677307128906, 0.17667007446289062, 0.1819133758544922, 0.18715667724609375, 0.1923999786376953, 0.19764328002929688, 0.20288658142089844, 0.2081298828125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 15.0, 25.0, 24.0, 33.0, 46.0, 58.0, 86.0, 112.0, 108.0, 108.0, 88.0, 65.0, 39.0, 40.0, 38.0, 23.0, 24.0, 13.0, 6.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.355741500854492e-05, -3.25031578540802e-05, -3.144890069961548e-05, -3.0394643545150757e-05, -2.9340386390686035e-05, -2.8286129236221313e-05, -2.7231872081756592e-05, -2.617761492729187e-05, -2.512335777282715e-05, -2.4069100618362427e-05, -2.3014843463897705e-05, -2.1960586309432983e-05, -2.0906329154968262e-05, -1.985207200050354e-05, -1.879781484603882e-05, -1.7743557691574097e-05, -1.6689300537109375e-05, -1.5635043382644653e-05, -1.4580786228179932e-05, -1.352652907371521e-05, -1.2472271919250488e-05, -1.1418014764785767e-05, -1.0363757610321045e-05, -9.309500455856323e-06, -8.255243301391602e-06, -7.20098614692688e-06, -6.146728992462158e-06, -5.0924718379974365e-06, -4.038214683532715e-06, -2.983957529067993e-06, -1.9297003746032715e-06, -8.754432201385498e-07, 1.7881393432617188e-07, 1.2330710887908936e-06, 2.2873282432556152e-06, 3.341585397720337e-06, 4.395842552185059e-06, 5.45009970664978e-06, 6.504356861114502e-06, 7.558614015579224e-06, 8.612871170043945e-06, 9.667128324508667e-06, 1.0721385478973389e-05, 1.177564263343811e-05, 1.2829899787902832e-05, 1.3884156942367554e-05, 1.4938414096832275e-05, 1.5992671251296997e-05, 1.704692840576172e-05, 1.810118556022644e-05, 1.9155442714691162e-05, 2.0209699869155884e-05, 2.1263957023620605e-05, 2.2318214178085327e-05, 2.337247133255005e-05, 2.442672848701477e-05, 2.5480985641479492e-05, 2.6535242795944214e-05, 2.7589499950408936e-05, 2.8643757104873657e-05, 2.969801425933838e-05, 3.07522714138031e-05, 3.180652856826782e-05, 3.2860785722732544e-05, 3.3915042877197266e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 5.0, 2.0, 0.0, 4.0, 5.0, 7.0, 8.0, 13.0, 21.0, 22.0, 40.0, 62.0, 115.0, 182.0, 230.0, 400.0, 640.0, 1032.0, 1866.0, 3624.0, 8123.0, 22116.0, 93703.0, 516142.0, 318080.0, 54308.0, 14924.0, 6093.0, 2921.0, 1527.0, 885.0, 536.0, 321.0, 201.0, 132.0, 88.0, 60.0, 33.0, 31.0, 18.0, 13.0, 9.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.069091796875, -0.06692123413085938, -0.06475067138671875, -0.06258010864257812, -0.0604095458984375, -0.058238983154296875, -0.05606842041015625, -0.053897857666015625, -0.051727294921875, -0.049556732177734375, -0.04738616943359375, -0.045215606689453125, -0.0430450439453125, -0.040874481201171875, -0.03870391845703125, -0.036533355712890625, -0.03436279296875, -0.032192230224609375, -0.03002166748046875, -0.027851104736328125, -0.0256805419921875, -0.023509979248046875, -0.02133941650390625, -0.019168853759765625, -0.016998291015625, -0.014827728271484375, -0.01265716552734375, -0.010486602783203125, -0.0083160400390625, -0.006145477294921875, -0.00397491455078125, -0.001804351806640625, 0.0003662109375, 0.002536773681640625, 0.00470733642578125, 0.006877899169921875, 0.0090484619140625, 0.011219024658203125, 0.01338958740234375, 0.015560150146484375, 0.017730712890625, 0.019901275634765625, 0.02207183837890625, 0.024242401123046875, 0.0264129638671875, 0.028583526611328125, 0.03075408935546875, 0.032924652099609375, 0.03509521484375, 0.037265777587890625, 0.03943634033203125, 0.041606903076171875, 0.0437774658203125, 0.045948028564453125, 0.04811859130859375, 0.050289154052734375, 0.052459716796875, 0.054630279541015625, 0.05680084228515625, 0.058971405029296875, 0.0611419677734375, 0.06331253051757812, 0.06548309326171875, 0.06765365600585938, 0.06982421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 3.0, 5.0, 7.0, 21.0, 17.0, 25.0, 22.0, 49.0, 56.0, 83.0, 100.0, 124.0, 113.0, 98.0, 64.0, 46.0, 43.0, 30.0, 21.0, 8.0, 15.0, 7.0, 10.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0161590576171875, -0.015506505966186523, -0.014853954315185547, -0.01420140266418457, -0.013548851013183594, -0.012896299362182617, -0.01224374771118164, -0.011591196060180664, -0.010938644409179688, -0.010286092758178711, -0.009633541107177734, -0.008980989456176758, -0.008328437805175781, -0.007675886154174805, -0.007023334503173828, -0.0063707828521728516, -0.005718231201171875, -0.0050656795501708984, -0.004413127899169922, -0.0037605762481689453, -0.0031080245971679688, -0.002455472946166992, -0.0018029212951660156, -0.001150369644165039, -0.0004978179931640625, 0.00015473365783691406, 0.0008072853088378906, 0.0014598369598388672, 0.0021123886108398438, 0.0027649402618408203, 0.003417491912841797, 0.0040700435638427734, 0.00472259521484375, 0.0053751468658447266, 0.006027698516845703, 0.00668025016784668, 0.007332801818847656, 0.007985353469848633, 0.00863790512084961, 0.009290456771850586, 0.009943008422851562, 0.010595560073852539, 0.011248111724853516, 0.011900663375854492, 0.012553215026855469, 0.013205766677856445, 0.013858318328857422, 0.014510869979858398, 0.015163421630859375, 0.01581597328186035, 0.016468524932861328, 0.017121076583862305, 0.01777362823486328, 0.018426179885864258, 0.019078731536865234, 0.01973128318786621, 0.020383834838867188, 0.021036386489868164, 0.02168893814086914, 0.022341489791870117, 0.022994041442871094, 0.02364659309387207, 0.024299144744873047, 0.024951696395874023, 0.025604248046875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 17.0, 24.0, 49.0, 110.0, 209.0, 241.0, 176.0, 104.0, 42.0, 14.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.659118413925171, -1.596024751663208, -1.5329309701919556, -1.4698373079299927, -1.4067436456680298, -1.3436498641967773, -1.2805562019348145, -1.2174625396728516, -1.1543688774108887, -1.0912752151489258, -1.0281814336776733, -0.9650877714157104, -0.9019941091537476, -0.8389003872871399, -0.7758066654205322, -0.7127130031585693, -0.6496192216873169, -0.5865254998207092, -0.5234318375587463, -0.46033811569213867, -0.3972444236278534, -0.3341507315635681, -0.27105700969696045, -0.20796331763267517, -0.1448696255683899, -0.08177592605352402, -0.018682226538658142, 0.04441148042678833, 0.10750517249107361, 0.1705988645553589, 0.23369258642196655, 0.29678627848625183, 0.3598799705505371, 0.4229736626148224, 0.48606735467910767, 0.5491610765457153, 0.6122547388076782, 0.6753484606742859, 0.7384421825408936, 0.8015358448028564, 0.8646295666694641, 0.9277232885360718, 0.9908169507980347, 1.053910732269287, 1.11700439453125, 1.180098056793213, 1.2431917190551758, 1.3062855005264282, 1.3693791627883911, 1.432472825050354, 1.4955666065216064, 1.5586602687835693, 1.6217539310455322, 1.6848475933074951, 1.7479413747787476, 1.8110350370407104, 1.874128818511963, 1.9372224807739258, 2.0003161430358887, 2.0634098052978516, 2.1265037059783936, 2.1895973682403564, 2.2526910305023193, 2.3157846927642822, 2.378878355026245]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 7.0, 4.0, 3.0, 5.0, 12.0, 7.0, 16.0, 18.0, 18.0, 21.0, 41.0, 39.0, 37.0, 56.0, 39.0, 49.0, 68.0, 40.0, 70.0, 57.0, 52.0, 54.0, 54.0, 46.0, 39.0, 33.0, 20.0, 23.0, 22.0, 12.0, 9.0, 12.0, 3.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.5706307888031006, -0.5522164702415466, -0.5338022112846375, -0.5153878927230835, -0.4969736337661743, -0.47855934500694275, -0.4601450562477112, -0.4417307376861572, -0.42331647872924805, -0.4049021899700165, -0.3864879012107849, -0.36807361245155334, -0.3496593236923218, -0.3312450349330902, -0.31283074617385864, -0.2944164276123047, -0.2760021388530731, -0.25758785009384155, -0.23917356133460999, -0.22075927257537842, -0.20234498381614685, -0.18393069505691528, -0.16551639139652252, -0.14710210263729095, -0.1286878138780594, -0.11027352511882782, -0.09185923635959625, -0.07344494014978409, -0.05503065139055252, -0.03661636263132095, -0.01820206642150879, 0.00021222233772277832, 0.018626511096954346, 0.03704079985618591, 0.05545509234070778, 0.07386938482522964, 0.09228367358446121, 0.11069796234369278, 0.12911225855350494, 0.1475265473127365, 0.16594083607196808, 0.18435512483119965, 0.2027694135904312, 0.22118371725082397, 0.23959800601005554, 0.2580122947692871, 0.2764265835285187, 0.29484087228775024, 0.3132551610469818, 0.3316694498062134, 0.35008373856544495, 0.3684980273246765, 0.3869123160839081, 0.40532660484313965, 0.4237409234046936, 0.4421551823616028, 0.46056950092315674, 0.4789837896823883, 0.4973980784416199, 0.5158123970031738, 0.534226655960083, 0.552640974521637, 0.5710552334785461, 0.5894695520401001, 0.6078838109970093]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 13.0, 30.0, 43.0, 75.0, 93.0, 234.0, 410.0, 831.0, 1644.0, 3985.0, 10604.0, 33868.0, 202921.0, 702112.0, 63775.0, 17289.0, 5940.0, 2409.0, 1112.0, 517.0, 267.0, 151.0, 84.0, 59.0, 28.0, 24.0, 9.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5750656127929688, -0.5539398193359375, -0.5328140258789062, -0.511688232421875, -0.49056243896484375, -0.4694366455078125, -0.44831085205078125, -0.42718505859375, -0.40605926513671875, -0.3849334716796875, -0.36380767822265625, -0.342681884765625, -0.32155609130859375, -0.3004302978515625, -0.27930450439453125, -0.2581787109375, -0.23705291748046875, -0.2159271240234375, -0.19480133056640625, -0.173675537109375, -0.15254974365234375, -0.1314239501953125, -0.11029815673828125, -0.08917236328125, -0.06804656982421875, -0.0469207763671875, -0.02579498291015625, -0.004669189453125, 0.01645660400390625, 0.0375823974609375, 0.05870819091796875, 0.079833984375, 0.10095977783203125, 0.1220855712890625, 0.14321136474609375, 0.164337158203125, 0.18546295166015625, 0.2065887451171875, 0.22771453857421875, 0.24884033203125, 0.26996612548828125, 0.2910919189453125, 0.31221771240234375, 0.333343505859375, 0.35446929931640625, 0.3755950927734375, 0.39672088623046875, 0.4178466796875, 0.43897247314453125, 0.4600982666015625, 0.48122406005859375, 0.502349853515625, 0.5234756469726562, 0.5446014404296875, 0.5657272338867188, 0.58685302734375, 0.6079788208007812, 0.6291046142578125, 0.6502304077148438, 0.671356201171875, 0.6924819946289062, 0.7136077880859375, 0.7347335815429688, 0.755859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 3.0, 5.0, 11.0, 10.0, 21.0, 28.0, 40.0, 38.0, 52.0, 58.0, 65.0, 69.0, 72.0, 80.0, 71.0, 56.0, 71.0, 50.0, 48.0, 28.0, 33.0, 21.0, 25.0, 10.0, 8.0, 4.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.169921875, -1.12158203125, -1.0732421875, -1.02490234375, -0.9765625, -0.92822265625, -0.8798828125, -0.83154296875, -0.783203125, -0.73486328125, -0.6865234375, -0.63818359375, -0.58984375, -0.54150390625, -0.4931640625, -0.44482421875, -0.396484375, -0.34814453125, -0.2998046875, -0.25146484375, -0.203125, -0.15478515625, -0.1064453125, -0.05810546875, -0.009765625, 0.03857421875, 0.0869140625, 0.13525390625, 0.18359375, 0.23193359375, 0.2802734375, 0.32861328125, 0.376953125, 0.42529296875, 0.4736328125, 0.52197265625, 0.5703125, 0.61865234375, 0.6669921875, 0.71533203125, 0.763671875, 0.81201171875, 0.8603515625, 0.90869140625, 0.95703125, 1.00537109375, 1.0537109375, 1.10205078125, 1.150390625, 1.19873046875, 1.2470703125, 1.29541015625, 1.34375, 1.39208984375, 1.4404296875, 1.48876953125, 1.537109375, 1.58544921875, 1.6337890625, 1.68212890625, 1.73046875, 1.77880859375, 1.8271484375, 1.87548828125, 1.923828125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 10.0, 4.0, 15.0, 11.0, 13.0, 20.0, 25.0, 22.0, 28.0, 53.0, 39.0, 68.0, 156.0, 373.0, 1484.0, 10981.0, 322135.0, 696020.0, 14488.0, 1750.0, 377.0, 157.0, 68.0, 49.0, 40.0, 28.0, 24.0, 17.0, 16.0, 17.0, 16.0, 11.0, 8.0, 5.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.181396484375, -1.14208984375, -1.102783203125, -1.0634765625, -1.024169921875, -0.98486328125, -0.945556640625, -0.90625, -0.866943359375, -0.82763671875, -0.788330078125, -0.7490234375, -0.709716796875, -0.67041015625, -0.631103515625, -0.591796875, -0.552490234375, -0.51318359375, -0.473876953125, -0.4345703125, -0.395263671875, -0.35595703125, -0.316650390625, -0.27734375, -0.238037109375, -0.19873046875, -0.159423828125, -0.1201171875, -0.080810546875, -0.04150390625, -0.002197265625, 0.037109375, 0.076416015625, 0.11572265625, 0.155029296875, 0.1943359375, 0.233642578125, 0.27294921875, 0.312255859375, 0.3515625, 0.390869140625, 0.43017578125, 0.469482421875, 0.5087890625, 0.548095703125, 0.58740234375, 0.626708984375, 0.666015625, 0.705322265625, 0.74462890625, 0.783935546875, 0.8232421875, 0.862548828125, 0.90185546875, 0.941162109375, 0.98046875, 1.019775390625, 1.05908203125, 1.098388671875, 1.1376953125, 1.177001953125, 1.21630859375, 1.255615234375, 1.294921875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 9.0, 14.0, 9.0, 13.0, 9.0, 18.0, 18.0, 19.0, 32.0, 23.0, 27.0, 28.0, 43.0, 47.0, 48.0, 46.0, 50.0, 50.0, 44.0, 44.0, 40.0, 47.0, 38.0, 39.0, 41.0, 26.0, 21.0, 27.0, 18.0, 20.0, 9.0, 11.0, 17.0, 7.0, 12.0, 3.0, 8.0, 1.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1103515625, -1.07427978515625, -1.0382080078125, -1.00213623046875, -0.966064453125, -0.92999267578125, -0.8939208984375, -0.85784912109375, -0.82177734375, -0.78570556640625, -0.7496337890625, -0.71356201171875, -0.677490234375, -0.64141845703125, -0.6053466796875, -0.56927490234375, -0.533203125, -0.49713134765625, -0.4610595703125, -0.42498779296875, -0.388916015625, -0.35284423828125, -0.3167724609375, -0.28070068359375, -0.24462890625, -0.20855712890625, -0.1724853515625, -0.13641357421875, -0.100341796875, -0.06427001953125, -0.0281982421875, 0.00787353515625, 0.0439453125, 0.08001708984375, 0.1160888671875, 0.15216064453125, 0.188232421875, 0.22430419921875, 0.2603759765625, 0.29644775390625, 0.33251953125, 0.36859130859375, 0.4046630859375, 0.44073486328125, 0.476806640625, 0.51287841796875, 0.5489501953125, 0.58502197265625, 0.62109375, 0.65716552734375, 0.6932373046875, 0.72930908203125, 0.765380859375, 0.80145263671875, 0.8375244140625, 0.87359619140625, 0.90966796875, 0.94573974609375, 0.9818115234375, 1.01788330078125, 1.053955078125, 1.09002685546875, 1.1260986328125, 1.16217041015625, 1.1982421875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 11.0, 14.0, 21.0, 36.0, 54.0, 85.0, 188.0, 337.0, 744.0, 2058.0, 7743.0, 48790.0, 855735.0, 113678.0, 13983.0, 3081.0, 1026.0, 484.0, 204.0, 109.0, 55.0, 41.0, 16.0, 12.0, 5.0, 12.0, 8.0, 3.0, 3.0, 5.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23046875, -0.21983718872070312, -0.20920562744140625, -0.19857406616210938, -0.1879425048828125, -0.17731094360351562, -0.16667938232421875, -0.15604782104492188, -0.145416259765625, -0.13478469848632812, -0.12415313720703125, -0.11352157592773438, -0.1028900146484375, -0.09225845336914062, -0.08162689208984375, -0.07099533081054688, -0.06036376953125, -0.049732208251953125, -0.03910064697265625, -0.028469085693359375, -0.0178375244140625, -0.007205963134765625, 0.00342559814453125, 0.014057159423828125, 0.024688720703125, 0.035320281982421875, 0.04595184326171875, 0.056583404541015625, 0.0672149658203125, 0.07784652709960938, 0.08847808837890625, 0.09910964965820312, 0.1097412109375, 0.12037277221679688, 0.13100433349609375, 0.14163589477539062, 0.1522674560546875, 0.16289901733398438, 0.17353057861328125, 0.18416213989257812, 0.194793701171875, 0.20542526245117188, 0.21605682373046875, 0.22668838500976562, 0.2373199462890625, 0.24795150756835938, 0.25858306884765625, 0.2692146301269531, 0.27984619140625, 0.2904777526855469, 0.30110931396484375, 0.3117408752441406, 0.3223724365234375, 0.3330039978027344, 0.34363555908203125, 0.3542671203613281, 0.364898681640625, 0.3755302429199219, 0.38616180419921875, 0.3967933654785156, 0.4074249267578125, 0.4180564880371094, 0.42868804931640625, 0.4393196105957031, 0.449951171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 3.0, 3.0, 17.0, 11.0, 18.0, 30.0, 32.0, 64.0, 145.0, 345.0, 136.0, 60.0, 38.0, 23.0, 17.0, 14.0, 9.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9948692321777344e-05, -4.861410707235336e-05, -4.727952182292938e-05, -4.59449365735054e-05, -4.461035132408142e-05, -4.327576607465744e-05, -4.194118082523346e-05, -4.060659557580948e-05, -3.92720103263855e-05, -3.793742507696152e-05, -3.660283982753754e-05, -3.5268254578113556e-05, -3.3933669328689575e-05, -3.2599084079265594e-05, -3.1264498829841614e-05, -2.9929913580417633e-05, -2.8595328330993652e-05, -2.726074308156967e-05, -2.592615783214569e-05, -2.459157258272171e-05, -2.325698733329773e-05, -2.192240208387375e-05, -2.0587816834449768e-05, -1.9253231585025787e-05, -1.7918646335601807e-05, -1.6584061086177826e-05, -1.5249475836753845e-05, -1.3914890587329865e-05, -1.2580305337905884e-05, -1.1245720088481903e-05, -9.911134839057922e-06, -8.576549589633942e-06, -7.241964340209961e-06, -5.90737909078598e-06, -4.5727938413619995e-06, -3.238208591938019e-06, -1.903623342514038e-06, -5.690380930900574e-07, 7.655471563339233e-07, 2.100132405757904e-06, 3.4347176551818848e-06, 4.7693029046058655e-06, 6.103888154029846e-06, 7.438473403453827e-06, 8.773058652877808e-06, 1.0107643902301788e-05, 1.1442229151725769e-05, 1.277681440114975e-05, 1.411139965057373e-05, 1.544598489999771e-05, 1.6780570149421692e-05, 1.8115155398845673e-05, 1.9449740648269653e-05, 2.0784325897693634e-05, 2.2118911147117615e-05, 2.3453496396541595e-05, 2.4788081645965576e-05, 2.6122666895389557e-05, 2.7457252144813538e-05, 2.879183739423752e-05, 3.01264226436615e-05, 3.146100789308548e-05, 3.279559314250946e-05, 3.413017839193344e-05, 3.546476364135742e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 11.0, 11.0, 24.0, 42.0, 78.0, 163.0, 465.0, 1282.0, 5165.0, 31803.0, 826739.0, 163388.0, 15017.0, 2918.0, 836.0, 310.0, 128.0, 77.0, 39.0, 26.0, 9.0, 3.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.55078125, -0.5376091003417969, -0.5244369506835938, -0.5112648010253906, -0.4980926513671875, -0.4849205017089844, -0.47174835205078125, -0.4585762023925781, -0.445404052734375, -0.4322319030761719, -0.41905975341796875, -0.4058876037597656, -0.3927154541015625, -0.3795433044433594, -0.36637115478515625, -0.3531990051269531, -0.34002685546875, -0.3268547058105469, -0.31368255615234375, -0.3005104064941406, -0.2873382568359375, -0.2741661071777344, -0.26099395751953125, -0.24782180786132812, -0.234649658203125, -0.22147750854492188, -0.20830535888671875, -0.19513320922851562, -0.1819610595703125, -0.16878890991210938, -0.15561676025390625, -0.14244461059570312, -0.1292724609375, -0.11610031127929688, -0.10292816162109375, -0.08975601196289062, -0.0765838623046875, -0.06341171264648438, -0.05023956298828125, -0.037067413330078125, -0.023895263671875, -0.010723114013671875, 0.00244903564453125, 0.015621185302734375, 0.0287933349609375, 0.041965484619140625, 0.05513763427734375, 0.06830978393554688, 0.08148193359375, 0.09465408325195312, 0.10782623291015625, 0.12099838256835938, 0.1341705322265625, 0.14734268188476562, 0.16051483154296875, 0.17368698120117188, 0.186859130859375, 0.20003128051757812, 0.21320343017578125, 0.22637557983398438, 0.2395477294921875, 0.2527198791503906, 0.26589202880859375, 0.2790641784667969, 0.292236328125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 1.0, 5.0, 10.0, 14.0, 9.0, 12.0, 22.0, 31.0, 42.0, 76.0, 149.0, 357.0, 96.0, 55.0, 35.0, 13.0, 20.0, 15.0, 13.0, 13.0, 4.0, 3.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10174560546875, -0.09694957733154297, -0.09215354919433594, -0.0873575210571289, -0.08256149291992188, -0.07776546478271484, -0.07296943664550781, -0.06817340850830078, -0.06337738037109375, -0.05858135223388672, -0.05378532409667969, -0.048989295959472656, -0.044193267822265625, -0.039397239685058594, -0.03460121154785156, -0.02980518341064453, -0.0250091552734375, -0.02021312713623047, -0.015417098999023438, -0.010621070861816406, -0.005825042724609375, -0.0010290145874023438, 0.0037670135498046875, 0.008563041687011719, 0.01335906982421875, 0.01815509796142578, 0.022951126098632812, 0.027747154235839844, 0.032543182373046875, 0.037339210510253906, 0.04213523864746094, 0.04693126678466797, 0.051727294921875, 0.05652332305908203, 0.06131935119628906, 0.0661153793334961, 0.07091140747070312, 0.07570743560791016, 0.08050346374511719, 0.08529949188232422, 0.09009552001953125, 0.09489154815673828, 0.09968757629394531, 0.10448360443115234, 0.10927963256835938, 0.1140756607055664, 0.11887168884277344, 0.12366771697998047, 0.1284637451171875, 0.13325977325439453, 0.13805580139160156, 0.1428518295288086, 0.14764785766601562, 0.15244388580322266, 0.1572399139404297, 0.16203594207763672, 0.16683197021484375, 0.17162799835205078, 0.1764240264892578, 0.18122005462646484, 0.18601608276367188, 0.1908121109008789, 0.19560813903808594, 0.20040416717529297, 0.2052001953125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 12.0, 18.0, 46.0, 133.0, 215.0, 298.0, 181.0, 69.0, 22.0, 10.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.805270195007324, -5.644710540771484, -5.4841508865356445, -5.323591232299805, -5.163031578063965, -5.002471446990967, -4.841911792755127, -4.681352138519287, -4.520792484283447, -4.360232830047607, -4.199673175811768, -4.039113521575928, -3.878553628921509, -3.717993974685669, -3.55743408203125, -3.39687442779541, -3.2363147735595703, -3.0757551193237305, -2.9151954650878906, -2.7546355724334717, -2.594075918197632, -2.433516263961792, -2.272956371307373, -2.112396717071533, -1.9518370628356934, -1.7912774085998535, -1.6307176351547241, -1.4701578617095947, -1.3095982074737549, -1.149038553237915, -0.9884787797927856, -0.8279190063476562, -0.6673588752746582, -0.5067991614341736, -0.34623944759368896, -0.18567973375320435, -0.025120019912719727, 0.1354396939277649, 0.2959994077682495, 0.4565591812133789, 0.6171188354492188, 0.7776785492897034, 0.938238263130188, 1.0987980365753174, 1.2593576908111572, 1.419917345046997, 1.5804771184921265, 1.7410368919372559, 1.9015965461730957, 2.0621562004089355, 2.2227158546447754, 2.3832757472991943, 2.543835401535034, 2.704395055770874, 2.864954948425293, 3.025514602661133, 3.1860742568969727, 3.3466339111328125, 3.5071935653686523, 3.6677534580230713, 3.828313112258911, 3.988872766494751, 4.14943265914917, 4.30999231338501, 4.47055196762085]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 1.0, 7.0, 6.0, 11.0, 16.0, 14.0, 27.0, 24.0, 30.0, 29.0, 21.0, 33.0, 37.0, 41.0, 24.0, 49.0, 36.0, 39.0, 44.0, 44.0, 42.0, 39.0, 39.0, 28.0, 44.0, 26.0, 23.0, 23.0, 32.0, 16.0, 24.0, 21.0, 10.0, 14.0, 16.0, 15.0, 11.0, 13.0, 2.0, 5.0, 5.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7687351703643799, -1.7140032052993774, -1.6592713594436646, -1.604539394378662, -1.5498074293136597, -1.4950755834579468, -1.4403436183929443, -1.3856117725372314, -1.330879807472229, -1.2761478424072266, -1.2214159965515137, -1.1666840314865112, -1.1119520664215088, -1.057220220565796, -1.0024882555007935, -0.9477563500404358, -0.8930243849754333, -0.8382924795150757, -0.7835605144500732, -0.7288286089897156, -0.6740967035293579, -0.6193647384643555, -0.5646328330039978, -0.5099009275436401, -0.4551689922809601, -0.40043705701828003, -0.34570515155792236, -0.2909732162952423, -0.23624129593372345, -0.1815093755722046, -0.12677744030952454, -0.07204553484916687, -0.017313599586486816, 0.03741832450032234, 0.0921502485871315, 0.14688217639923096, 0.20161409676074982, 0.2563460171222687, 0.31107795238494873, 0.3658098578453064, 0.42054179310798645, 0.4752737283706665, 0.5300056338310242, 0.5847375392913818, 0.6394695043563843, 0.6942014098167419, 0.7489333152770996, 0.803665280342102, 0.8583971858024597, 0.9131290912628174, 0.9678610563278198, 1.0225930213928223, 1.0773248672485352, 1.1320568323135376, 1.18678879737854, 1.241520643234253, 1.2962526082992554, 1.3509845733642578, 1.4057164192199707, 1.4604483842849731, 1.5151803493499756, 1.5699121952056885, 1.624644160270691, 1.6793761253356934, 1.7341079711914062]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 7.0, 3.0, 7.0, 10.0, 11.0, 19.0, 19.0, 34.0, 48.0, 64.0, 82.0, 139.0, 230.0, 344.0, 656.0, 1286.0, 3068.0, 8916.0, 46320.0, 1454726.0, 2598702.0, 63141.0, 10276.0, 3141.0, 1327.0, 710.0, 363.0, 216.0, 129.0, 78.0, 59.0, 47.0, 18.0, 27.0, 21.0, 11.0, 9.0, 9.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.19140625, -1.14385986328125, -1.0963134765625, -1.04876708984375, -1.001220703125, -0.95367431640625, -0.9061279296875, -0.85858154296875, -0.81103515625, -0.76348876953125, -0.7159423828125, -0.66839599609375, -0.620849609375, -0.57330322265625, -0.5257568359375, -0.47821044921875, -0.4306640625, -0.38311767578125, -0.3355712890625, -0.28802490234375, -0.240478515625, -0.19293212890625, -0.1453857421875, -0.09783935546875, -0.05029296875, -0.00274658203125, 0.0447998046875, 0.09234619140625, 0.139892578125, 0.18743896484375, 0.2349853515625, 0.28253173828125, 0.330078125, 0.37762451171875, 0.4251708984375, 0.47271728515625, 0.520263671875, 0.56781005859375, 0.6153564453125, 0.66290283203125, 0.71044921875, 0.75799560546875, 0.8055419921875, 0.85308837890625, 0.900634765625, 0.94818115234375, 0.9957275390625, 1.04327392578125, 1.0908203125, 1.13836669921875, 1.1859130859375, 1.23345947265625, 1.281005859375, 1.32855224609375, 1.3760986328125, 1.42364501953125, 1.47119140625, 1.51873779296875, 1.5662841796875, 1.61383056640625, 1.661376953125, 1.70892333984375, 1.7564697265625, 1.80401611328125, 1.8515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 13.0, 13.0, 6.0, 27.0, 27.0, 24.0, 36.0, 56.0, 71.0, 46.0, 71.0, 67.0, 59.0, 71.0, 68.0, 64.0, 52.0, 40.0, 41.0, 29.0, 18.0, 26.0, 11.0, 10.0, 5.0, 5.0, 7.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.78271484375, -0.7592391967773438, -0.7357635498046875, -0.7122879028320312, -0.688812255859375, -0.6653366088867188, -0.6418609619140625, -0.6183853149414062, -0.59490966796875, -0.5714340209960938, -0.5479583740234375, -0.5244827270507812, -0.501007080078125, -0.47753143310546875, -0.4540557861328125, -0.43058013916015625, -0.4071044921875, -0.38362884521484375, -0.3601531982421875, -0.33667755126953125, -0.313201904296875, -0.28972625732421875, -0.2662506103515625, -0.24277496337890625, -0.21929931640625, -0.19582366943359375, -0.1723480224609375, -0.14887237548828125, -0.125396728515625, -0.10192108154296875, -0.0784454345703125, -0.05496978759765625, -0.031494140625, -0.00801849365234375, 0.0154571533203125, 0.03893280029296875, 0.062408447265625, 0.08588409423828125, 0.1093597412109375, 0.13283538818359375, 0.15631103515625, 0.17978668212890625, 0.2032623291015625, 0.22673797607421875, 0.250213623046875, 0.27368927001953125, 0.2971649169921875, 0.32064056396484375, 0.3441162109375, 0.36759185791015625, 0.3910675048828125, 0.41454315185546875, 0.438018798828125, 0.46149444580078125, 0.4849700927734375, 0.5084457397460938, 0.53192138671875, 0.5553970336914062, 0.5788726806640625, 0.6023483276367188, 0.625823974609375, 0.6492996215820312, 0.6727752685546875, 0.6962509155273438, 0.7197265625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 3.0, 13.0, 9.0, 14.0, 17.0, 43.0, 84.0, 159.0, 266.0, 558.0, 1703.0, 7048.0, 74586.0, 3858036.0, 234675.0, 13136.0, 2444.0, 787.0, 345.0, 144.0, 81.0, 53.0, 28.0, 23.0, 14.0, 11.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2225494384765625, -1.157012939453125, -1.0914764404296875, -1.02593994140625, -0.9604034423828125, -0.894866943359375, -0.8293304443359375, -0.7637939453125, -0.6982574462890625, -0.632720947265625, -0.5671844482421875, -0.50164794921875, -0.4361114501953125, -0.370574951171875, -0.3050384521484375, -0.239501953125, -0.1739654541015625, -0.108428955078125, -0.0428924560546875, 0.02264404296875, 0.0881805419921875, 0.153717041015625, 0.2192535400390625, 0.2847900390625, 0.3503265380859375, 0.415863037109375, 0.4813995361328125, 0.54693603515625, 0.6124725341796875, 0.678009033203125, 0.7435455322265625, 0.80908203125, 0.8746185302734375, 0.940155029296875, 1.0056915283203125, 1.07122802734375, 1.1367645263671875, 1.202301025390625, 1.2678375244140625, 1.3333740234375, 1.3989105224609375, 1.464447021484375, 1.5299835205078125, 1.59552001953125, 1.6610565185546875, 1.726593017578125, 1.7921295166015625, 1.857666015625, 1.9232025146484375, 1.988739013671875, 2.0542755126953125, 2.11981201171875, 2.1853485107421875, 2.250885009765625, 2.3164215087890625, 2.3819580078125, 2.4474945068359375, 2.513031005859375, 2.5785675048828125, 2.64410400390625, 2.7096405029296875, 2.775177001953125, 2.8407135009765625, 2.90625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 6.0, 18.0, 16.0, 27.0, 50.0, 60.0, 97.0, 174.0, 352.0, 776.0, 1188.0, 649.0, 292.0, 146.0, 85.0, 49.0, 28.0, 21.0, 14.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.400390625, -0.3867378234863281, -0.37308502197265625, -0.3594322204589844, -0.3457794189453125, -0.3321266174316406, -0.31847381591796875, -0.3048210144042969, -0.291168212890625, -0.2775154113769531, -0.26386260986328125, -0.2502098083496094, -0.2365570068359375, -0.22290420532226562, -0.20925140380859375, -0.19559860229492188, -0.18194580078125, -0.16829299926757812, -0.15464019775390625, -0.14098739624023438, -0.1273345947265625, -0.11368179321289062, -0.10002899169921875, -0.08637619018554688, -0.072723388671875, -0.059070587158203125, -0.04541778564453125, -0.031764984130859375, -0.0181121826171875, -0.004459381103515625, 0.00919342041015625, 0.022846221923828125, 0.0364990234375, 0.050151824951171875, 0.06380462646484375, 0.07745742797851562, 0.0911102294921875, 0.10476303100585938, 0.11841583251953125, 0.13206863403320312, 0.145721435546875, 0.15937423706054688, 0.17302703857421875, 0.18667984008789062, 0.2003326416015625, 0.21398544311523438, 0.22763824462890625, 0.24129104614257812, 0.25494384765625, 0.2685966491699219, 0.28224945068359375, 0.2959022521972656, 0.3095550537109375, 0.3232078552246094, 0.33686065673828125, 0.3505134582519531, 0.364166259765625, 0.3778190612792969, 0.39147186279296875, 0.4051246643066406, 0.4187774658203125, 0.4324302673339844, 0.44608306884765625, 0.4597358703613281, 0.473388671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 11.0, 11.0, 38.0, 80.0, 129.0, 177.0, 207.0, 151.0, 93.0, 58.0, 21.0, 14.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4264402389526367, -1.3439805507659912, -1.2615208625793457, -1.1790610551834106, -1.0966013669967651, -1.0141416788101196, -0.9316819310188293, -0.8492221832275391, -0.7667624950408936, -0.684302806854248, -0.6018430590629578, -0.5193833112716675, -0.436923623085022, -0.3544639050960541, -0.2720041871070862, -0.1895444393157959, -0.10708475112915039, -0.024625033140182495, 0.0578346848487854, 0.1402944028377533, 0.2227541208267212, 0.3052138388156891, 0.387673556804657, 0.47013330459594727, 0.5525929927825928, 0.6350526809692383, 0.7175124287605286, 0.7999721765518188, 0.8824318647384644, 0.9648915529251099, 1.047351360321045, 1.1298110485076904, 1.212270736694336, 1.2947304248809814, 1.377190113067627, 1.459649920463562, 1.5421096086502075, 1.624569296836853, 1.707029104232788, 1.7894887924194336, 1.871948480606079, 1.9544081687927246, 2.03686785697937, 2.1193275451660156, 2.2017874717712402, 2.2842471599578857, 2.3667068481445312, 2.4491665363311768, 2.5316262245178223, 2.6140859127044678, 2.6965456008911133, 2.779005289077759, 2.8614649772644043, 2.943924903869629, 3.0263845920562744, 3.10884428024292, 3.1913039684295654, 3.273763656616211, 3.3562233448028564, 3.438683032989502, 3.5211429595947266, 3.603602647781372, 3.6860623359680176, 3.768522024154663, 3.8509817123413086]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 3.0, 5.0, 5.0, 11.0, 4.0, 9.0, 14.0, 17.0, 17.0, 16.0, 27.0, 21.0, 31.0, 43.0, 33.0, 30.0, 32.0, 37.0, 50.0, 48.0, 49.0, 40.0, 51.0, 52.0, 44.0, 40.0, 38.0, 37.0, 43.0, 24.0, 21.0, 20.0, 13.0, 15.0, 10.0, 11.0, 10.0, 10.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7144700288772583, -0.6918906569480896, -0.6693112850189209, -0.6467319130897522, -0.6241525411605835, -0.6015731692314148, -0.5789937973022461, -0.5564144849777222, -0.5338350534439087, -0.51125568151474, -0.4886763095855713, -0.4660969376564026, -0.4435175657272339, -0.4209381937980652, -0.39835885167121887, -0.37577947974205017, -0.35320013761520386, -0.33062076568603516, -0.30804139375686646, -0.28546202182769775, -0.26288264989852905, -0.24030329287052155, -0.21772393584251404, -0.19514456391334534, -0.17256519198417664, -0.14998582005500793, -0.12740644812583923, -0.10482709109783173, -0.08224771916866302, -0.059668347239494324, -0.037088990211486816, -0.014509618282318115, 0.008069813251495361, 0.030649181455373764, 0.05322854965925217, 0.07580791413784027, 0.09838728606700897, 0.12096665799617767, 0.14354601502418518, 0.16612538695335388, 0.18870475888252258, 0.21128413081169128, 0.23386350274085999, 0.2564428448677063, 0.279022216796875, 0.3016015887260437, 0.3241809606552124, 0.3467603325843811, 0.3693397045135498, 0.3919190764427185, 0.4144984483718872, 0.4370778203010559, 0.4596571922302246, 0.4822365641593933, 0.504815936088562, 0.5273952484130859, 0.5499746799468994, 0.5725540518760681, 0.5951334238052368, 0.6177127957344055, 0.6402921676635742, 0.6628715395927429, 0.6854509115219116, 0.7080302238464355, 0.7306095957756042]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 16.0, 19.0, 17.0, 21.0, 40.0, 66.0, 85.0, 107.0, 172.0, 281.0, 414.0, 624.0, 985.0, 1564.0, 2687.0, 5022.0, 10425.0, 34752.0, 298987.0, 594305.0, 67513.0, 15316.0, 6451.0, 3333.0, 1947.0, 1190.0, 748.0, 467.0, 295.0, 201.0, 156.0, 82.0, 70.0, 61.0, 42.0, 18.0, 15.0, 19.0, 9.0, 3.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.30517578125, -0.2959785461425781, -0.28678131103515625, -0.2775840759277344, -0.2683868408203125, -0.2591896057128906, -0.24999237060546875, -0.24079513549804688, -0.231597900390625, -0.22240066528320312, -0.21320343017578125, -0.20400619506835938, -0.1948089599609375, -0.18561172485351562, -0.17641448974609375, -0.16721725463867188, -0.15802001953125, -0.14882278442382812, -0.13962554931640625, -0.13042831420898438, -0.1212310791015625, -0.11203384399414062, -0.10283660888671875, -0.09363937377929688, -0.084442138671875, -0.07524490356445312, -0.06604766845703125, -0.056850433349609375, -0.0476531982421875, -0.038455963134765625, -0.02925872802734375, -0.020061492919921875, -0.0108642578125, -0.001667022705078125, 0.00753021240234375, 0.016727447509765625, 0.0259246826171875, 0.035121917724609375, 0.04431915283203125, 0.053516387939453125, 0.062713623046875, 0.07191085815429688, 0.08110809326171875, 0.09030532836914062, 0.0995025634765625, 0.10869979858398438, 0.11789703369140625, 0.12709426879882812, 0.13629150390625, 0.14548873901367188, 0.15468597412109375, 0.16388320922851562, 0.1730804443359375, 0.18227767944335938, 0.19147491455078125, 0.20067214965820312, 0.209869384765625, 0.21906661987304688, 0.22826385498046875, 0.23746109008789062, 0.2466583251953125, 0.2558555603027344, 0.26505279541015625, 0.2742500305175781, 0.283447265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 3.0, 2.0, 7.0, 7.0, 7.0, 10.0, 14.0, 17.0, 22.0, 24.0, 26.0, 26.0, 40.0, 29.0, 33.0, 36.0, 40.0, 51.0, 54.0, 52.0, 48.0, 40.0, 46.0, 42.0, 51.0, 58.0, 33.0, 36.0, 26.0, 23.0, 13.0, 15.0, 14.0, 8.0, 10.0, 4.0, 6.0, 9.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.611328125, -0.5941925048828125, -0.577056884765625, -0.5599212646484375, -0.54278564453125, -0.5256500244140625, -0.508514404296875, -0.4913787841796875, -0.4742431640625, -0.4571075439453125, -0.439971923828125, -0.4228363037109375, -0.40570068359375, -0.3885650634765625, -0.371429443359375, -0.3542938232421875, -0.337158203125, -0.3200225830078125, -0.302886962890625, -0.2857513427734375, -0.26861572265625, -0.2514801025390625, -0.234344482421875, -0.2172088623046875, -0.2000732421875, -0.1829376220703125, -0.165802001953125, -0.1486663818359375, -0.13153076171875, -0.1143951416015625, -0.097259521484375, -0.0801239013671875, -0.06298828125, -0.0458526611328125, -0.028717041015625, -0.0115814208984375, 0.00555419921875, 0.0226898193359375, 0.039825439453125, 0.0569610595703125, 0.0740966796875, 0.0912322998046875, 0.108367919921875, 0.1255035400390625, 0.14263916015625, 0.1597747802734375, 0.176910400390625, 0.1940460205078125, 0.211181640625, 0.2283172607421875, 0.245452880859375, 0.2625885009765625, 0.27972412109375, 0.2968597412109375, 0.313995361328125, 0.3311309814453125, 0.3482666015625, 0.3654022216796875, 0.382537841796875, 0.3996734619140625, 0.41680908203125, 0.4339447021484375, 0.451080322265625, 0.4682159423828125, 0.4853515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 11.0, 17.0, 11.0, 16.0, 19.0, 36.0, 45.0, 71.0, 125.0, 189.0, 345.0, 667.0, 1508.0, 3936.0, 14322.0, 158866.0, 794929.0, 59325.0, 8937.0, 2790.0, 1097.0, 555.0, 261.0, 142.0, 118.0, 56.0, 41.0, 30.0, 16.0, 12.0, 12.0, 8.0, 7.0, 2.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33740234375, -0.3269691467285156, -0.31653594970703125, -0.3061027526855469, -0.2956695556640625, -0.2852363586425781, -0.27480316162109375, -0.2643699645996094, -0.253936767578125, -0.24350357055664062, -0.23307037353515625, -0.22263717651367188, -0.2122039794921875, -0.20177078247070312, -0.19133758544921875, -0.18090438842773438, -0.17047119140625, -0.16003799438476562, -0.14960479736328125, -0.13917160034179688, -0.1287384033203125, -0.11830520629882812, -0.10787200927734375, -0.09743881225585938, -0.087005615234375, -0.07657241821289062, -0.06613922119140625, -0.055706024169921875, -0.0452728271484375, -0.034839630126953125, -0.02440643310546875, -0.013973236083984375, -0.0035400390625, 0.006893157958984375, 0.01732635498046875, 0.027759552001953125, 0.0381927490234375, 0.048625946044921875, 0.05905914306640625, 0.06949234008789062, 0.079925537109375, 0.09035873413085938, 0.10079193115234375, 0.11122512817382812, 0.1216583251953125, 0.13209152221679688, 0.14252471923828125, 0.15295791625976562, 0.16339111328125, 0.17382431030273438, 0.18425750732421875, 0.19469070434570312, 0.2051239013671875, 0.21555709838867188, 0.22599029541015625, 0.23642349243164062, 0.246856689453125, 0.2572898864746094, 0.26772308349609375, 0.2781562805175781, 0.2885894775390625, 0.2990226745605469, 0.30945587158203125, 0.3198890686035156, 0.330322265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 5.0, 9.0, 9.0, 8.0, 10.0, 12.0, 25.0, 17.0, 19.0, 17.0, 29.0, 30.0, 24.0, 41.0, 41.0, 34.0, 38.0, 51.0, 50.0, 56.0, 34.0, 63.0, 39.0, 38.0, 26.0, 39.0, 31.0, 35.0, 26.0, 23.0, 14.0, 23.0, 15.0, 10.0, 9.0, 7.0, 8.0, 6.0, 6.0, 6.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0458984375, -1.01385498046875, -0.9818115234375, -0.94976806640625, -0.917724609375, -0.88568115234375, -0.8536376953125, -0.82159423828125, -0.78955078125, -0.75750732421875, -0.7254638671875, -0.69342041015625, -0.661376953125, -0.62933349609375, -0.5972900390625, -0.56524658203125, -0.533203125, -0.50115966796875, -0.4691162109375, -0.43707275390625, -0.405029296875, -0.37298583984375, -0.3409423828125, -0.30889892578125, -0.27685546875, -0.24481201171875, -0.2127685546875, -0.18072509765625, -0.148681640625, -0.11663818359375, -0.0845947265625, -0.05255126953125, -0.0205078125, 0.01153564453125, 0.0435791015625, 0.07562255859375, 0.107666015625, 0.13970947265625, 0.1717529296875, 0.20379638671875, 0.23583984375, 0.26788330078125, 0.2999267578125, 0.33197021484375, 0.364013671875, 0.39605712890625, 0.4281005859375, 0.46014404296875, 0.4921875, 0.52423095703125, 0.5562744140625, 0.58831787109375, 0.620361328125, 0.65240478515625, 0.6844482421875, 0.71649169921875, 0.74853515625, 0.78057861328125, 0.8126220703125, 0.84466552734375, 0.876708984375, 0.90875244140625, 0.9407958984375, 0.97283935546875, 1.0048828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 3.0, 7.0, 5.0, 14.0, 20.0, 36.0, 45.0, 79.0, 109.0, 167.0, 251.0, 396.0, 756.0, 1376.0, 2820.0, 6635.0, 22375.0, 129057.0, 692757.0, 152655.0, 25026.0, 7501.0, 3002.0, 1507.0, 781.0, 427.0, 263.0, 150.0, 118.0, 67.0, 44.0, 25.0, 17.0, 23.0, 11.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08673095703125, -0.0842905044555664, -0.08185005187988281, -0.07940959930419922, -0.07696914672851562, -0.07452869415283203, -0.07208824157714844, -0.06964778900146484, -0.06720733642578125, -0.06476688385009766, -0.06232643127441406, -0.05988597869873047, -0.057445526123046875, -0.05500507354736328, -0.05256462097167969, -0.050124168395996094, -0.0476837158203125, -0.045243263244628906, -0.04280281066894531, -0.04036235809326172, -0.037921905517578125, -0.03548145294189453, -0.03304100036621094, -0.030600547790527344, -0.02816009521484375, -0.025719642639160156, -0.023279190063476562, -0.02083873748779297, -0.018398284912109375, -0.01595783233642578, -0.013517379760742188, -0.011076927185058594, -0.008636474609375, -0.006196022033691406, -0.0037555694580078125, -0.0013151168823242188, 0.001125335693359375, 0.0035657882690429688, 0.0060062408447265625, 0.008446693420410156, 0.01088714599609375, 0.013327598571777344, 0.015768051147460938, 0.01820850372314453, 0.020648956298828125, 0.02308940887451172, 0.025529861450195312, 0.027970314025878906, 0.0304107666015625, 0.032851219177246094, 0.03529167175292969, 0.03773212432861328, 0.040172576904296875, 0.04261302947998047, 0.04505348205566406, 0.047493934631347656, 0.04993438720703125, 0.052374839782714844, 0.05481529235839844, 0.05725574493408203, 0.059696197509765625, 0.06213665008544922, 0.06457710266113281, 0.0670175552368164, 0.0694580078125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 4.0, 8.0, 4.0, 9.0, 14.0, 21.0, 30.0, 33.0, 57.0, 89.0, 102.0, 130.0, 124.0, 103.0, 70.0, 73.0, 34.0, 29.0, 18.0, 13.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.798173904418945e-05, -4.652794450521469e-05, -4.507414996623993e-05, -4.362035542726517e-05, -4.2166560888290405e-05, -4.071276634931564e-05, -3.925897181034088e-05, -3.780517727136612e-05, -3.635138273239136e-05, -3.4897588193416595e-05, -3.3443793654441833e-05, -3.198999911546707e-05, -3.053620457649231e-05, -2.9082410037517548e-05, -2.7628615498542786e-05, -2.6174820959568024e-05, -2.4721026420593262e-05, -2.32672318816185e-05, -2.1813437342643738e-05, -2.0359642803668976e-05, -1.8905848264694214e-05, -1.7452053725719452e-05, -1.599825918674469e-05, -1.4544464647769928e-05, -1.3090670108795166e-05, -1.1636875569820404e-05, -1.0183081030845642e-05, -8.72928649187088e-06, -7.275491952896118e-06, -5.821697413921356e-06, -4.367902874946594e-06, -2.9141083359718323e-06, -1.4603137969970703e-06, -6.51925802230835e-09, 1.4472752809524536e-06, 2.9010698199272156e-06, 4.3548643589019775e-06, 5.8086588978767395e-06, 7.2624534368515015e-06, 8.716247975826263e-06, 1.0170042514801025e-05, 1.1623837053775787e-05, 1.307763159275055e-05, 1.4531426131725311e-05, 1.5985220670700073e-05, 1.7439015209674835e-05, 1.8892809748649597e-05, 2.034660428762436e-05, 2.180039882659912e-05, 2.3254193365573883e-05, 2.4707987904548645e-05, 2.6161782443523407e-05, 2.761557698249817e-05, 2.906937152147293e-05, 3.052316606044769e-05, 3.1976960599422455e-05, 3.343075513839722e-05, 3.488454967737198e-05, 3.633834421634674e-05, 3.77921387553215e-05, 3.9245933294296265e-05, 4.0699727833271027e-05, 4.215352237224579e-05, 4.360731691122055e-05, 4.506111145019531e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 7.0, 10.0, 7.0, 13.0, 18.0, 25.0, 43.0, 60.0, 97.0, 188.0, 300.0, 504.0, 825.0, 1535.0, 2837.0, 6017.0, 15584.0, 57284.0, 337379.0, 506911.0, 83533.0, 20445.0, 7396.0, 3319.0, 1804.0, 920.0, 590.0, 353.0, 218.0, 126.0, 77.0, 47.0, 22.0, 19.0, 11.0, 5.0, 6.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07867431640625, -0.07614612579345703, -0.07361793518066406, -0.0710897445678711, -0.06856155395507812, -0.06603336334228516, -0.06350517272949219, -0.06097698211669922, -0.05844879150390625, -0.05592060089111328, -0.05339241027832031, -0.050864219665527344, -0.048336029052734375, -0.045807838439941406, -0.04327964782714844, -0.04075145721435547, -0.0382232666015625, -0.03569507598876953, -0.03316688537597656, -0.030638694763183594, -0.028110504150390625, -0.025582313537597656, -0.023054122924804688, -0.02052593231201172, -0.01799774169921875, -0.015469551086425781, -0.012941360473632812, -0.010413169860839844, -0.007884979248046875, -0.005356788635253906, -0.0028285980224609375, -0.00030040740966796875, 0.002227783203125, 0.004755973815917969, 0.0072841644287109375, 0.009812355041503906, 0.012340545654296875, 0.014868736267089844, 0.017396926879882812, 0.01992511749267578, 0.02245330810546875, 0.02498149871826172, 0.027509689331054688, 0.030037879943847656, 0.032566070556640625, 0.035094261169433594, 0.03762245178222656, 0.04015064239501953, 0.0426788330078125, 0.04520702362060547, 0.04773521423339844, 0.050263404846191406, 0.052791595458984375, 0.055319786071777344, 0.05784797668457031, 0.06037616729736328, 0.06290435791015625, 0.06543254852294922, 0.06796073913574219, 0.07048892974853516, 0.07301712036132812, 0.0755453109741211, 0.07807350158691406, 0.08060169219970703, 0.0831298828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 8.0, 10.0, 13.0, 12.0, 18.0, 34.0, 40.0, 48.0, 71.0, 122.0, 150.0, 127.0, 97.0, 73.0, 63.0, 28.0, 19.0, 14.0, 10.0, 12.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.02764892578125, -0.02689814567565918, -0.02614736557006836, -0.02539658546447754, -0.02464580535888672, -0.0238950252532959, -0.023144245147705078, -0.022393465042114258, -0.021642684936523438, -0.020891904830932617, -0.020141124725341797, -0.019390344619750977, -0.018639564514160156, -0.017888784408569336, -0.017138004302978516, -0.016387224197387695, -0.015636444091796875, -0.014885663986206055, -0.014134883880615234, -0.013384103775024414, -0.012633323669433594, -0.011882543563842773, -0.011131763458251953, -0.010380983352661133, -0.009630203247070312, -0.008879423141479492, -0.008128643035888672, -0.0073778629302978516, -0.006627082824707031, -0.005876302719116211, -0.005125522613525391, -0.00437474250793457, -0.00362396240234375, -0.0028731822967529297, -0.0021224021911621094, -0.001371622085571289, -0.0006208419799804688, 0.00012993812561035156, 0.0008807182312011719, 0.0016314983367919922, 0.0023822784423828125, 0.003133058547973633, 0.003883838653564453, 0.0046346187591552734, 0.005385398864746094, 0.006136178970336914, 0.006886959075927734, 0.007637739181518555, 0.008388519287109375, 0.009139299392700195, 0.009890079498291016, 0.010640859603881836, 0.011391639709472656, 0.012142419815063477, 0.012893199920654297, 0.013643980026245117, 0.014394760131835938, 0.015145540237426758, 0.015896320343017578, 0.0166471004486084, 0.01739788055419922, 0.01814866065979004, 0.01889944076538086, 0.01965022087097168, 0.0204010009765625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 10.0, 16.0, 25.0, 76.0, 107.0, 162.0, 186.0, 170.0, 96.0, 70.0, 38.0, 13.0, 13.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2247660160064697, -1.1726794242858887, -1.1205928325653076, -1.0685062408447266, -1.016419768333435, -0.964333176612854, -0.912246584892273, -0.8601599931716919, -0.8080734610557556, -0.7559868693351746, -0.7039003372192383, -0.6518137454986572, -0.5997271537780762, -0.5476406216621399, -0.49555402994155884, -0.44346746802330017, -0.3913809061050415, -0.33929434418678284, -0.28720778226852417, -0.23512119054794312, -0.18303462862968445, -0.13094806671142578, -0.07886147499084473, -0.02677491307258606, 0.025311648845672607, 0.07739821821451187, 0.12948478758335114, 0.181571364402771, 0.23365792632102966, 0.28574448823928833, 0.3378310799598694, 0.38991764187812805, 0.4420042037963867, 0.4940907657146454, 0.546177327632904, 0.5982639193534851, 0.6503504514694214, 0.7024370431900024, 0.7545236349105835, 0.8066102266311646, 0.8586967587471008, 0.9107833504676819, 0.9628698825836182, 1.0149564743041992, 1.0670430660247803, 1.1191296577453613, 1.1712162494659424, 1.2233027219772339, 1.275389313697815, 1.327475905418396, 1.379562497138977, 1.4316489696502686, 1.4837355613708496, 1.5358221530914307, 1.5879087448120117, 1.6399953365325928, 1.6920819282531738, 1.7441685199737549, 1.796255111694336, 1.848341703414917, 1.9004281759262085, 1.9525147676467896, 2.00460147857666, 2.056687831878662, 2.108774423599243]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 4.0, 7.0, 6.0, 6.0, 11.0, 9.0, 18.0, 17.0, 15.0, 16.0, 29.0, 32.0, 37.0, 36.0, 35.0, 26.0, 46.0, 45.0, 52.0, 42.0, 56.0, 39.0, 51.0, 40.0, 52.0, 49.0, 36.0, 36.0, 21.0, 22.0, 21.0, 11.0, 12.0, 6.0, 8.0, 13.0, 6.0, 6.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.5206981897354126, -0.5047340393066406, -0.48876985907554626, -0.4728056788444519, -0.45684152841567993, -0.44087734818458557, -0.4249131679534912, -0.40894901752471924, -0.39298486709594727, -0.3770206868648529, -0.36105653643608093, -0.3450923562049866, -0.3291282057762146, -0.31316402554512024, -0.2971998453140259, -0.2812356948852539, -0.26527151465415955, -0.24930734932422638, -0.2333431839942932, -0.21737900376319885, -0.20141485333442688, -0.18545067310333252, -0.16948650777339935, -0.1535223424434662, -0.13755817711353302, -0.12159401178359985, -0.10562984645366669, -0.08966567367315292, -0.07370150834321976, -0.05773734301328659, -0.04177317023277283, -0.02580900490283966, -0.009844839572906494, 0.006119327619671822, 0.022083494812250137, 0.0380476638674736, 0.05401182919740677, 0.06997599452733994, 0.0859401673078537, 0.10190433263778687, 0.11786849796772003, 0.1338326632976532, 0.14979682862758636, 0.16576099395751953, 0.1817251741886139, 0.19768932461738586, 0.21365350484848022, 0.2296176701784134, 0.24558183550834656, 0.2615460157394409, 0.2775101661682129, 0.29347434639930725, 0.3094384968280792, 0.3254026770591736, 0.34136682748794556, 0.3573310077190399, 0.3732951879501343, 0.38925936818122864, 0.4052235186100006, 0.42118769884109497, 0.43715184926986694, 0.4531160295009613, 0.46908020973205566, 0.48504436016082764, 0.5010085105895996]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 9.0, 10.0, 14.0, 35.0, 47.0, 80.0, 147.0, 187.0, 302.0, 524.0, 986.0, 1900.0, 3935.0, 9171.0, 26073.0, 117000.0, 699176.0, 140680.0, 29624.0, 9972.0, 4225.0, 2000.0, 996.0, 586.0, 353.0, 202.0, 135.0, 66.0, 43.0, 27.0, 13.0, 13.0, 7.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63916015625, -0.6131210327148438, -0.5870819091796875, -0.5610427856445312, -0.535003662109375, -0.5089645385742188, -0.4829254150390625, -0.45688629150390625, -0.43084716796875, -0.40480804443359375, -0.3787689208984375, -0.35272979736328125, -0.326690673828125, -0.30065155029296875, -0.2746124267578125, -0.24857330322265625, -0.2225341796875, -0.19649505615234375, -0.1704559326171875, -0.14441680908203125, -0.118377685546875, -0.09233856201171875, -0.0662994384765625, -0.04026031494140625, -0.01422119140625, 0.01181793212890625, 0.0378570556640625, 0.06389617919921875, 0.089935302734375, 0.11597442626953125, 0.1420135498046875, 0.16805267333984375, 0.194091796875, 0.22013092041015625, 0.2461700439453125, 0.27220916748046875, 0.298248291015625, 0.32428741455078125, 0.3503265380859375, 0.37636566162109375, 0.40240478515625, 0.42844390869140625, 0.4544830322265625, 0.48052215576171875, 0.506561279296875, 0.5326004028320312, 0.5586395263671875, 0.5846786499023438, 0.6107177734375, 0.6367568969726562, 0.6627960205078125, 0.6888351440429688, 0.714874267578125, 0.7409133911132812, 0.7669525146484375, 0.7929916381835938, 0.81903076171875, 0.8450698852539062, 0.8711090087890625, 0.8971481323242188, 0.923187255859375, 0.9492263793945312, 0.9752655029296875, 1.0013046264648438, 1.02734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 6.0, 12.0, 8.0, 9.0, 13.0, 20.0, 27.0, 32.0, 31.0, 34.0, 38.0, 37.0, 45.0, 50.0, 43.0, 53.0, 61.0, 55.0, 57.0, 54.0, 46.0, 44.0, 34.0, 32.0, 22.0, 30.0, 20.0, 16.0, 13.0, 4.0, 9.0, 8.0, 5.0, 4.0, 5.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0146484375, -0.9809722900390625, -0.947296142578125, -0.9136199951171875, -0.87994384765625, -0.8462677001953125, -0.812591552734375, -0.7789154052734375, -0.7452392578125, -0.7115631103515625, -0.677886962890625, -0.6442108154296875, -0.61053466796875, -0.5768585205078125, -0.543182373046875, -0.5095062255859375, -0.475830078125, -0.4421539306640625, -0.408477783203125, -0.3748016357421875, -0.34112548828125, -0.3074493408203125, -0.273773193359375, -0.2400970458984375, -0.2064208984375, -0.1727447509765625, -0.139068603515625, -0.1053924560546875, -0.07171630859375, -0.0380401611328125, -0.004364013671875, 0.0293121337890625, 0.06298828125, 0.0966644287109375, 0.130340576171875, 0.1640167236328125, 0.19769287109375, 0.2313690185546875, 0.265045166015625, 0.2987213134765625, 0.3323974609375, 0.3660736083984375, 0.399749755859375, 0.4334259033203125, 0.46710205078125, 0.5007781982421875, 0.534454345703125, 0.5681304931640625, 0.601806640625, 0.6354827880859375, 0.669158935546875, 0.7028350830078125, 0.73651123046875, 0.7701873779296875, 0.803863525390625, 0.8375396728515625, 0.8712158203125, 0.9048919677734375, 0.938568115234375, 0.9722442626953125, 1.00592041015625, 1.0395965576171875, 1.073272705078125, 1.1069488525390625, 1.140625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 10.0, 7.0, 11.0, 16.0, 19.0, 21.0, 23.0, 40.0, 53.0, 65.0, 78.0, 149.0, 423.0, 1781.0, 21261.0, 935318.0, 83949.0, 4088.0, 629.0, 227.0, 98.0, 58.0, 48.0, 28.0, 22.0, 27.0, 17.0, 16.0, 13.0, 10.0, 5.0, 7.0, 11.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3046875, -2.23419189453125, -2.1636962890625, -2.09320068359375, -2.022705078125, -1.95220947265625, -1.8817138671875, -1.81121826171875, -1.74072265625, -1.67022705078125, -1.5997314453125, -1.52923583984375, -1.458740234375, -1.38824462890625, -1.3177490234375, -1.24725341796875, -1.1767578125, -1.10626220703125, -1.0357666015625, -0.96527099609375, -0.894775390625, -0.82427978515625, -0.7537841796875, -0.68328857421875, -0.61279296875, -0.54229736328125, -0.4718017578125, -0.40130615234375, -0.330810546875, -0.26031494140625, -0.1898193359375, -0.11932373046875, -0.048828125, 0.02166748046875, 0.0921630859375, 0.16265869140625, 0.233154296875, 0.30364990234375, 0.3741455078125, 0.44464111328125, 0.51513671875, 0.58563232421875, 0.6561279296875, 0.72662353515625, 0.797119140625, 0.86761474609375, 0.9381103515625, 1.00860595703125, 1.0791015625, 1.14959716796875, 1.2200927734375, 1.29058837890625, 1.361083984375, 1.43157958984375, 1.5020751953125, 1.57257080078125, 1.64306640625, 1.71356201171875, 1.7840576171875, 1.85455322265625, 1.925048828125, 1.99554443359375, 2.0660400390625, 2.13653564453125, 2.20703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 4.0, 10.0, 11.0, 7.0, 12.0, 9.0, 34.0, 19.0, 26.0, 33.0, 36.0, 36.0, 38.0, 30.0, 43.0, 44.0, 42.0, 57.0, 47.0, 50.0, 44.0, 44.0, 39.0, 42.0, 27.0, 21.0, 23.0, 24.0, 18.0, 17.0, 23.0, 14.0, 16.0, 10.0, 11.0, 8.0, 5.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.177734375, -1.14117431640625, -1.1046142578125, -1.06805419921875, -1.031494140625, -0.99493408203125, -0.9583740234375, -0.92181396484375, -0.88525390625, -0.84869384765625, -0.8121337890625, -0.77557373046875, -0.739013671875, -0.70245361328125, -0.6658935546875, -0.62933349609375, -0.5927734375, -0.55621337890625, -0.5196533203125, -0.48309326171875, -0.446533203125, -0.40997314453125, -0.3734130859375, -0.33685302734375, -0.30029296875, -0.26373291015625, -0.2271728515625, -0.19061279296875, -0.154052734375, -0.11749267578125, -0.0809326171875, -0.04437255859375, -0.0078125, 0.02874755859375, 0.0653076171875, 0.10186767578125, 0.138427734375, 0.17498779296875, 0.2115478515625, 0.24810791015625, 0.28466796875, 0.32122802734375, 0.3577880859375, 0.39434814453125, 0.430908203125, 0.46746826171875, 0.5040283203125, 0.54058837890625, 0.5771484375, 0.61370849609375, 0.6502685546875, 0.68682861328125, 0.723388671875, 0.75994873046875, 0.7965087890625, 0.83306884765625, 0.86962890625, 0.90618896484375, 0.9427490234375, 0.97930908203125, 1.015869140625, 1.05242919921875, 1.0889892578125, 1.12554931640625, 1.162109375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 6.0, 4.0, 8.0, 5.0, 12.0, 18.0, 7.0, 14.0, 24.0, 31.0, 47.0, 64.0, 98.0, 182.0, 282.0, 486.0, 1026.0, 2503.0, 7864.0, 29184.0, 132647.0, 677302.0, 150705.0, 32099.0, 8647.0, 2767.0, 1099.0, 573.0, 301.0, 165.0, 105.0, 71.0, 48.0, 41.0, 30.0, 19.0, 14.0, 10.0, 12.0, 7.0, 4.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.181396484375, -0.17582130432128906, -0.17024612426757812, -0.1646709442138672, -0.15909576416015625, -0.1535205841064453, -0.14794540405273438, -0.14237022399902344, -0.1367950439453125, -0.13121986389160156, -0.12564468383789062, -0.12006950378417969, -0.11449432373046875, -0.10891914367675781, -0.10334396362304688, -0.09776878356933594, -0.092193603515625, -0.08661842346191406, -0.08104324340820312, -0.07546806335449219, -0.06989288330078125, -0.06431770324707031, -0.058742523193359375, -0.05316734313964844, -0.0475921630859375, -0.04201698303222656, -0.036441802978515625, -0.030866622924804688, -0.02529144287109375, -0.019716262817382812, -0.014141082763671875, -0.008565902709960938, -0.00299072265625, 0.0025844573974609375, 0.008159637451171875, 0.013734817504882812, 0.01930999755859375, 0.024885177612304688, 0.030460357666015625, 0.03603553771972656, 0.0416107177734375, 0.04718589782714844, 0.052761077880859375, 0.05833625793457031, 0.06391143798828125, 0.06948661804199219, 0.07506179809570312, 0.08063697814941406, 0.086212158203125, 0.09178733825683594, 0.09736251831054688, 0.10293769836425781, 0.10851287841796875, 0.11408805847167969, 0.11966323852539062, 0.12523841857910156, 0.1308135986328125, 0.13638877868652344, 0.14196395874023438, 0.1475391387939453, 0.15311431884765625, 0.1586894989013672, 0.16426467895507812, 0.16983985900878906, 0.1754150390625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 5.0, 12.0, 10.0, 15.0, 19.0, 30.0, 30.0, 49.0, 72.0, 101.0, 151.0, 161.0, 93.0, 72.0, 42.0, 36.0, 20.0, 14.0, 16.0, 9.0, 7.0, 7.0, 7.0, 5.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.57763671875e-05, -4.468858242034912e-05, -4.360079765319824e-05, -4.251301288604736e-05, -4.1425228118896484e-05, -4.0337443351745605e-05, -3.9249658584594727e-05, -3.816187381744385e-05, -3.707408905029297e-05, -3.598630428314209e-05, -3.489851951599121e-05, -3.381073474884033e-05, -3.272294998168945e-05, -3.1635165214538574e-05, -3.0547380447387695e-05, -2.9459595680236816e-05, -2.8371810913085938e-05, -2.728402614593506e-05, -2.619624137878418e-05, -2.51084566116333e-05, -2.4020671844482422e-05, -2.2932887077331543e-05, -2.1845102310180664e-05, -2.0757317543029785e-05, -1.9669532775878906e-05, -1.8581748008728027e-05, -1.749396324157715e-05, -1.640617847442627e-05, -1.531839370727539e-05, -1.4230608940124512e-05, -1.3142824172973633e-05, -1.2055039405822754e-05, -1.0967254638671875e-05, -9.879469871520996e-06, -8.791685104370117e-06, -7.703900337219238e-06, -6.616115570068359e-06, -5.5283308029174805e-06, -4.4405460357666016e-06, -3.3527612686157227e-06, -2.2649765014648438e-06, -1.1771917343139648e-06, -8.940696716308594e-08, 9.98377799987793e-07, 2.086162567138672e-06, 3.1739473342895508e-06, 4.26173210144043e-06, 5.349516868591309e-06, 6.4373016357421875e-06, 7.525086402893066e-06, 8.612871170043945e-06, 9.700655937194824e-06, 1.0788440704345703e-05, 1.1876225471496582e-05, 1.2964010238647461e-05, 1.405179500579834e-05, 1.5139579772949219e-05, 1.6227364540100098e-05, 1.7315149307250977e-05, 1.8402934074401855e-05, 1.9490718841552734e-05, 2.0578503608703613e-05, 2.1666288375854492e-05, 2.275407314300537e-05, 2.384185791015625e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 13.0, 16.0, 19.0, 36.0, 69.0, 141.0, 235.0, 535.0, 1525.0, 4616.0, 20403.0, 147452.0, 762553.0, 91203.0, 14163.0, 3414.0, 1174.0, 499.0, 224.0, 113.0, 63.0, 34.0, 33.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.344482421875, -0.3357372283935547, -0.3269920349121094, -0.31824684143066406, -0.30950164794921875, -0.30075645446777344, -0.2920112609863281, -0.2832660675048828, -0.2745208740234375, -0.2657756805419922, -0.2570304870605469, -0.24828529357910156, -0.23954010009765625, -0.23079490661621094, -0.22204971313476562, -0.2133045196533203, -0.204559326171875, -0.1958141326904297, -0.18706893920898438, -0.17832374572753906, -0.16957855224609375, -0.16083335876464844, -0.15208816528320312, -0.1433429718017578, -0.1345977783203125, -0.1258525848388672, -0.11710739135742188, -0.10836219787597656, -0.09961700439453125, -0.09087181091308594, -0.08212661743164062, -0.07338142395019531, -0.06463623046875, -0.05589103698730469, -0.047145843505859375, -0.03840065002441406, -0.02965545654296875, -0.020910263061523438, -0.012165069580078125, -0.0034198760986328125, 0.0053253173828125, 0.014070510864257812, 0.022815704345703125, 0.03156089782714844, 0.04030609130859375, 0.04905128479003906, 0.057796478271484375, 0.06654167175292969, 0.075286865234375, 0.08403205871582031, 0.09277725219726562, 0.10152244567871094, 0.11026763916015625, 0.11901283264160156, 0.12775802612304688, 0.1365032196044922, 0.1452484130859375, 0.1539936065673828, 0.16273880004882812, 0.17148399353027344, 0.18022918701171875, 0.18897438049316406, 0.19771957397460938, 0.2064647674560547, 0.2152099609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 6.0, 10.0, 7.0, 18.0, 23.0, 23.0, 32.0, 35.0, 37.0, 53.0, 89.0, 144.0, 163.0, 87.0, 67.0, 40.0, 37.0, 28.0, 24.0, 18.0, 10.0, 14.0, 4.0, 9.0, 6.0, 0.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06280517578125, -0.060082435607910156, -0.05735969543457031, -0.05463695526123047, -0.051914215087890625, -0.04919147491455078, -0.04646873474121094, -0.043745994567871094, -0.04102325439453125, -0.038300514221191406, -0.03557777404785156, -0.03285503387451172, -0.030132293701171875, -0.02740955352783203, -0.024686813354492188, -0.021964073181152344, -0.0192413330078125, -0.016518592834472656, -0.013795852661132812, -0.011073112487792969, -0.008350372314453125, -0.005627632141113281, -0.0029048919677734375, -0.00018215179443359375, 0.00254058837890625, 0.005263328552246094, 0.007986068725585938, 0.010708808898925781, 0.013431549072265625, 0.01615428924560547, 0.018877029418945312, 0.021599769592285156, 0.024322509765625, 0.027045249938964844, 0.029767990112304688, 0.03249073028564453, 0.035213470458984375, 0.03793621063232422, 0.04065895080566406, 0.043381690979003906, 0.04610443115234375, 0.048827171325683594, 0.05154991149902344, 0.05427265167236328, 0.056995391845703125, 0.05971813201904297, 0.06244087219238281, 0.06516361236572266, 0.0678863525390625, 0.07060909271240234, 0.07333183288574219, 0.07605457305908203, 0.07877731323242188, 0.08150005340576172, 0.08422279357910156, 0.0869455337524414, 0.08966827392578125, 0.0923910140991211, 0.09511375427246094, 0.09783649444580078, 0.10055923461914062, 0.10328197479248047, 0.10600471496582031, 0.10872745513916016, 0.1114501953125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 13.0, 22.0, 48.0, 91.0, 169.0, 223.0, 198.0, 117.0, 55.0, 34.0, 8.0, 8.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.58935546875, -2.469377040863037, -2.3493988513946533, -2.2294204235076904, -2.1094419956207275, -1.9894636869430542, -1.8694853782653809, -1.749506950378418, -1.6295286417007446, -1.5095503330230713, -1.3895719051361084, -1.269593596458435, -1.1496152877807617, -1.0296368598937988, -0.9096585512161255, -0.7896801829338074, -0.6697018146514893, -0.5497234463691711, -0.4297451078891754, -0.3097667694091797, -0.18978840112686157, -0.06981003284454346, 0.05016827583312988, 0.170146644115448, 0.2901250123977661, 0.41010338068008423, 0.5300817489624023, 0.6500600576400757, 0.7700384259223938, 0.8900167942047119, 1.0099951028823853, 1.1299734115600586, 1.2499518394470215, 1.3699301481246948, 1.4899085760116577, 1.609886884689331, 1.729865312576294, 1.8498436212539673, 1.9698219299316406, 2.0898003578186035, 2.2097787857055664, 2.3297572135925293, 2.449735403060913, 2.569713830947876, 2.689692258834839, 2.8096704483032227, 2.9296488761901855, 3.0496273040771484, 3.1696054935455322, 3.289583921432495, 3.409562110900879, 3.529540538787842, 3.6495189666748047, 3.7694973945617676, 3.8894755840301514, 4.009453773498535, 4.129432201385498, 4.249410629272461, 4.369389057159424, 4.489367485046387, 4.609345436096191, 4.729323863983154, 4.849302291870117, 4.96928071975708, 5.089259147644043]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 7.0, 3.0, 7.0, 4.0, 8.0, 8.0, 11.0, 12.0, 18.0, 10.0, 13.0, 23.0, 19.0, 19.0, 30.0, 35.0, 23.0, 30.0, 29.0, 35.0, 38.0, 36.0, 30.0, 44.0, 29.0, 34.0, 39.0, 29.0, 33.0, 39.0, 39.0, 36.0, 31.0, 24.0, 32.0, 16.0, 22.0, 21.0, 16.0, 16.0, 15.0, 7.0, 8.0, 9.0, 2.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-1.7792351245880127, -1.7280083894729614, -1.6767816543579102, -1.6255549192428589, -1.5743281841278076, -1.5231014490127563, -1.471874713897705, -1.4206479787826538, -1.3694212436676025, -1.3181945085525513, -1.2669677734375, -1.2157410383224487, -1.1645143032073975, -1.1132875680923462, -1.062060832977295, -1.0108340978622437, -0.9596073627471924, -0.9083806276321411, -0.8571538925170898, -0.8059271574020386, -0.7547004222869873, -0.703473687171936, -0.6522469520568848, -0.6010202169418335, -0.5497934818267822, -0.49856674671173096, -0.4473400115966797, -0.3961132764816284, -0.34488654136657715, -0.2936598062515259, -0.2424330711364746, -0.19120633602142334, -0.13997960090637207, -0.0887528657913208, -0.03752613067626953, 0.013700604438781738, 0.06492733955383301, 0.11615407466888428, 0.16738080978393555, 0.21860754489898682, 0.2698342800140381, 0.32106101512908936, 0.3722877502441406, 0.4235144853591919, 0.47474122047424316, 0.5259679555892944, 0.5771946907043457, 0.628421425819397, 0.6796481609344482, 0.7308748960494995, 0.7821016311645508, 0.833328366279602, 0.8845551013946533, 0.9357818365097046, 0.9870085716247559, 1.0382353067398071, 1.0894620418548584, 1.1406887769699097, 1.191915512084961, 1.2431422472000122, 1.2943689823150635, 1.3455957174301147, 1.396822452545166, 1.4480491876602173, 1.4992759227752686]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 4.0, 4.0, 7.0, 17.0, 20.0, 24.0, 48.0, 77.0, 134.0, 190.0, 370.0, 536.0, 967.0, 2094.0, 4789.0, 15177.0, 85712.0, 2731668.0, 1278766.0, 55148.0, 10925.0, 3875.0, 1685.0, 908.0, 447.0, 272.0, 149.0, 97.0, 39.0, 40.0, 26.0, 17.0, 9.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.126953125, -1.085052490234375, -1.04315185546875, -1.001251220703125, -0.9593505859375, -0.917449951171875, -0.87554931640625, -0.833648681640625, -0.791748046875, -0.749847412109375, -0.70794677734375, -0.666046142578125, -0.6241455078125, -0.582244873046875, -0.54034423828125, -0.498443603515625, -0.45654296875, -0.414642333984375, -0.37274169921875, -0.330841064453125, -0.2889404296875, -0.247039794921875, -0.20513916015625, -0.163238525390625, -0.121337890625, -0.079437255859375, -0.03753662109375, 0.004364013671875, 0.0462646484375, 0.088165283203125, 0.13006591796875, 0.171966552734375, 0.2138671875, 0.255767822265625, 0.29766845703125, 0.339569091796875, 0.3814697265625, 0.423370361328125, 0.46527099609375, 0.507171630859375, 0.549072265625, 0.590972900390625, 0.63287353515625, 0.674774169921875, 0.7166748046875, 0.758575439453125, 0.80047607421875, 0.842376708984375, 0.88427734375, 0.926177978515625, 0.96807861328125, 1.009979248046875, 1.0518798828125, 1.093780517578125, 1.13568115234375, 1.177581787109375, 1.219482421875, 1.261383056640625, 1.30328369140625, 1.345184326171875, 1.3870849609375, 1.428985595703125, 1.47088623046875, 1.512786865234375, 1.5546875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 14.0, 17.0, 22.0, 18.0, 36.0, 34.0, 50.0, 47.0, 69.0, 65.0, 77.0, 66.0, 71.0, 75.0, 62.0, 47.0, 37.0, 43.0, 31.0, 27.0, 15.0, 15.0, 18.0, 8.0, 9.0, 1.0, 5.0, 1.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52099609375, -0.49895477294921875, -0.4769134521484375, -0.45487213134765625, -0.432830810546875, -0.41078948974609375, -0.3887481689453125, -0.36670684814453125, -0.34466552734375, -0.32262420654296875, -0.3005828857421875, -0.27854156494140625, -0.256500244140625, -0.23445892333984375, -0.2124176025390625, -0.19037628173828125, -0.1683349609375, -0.14629364013671875, -0.1242523193359375, -0.10221099853515625, -0.080169677734375, -0.05812835693359375, -0.0360870361328125, -0.01404571533203125, 0.00799560546875, 0.03003692626953125, 0.0520782470703125, 0.07411956787109375, 0.096160888671875, 0.11820220947265625, 0.1402435302734375, 0.16228485107421875, 0.184326171875, 0.20636749267578125, 0.2284088134765625, 0.25045013427734375, 0.272491455078125, 0.29453277587890625, 0.3165740966796875, 0.33861541748046875, 0.36065673828125, 0.38269805908203125, 0.4047393798828125, 0.42678070068359375, 0.448822021484375, 0.47086334228515625, 0.4929046630859375, 0.5149459838867188, 0.5369873046875, 0.5590286254882812, 0.5810699462890625, 0.6031112670898438, 0.625152587890625, 0.6471939086914062, 0.6692352294921875, 0.6912765502929688, 0.71331787109375, 0.7353591918945312, 0.7574005126953125, 0.7794418334960938, 0.801483154296875, 0.8235244750976562, 0.8455657958984375, 0.8676071166992188, 0.8896484375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 5.0, 4.0, 10.0, 9.0, 10.0, 12.0, 17.0, 17.0, 33.0, 46.0, 80.0, 133.0, 308.0, 725.0, 1785.0, 6521.0, 45448.0, 2967772.0, 1133904.0, 29938.0, 4943.0, 1463.0, 524.0, 226.0, 110.0, 88.0, 42.0, 29.0, 21.0, 17.0, 9.0, 4.0, 6.0, 6.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0], "bins": [-2.423828125, -2.361541748046875, -2.29925537109375, -2.236968994140625, -2.1746826171875, -2.112396240234375, -2.05010986328125, -1.987823486328125, -1.925537109375, -1.863250732421875, -1.80096435546875, -1.738677978515625, -1.6763916015625, -1.614105224609375, -1.55181884765625, -1.489532470703125, -1.42724609375, -1.364959716796875, -1.30267333984375, -1.240386962890625, -1.1781005859375, -1.115814208984375, -1.05352783203125, -0.991241455078125, -0.928955078125, -0.866668701171875, -0.80438232421875, -0.742095947265625, -0.6798095703125, -0.617523193359375, -0.55523681640625, -0.492950439453125, -0.4306640625, -0.368377685546875, -0.30609130859375, -0.243804931640625, -0.1815185546875, -0.119232177734375, -0.05694580078125, 0.005340576171875, 0.067626953125, 0.129913330078125, 0.19219970703125, 0.254486083984375, 0.3167724609375, 0.379058837890625, 0.44134521484375, 0.503631591796875, 0.56591796875, 0.628204345703125, 0.69049072265625, 0.752777099609375, 0.8150634765625, 0.877349853515625, 0.93963623046875, 1.001922607421875, 1.064208984375, 1.126495361328125, 1.18878173828125, 1.251068115234375, 1.3133544921875, 1.375640869140625, 1.43792724609375, 1.500213623046875, 1.5625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 8.0, 8.0, 14.0, 11.0, 19.0, 28.0, 51.0, 64.0, 79.0, 154.0, 245.0, 406.0, 587.0, 795.0, 562.0, 366.0, 238.0, 137.0, 88.0, 56.0, 30.0, 28.0, 14.0, 11.0, 16.0, 9.0, 5.0, 5.0, 5.0, 6.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.241455078125, -0.23113250732421875, -0.2208099365234375, -0.21048736572265625, -0.200164794921875, -0.18984222412109375, -0.1795196533203125, -0.16919708251953125, -0.15887451171875, -0.14855194091796875, -0.1382293701171875, -0.12790679931640625, -0.117584228515625, -0.10726165771484375, -0.0969390869140625, -0.08661651611328125, -0.0762939453125, -0.06597137451171875, -0.0556488037109375, -0.04532623291015625, -0.035003662109375, -0.02468109130859375, -0.0143585205078125, -0.00403594970703125, 0.00628662109375, 0.01660919189453125, 0.0269317626953125, 0.03725433349609375, 0.047576904296875, 0.05789947509765625, 0.0682220458984375, 0.07854461669921875, 0.0888671875, 0.09918975830078125, 0.1095123291015625, 0.11983489990234375, 0.130157470703125, 0.14048004150390625, 0.1508026123046875, 0.16112518310546875, 0.17144775390625, 0.18177032470703125, 0.1920928955078125, 0.20241546630859375, 0.212738037109375, 0.22306060791015625, 0.2333831787109375, 0.24370574951171875, 0.2540283203125, 0.26435089111328125, 0.2746734619140625, 0.28499603271484375, 0.295318603515625, 0.30564117431640625, 0.3159637451171875, 0.32628631591796875, 0.33660888671875, 0.34693145751953125, 0.3572540283203125, 0.36757659912109375, 0.377899169921875, 0.38822174072265625, 0.3985443115234375, 0.40886688232421875, 0.419189453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 5.0, 10.0, 18.0, 19.0, 27.0, 44.0, 69.0, 76.0, 98.0, 129.0, 108.0, 100.0, 70.0, 66.0, 45.0, 34.0, 20.0, 22.0, 14.0, 13.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1530554294586182, -1.109147071838379, -1.06523859500885, -1.0213302373886108, -0.9774218201637268, -0.9335134029388428, -0.8896050453186035, -0.8456966280937195, -0.8017882108688354, -0.7578797936439514, -0.7139714360237122, -0.6700630187988281, -0.6261546015739441, -0.5822461843490601, -0.5383378267288208, -0.49442940950393677, -0.4505210518836975, -0.40661266446113586, -0.36270424723625183, -0.3187958598136902, -0.27488744258880615, -0.2309790551662445, -0.18707066774368286, -0.14316225051879883, -0.09925386309623718, -0.05534546449780464, -0.0114370658993721, 0.03247132897377014, 0.07637973129749298, 0.12028813362121582, 0.16419652104377747, 0.2081049382686615, 0.25201332569122314, 0.2959217131137848, 0.3398301303386688, 0.38373851776123047, 0.4276469349861145, 0.47155532240867615, 0.5154637098312378, 0.5593721270561218, 0.6032805442810059, 0.6471889615058899, 0.6910973191261292, 0.7350057363510132, 0.7789141535758972, 0.8228225708007812, 0.8667309284210205, 0.9106393456459045, 0.9545477032661438, 0.9984561204910278, 1.042364478111267, 1.086272954940796, 1.1301813125610352, 1.1740896701812744, 1.2179980278015137, 1.2619065046310425, 1.3058148622512817, 1.349723219871521, 1.3936316967010498, 1.437540054321289, 1.4814484119415283, 1.5253568887710571, 1.5692652463912964, 1.6131737232208252, 1.6570820808410645]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 9.0, 4.0, 7.0, 5.0, 8.0, 7.0, 8.0, 19.0, 15.0, 15.0, 14.0, 14.0, 21.0, 34.0, 23.0, 31.0, 38.0, 47.0, 29.0, 35.0, 32.0, 42.0, 46.0, 34.0, 33.0, 32.0, 40.0, 50.0, 25.0, 35.0, 26.0, 27.0, 34.0, 21.0, 19.0, 20.0, 23.0, 16.0, 15.0, 16.0, 7.0, 9.0, 3.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6384267210960388, -0.6194890737533569, -0.600551426410675, -0.5816137790679932, -0.5626761317253113, -0.5437384843826294, -0.5248008370399475, -0.5058631896972656, -0.48692551255226135, -0.46798786520957947, -0.4490502178668976, -0.4301125705242157, -0.4111748933792114, -0.39223724603652954, -0.37329959869384766, -0.35436195135116577, -0.3354243040084839, -0.316486656665802, -0.2975490093231201, -0.27861136198043823, -0.25967371463775635, -0.24073605239391327, -0.2217983901500702, -0.2028607428073883, -0.18392309546470642, -0.16498544812202454, -0.14604780077934265, -0.12711013853549957, -0.10817249119281769, -0.0892348438501358, -0.07029718905687332, -0.05135953426361084, -0.03242182731628418, -0.013484176248311996, 0.005453474819660187, 0.02439112588763237, 0.04332877695560455, 0.06226642429828644, 0.08120407909154892, 0.1001417338848114, 0.11907938122749329, 0.13801702857017517, 0.15695467591285706, 0.17589233815670013, 0.19482998549938202, 0.2137676328420639, 0.23270529508590698, 0.25164294242858887, 0.27058058977127075, 0.28951823711395264, 0.3084558844566345, 0.3273935317993164, 0.3463311791419983, 0.3652688264846802, 0.38420650362968445, 0.40314415097236633, 0.4220817983150482, 0.4410194456577301, 0.459957093000412, 0.47889474034309387, 0.49783241748809814, 0.51677006483078, 0.5357077121734619, 0.5546453595161438, 0.5735830068588257]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 9.0, 11.0, 19.0, 22.0, 29.0, 46.0, 75.0, 80.0, 167.0, 241.0, 357.0, 640.0, 1005.0, 1898.0, 3579.0, 7053.0, 14714.0, 33823.0, 95494.0, 339753.0, 373987.0, 106676.0, 36865.0, 15827.0, 7513.0, 3747.0, 1998.0, 1163.0, 669.0, 367.0, 246.0, 165.0, 81.0, 68.0, 56.0, 40.0, 19.0, 22.0, 12.0, 6.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1688232421875, -0.16355514526367188, -0.15828704833984375, -0.15301895141601562, -0.1477508544921875, -0.14248275756835938, -0.13721466064453125, -0.13194656372070312, -0.126678466796875, -0.12141036987304688, -0.11614227294921875, -0.11087417602539062, -0.1056060791015625, -0.10033798217773438, -0.09506988525390625, -0.08980178833007812, -0.08453369140625, -0.07926559448242188, -0.07399749755859375, -0.06872940063476562, -0.0634613037109375, -0.058193206787109375, -0.05292510986328125, -0.047657012939453125, -0.042388916015625, -0.037120819091796875, -0.03185272216796875, -0.026584625244140625, -0.0213165283203125, -0.016048431396484375, -0.01078033447265625, -0.005512237548828125, -0.000244140625, 0.005023956298828125, 0.01029205322265625, 0.015560150146484375, 0.0208282470703125, 0.026096343994140625, 0.03136444091796875, 0.036632537841796875, 0.041900634765625, 0.047168731689453125, 0.05243682861328125, 0.057704925537109375, 0.0629730224609375, 0.06824111938476562, 0.07350921630859375, 0.07877731323242188, 0.08404541015625, 0.08931350708007812, 0.09458160400390625, 0.09984970092773438, 0.1051177978515625, 0.11038589477539062, 0.11565399169921875, 0.12092208862304688, 0.126190185546875, 0.13145828247070312, 0.13672637939453125, 0.14199447631835938, 0.1472625732421875, 0.15253067016601562, 0.15779876708984375, 0.16306686401367188, 0.1683349609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 8.0, 3.0, 6.0, 19.0, 8.0, 9.0, 19.0, 23.0, 23.0, 34.0, 38.0, 51.0, 46.0, 55.0, 55.0, 65.0, 39.0, 62.0, 58.0, 54.0, 47.0, 52.0, 48.0, 36.0, 29.0, 23.0, 20.0, 23.0, 15.0, 8.0, 9.0, 4.0, 4.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53271484375, -0.5159072875976562, -0.4990997314453125, -0.48229217529296875, -0.465484619140625, -0.44867706298828125, -0.4318695068359375, -0.41506195068359375, -0.39825439453125, -0.38144683837890625, -0.3646392822265625, -0.34783172607421875, -0.331024169921875, -0.31421661376953125, -0.2974090576171875, -0.28060150146484375, -0.2637939453125, -0.24698638916015625, -0.2301788330078125, -0.21337127685546875, -0.196563720703125, -0.17975616455078125, -0.1629486083984375, -0.14614105224609375, -0.12933349609375, -0.11252593994140625, -0.0957183837890625, -0.07891082763671875, -0.062103271484375, -0.04529571533203125, -0.0284881591796875, -0.01168060302734375, 0.005126953125, 0.02193450927734375, 0.0387420654296875, 0.05554962158203125, 0.072357177734375, 0.08916473388671875, 0.1059722900390625, 0.12277984619140625, 0.13958740234375, 0.15639495849609375, 0.1732025146484375, 0.19001007080078125, 0.206817626953125, 0.22362518310546875, 0.2404327392578125, 0.25724029541015625, 0.2740478515625, 0.29085540771484375, 0.3076629638671875, 0.32447052001953125, 0.341278076171875, 0.35808563232421875, 0.3748931884765625, 0.39170074462890625, 0.40850830078125, 0.42531585693359375, 0.4421234130859375, 0.45893096923828125, 0.475738525390625, 0.49254608154296875, 0.5093536376953125, 0.5261611938476562, 0.54296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 2.0, 8.0, 12.0, 6.0, 19.0, 18.0, 18.0, 24.0, 34.0, 44.0, 69.0, 95.0, 132.0, 188.0, 283.0, 530.0, 948.0, 1865.0, 4200.0, 11297.0, 39922.0, 183186.0, 550352.0, 193491.0, 41637.0, 11638.0, 4280.0, 1862.0, 931.0, 503.0, 277.0, 170.0, 138.0, 97.0, 65.0, 57.0, 39.0, 21.0, 24.0, 16.0, 16.0, 7.0, 11.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1505126953125, -0.14558029174804688, -0.14064788818359375, -0.13571548461914062, -0.1307830810546875, -0.12585067749023438, -0.12091827392578125, -0.11598587036132812, -0.111053466796875, -0.10612106323242188, -0.10118865966796875, -0.09625625610351562, -0.0913238525390625, -0.08639144897460938, -0.08145904541015625, -0.07652664184570312, -0.07159423828125, -0.06666183471679688, -0.06172943115234375, -0.056797027587890625, -0.0518646240234375, -0.046932220458984375, -0.04199981689453125, -0.037067413330078125, -0.032135009765625, -0.027202606201171875, -0.02227020263671875, -0.017337799072265625, -0.0124053955078125, -0.007472991943359375, -0.00254058837890625, 0.002391815185546875, 0.00732421875, 0.012256622314453125, 0.01718902587890625, 0.022121429443359375, 0.0270538330078125, 0.031986236572265625, 0.03691864013671875, 0.041851043701171875, 0.046783447265625, 0.051715850830078125, 0.05664825439453125, 0.061580657958984375, 0.0665130615234375, 0.07144546508789062, 0.07637786865234375, 0.08131027221679688, 0.08624267578125, 0.09117507934570312, 0.09610748291015625, 0.10103988647460938, 0.1059722900390625, 0.11090469360351562, 0.11583709716796875, 0.12076950073242188, 0.125701904296875, 0.13063430786132812, 0.13556671142578125, 0.14049911499023438, 0.1454315185546875, 0.15036392211914062, 0.15529632568359375, 0.16022872924804688, 0.1651611328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 16.0, 6.0, 9.0, 18.0, 13.0, 10.0, 28.0, 27.0, 29.0, 36.0, 36.0, 34.0, 39.0, 37.0, 50.0, 63.0, 39.0, 51.0, 36.0, 34.0, 39.0, 37.0, 34.0, 36.0, 42.0, 32.0, 29.0, 21.0, 17.0, 20.0, 13.0, 9.0, 4.0, 4.0, 8.0, 9.0, 7.0, 4.0, 4.0, 9.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.84619140625, -0.8204803466796875, -0.794769287109375, -0.7690582275390625, -0.74334716796875, -0.7176361083984375, -0.691925048828125, -0.6662139892578125, -0.6405029296875, -0.6147918701171875, -0.589080810546875, -0.5633697509765625, -0.53765869140625, -0.5119476318359375, -0.486236572265625, -0.4605255126953125, -0.434814453125, -0.4091033935546875, -0.383392333984375, -0.3576812744140625, -0.33197021484375, -0.3062591552734375, -0.280548095703125, -0.2548370361328125, -0.2291259765625, -0.2034149169921875, -0.177703857421875, -0.1519927978515625, -0.12628173828125, -0.1005706787109375, -0.074859619140625, -0.0491485595703125, -0.0234375, 0.0022735595703125, 0.027984619140625, 0.0536956787109375, 0.07940673828125, 0.1051177978515625, 0.130828857421875, 0.1565399169921875, 0.1822509765625, 0.2079620361328125, 0.233673095703125, 0.2593841552734375, 0.28509521484375, 0.3108062744140625, 0.336517333984375, 0.3622283935546875, 0.387939453125, 0.4136505126953125, 0.439361572265625, 0.4650726318359375, 0.49078369140625, 0.5164947509765625, 0.542205810546875, 0.5679168701171875, 0.5936279296875, 0.6193389892578125, 0.645050048828125, 0.6707611083984375, 0.69647216796875, 0.7221832275390625, 0.747894287109375, 0.7736053466796875, 0.79931640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 8.0, 12.0, 17.0, 24.0, 29.0, 49.0, 92.0, 185.0, 355.0, 667.0, 1733.0, 4756.0, 19234.0, 170929.0, 751612.0, 80503.0, 12198.0, 3515.0, 1314.0, 602.0, 289.0, 175.0, 93.0, 65.0, 31.0, 20.0, 12.0, 8.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1158447265625, -0.11189842224121094, -0.10795211791992188, -0.10400581359863281, -0.10005950927734375, -0.09611320495605469, -0.09216690063476562, -0.08822059631347656, -0.0842742919921875, -0.08032798767089844, -0.07638168334960938, -0.07243537902832031, -0.06848907470703125, -0.06454277038574219, -0.060596466064453125, -0.05665016174316406, -0.052703857421875, -0.04875755310058594, -0.044811248779296875, -0.04086494445800781, -0.03691864013671875, -0.03297233581542969, -0.029026031494140625, -0.025079727172851562, -0.0211334228515625, -0.017187118530273438, -0.013240814208984375, -0.009294509887695312, -0.00534820556640625, -0.0014019012451171875, 0.002544403076171875, 0.0064907073974609375, 0.01043701171875, 0.014383316040039062, 0.018329620361328125, 0.022275924682617188, 0.02622222900390625, 0.030168533325195312, 0.034114837646484375, 0.03806114196777344, 0.0420074462890625, 0.04595375061035156, 0.049900054931640625, 0.05384635925292969, 0.05779266357421875, 0.06173896789550781, 0.06568527221679688, 0.06963157653808594, 0.073577880859375, 0.07752418518066406, 0.08147048950195312, 0.08541679382324219, 0.08936309814453125, 0.09330940246582031, 0.09725570678710938, 0.10120201110839844, 0.1051483154296875, 0.10909461975097656, 0.11304092407226562, 0.11698722839355469, 0.12093353271484375, 0.12487983703613281, 0.12882614135742188, 0.13277244567871094, 0.13671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 9.0, 11.0, 15.0, 21.0, 26.0, 21.0, 34.0, 51.0, 59.0, 65.0, 104.0, 107.0, 127.0, 82.0, 67.0, 47.0, 40.0, 30.0, 16.0, 15.0, 9.0, 17.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.427267074584961e-05, -3.288406878709793e-05, -3.149546682834625e-05, -3.0106864869594574e-05, -2.8718262910842896e-05, -2.7329660952091217e-05, -2.594105899333954e-05, -2.455245703458786e-05, -2.316385507583618e-05, -2.1775253117084503e-05, -2.0386651158332825e-05, -1.8998049199581146e-05, -1.7609447240829468e-05, -1.622084528207779e-05, -1.483224332332611e-05, -1.3443641364574432e-05, -1.2055039405822754e-05, -1.0666437447071075e-05, -9.277835488319397e-06, -7.889233529567719e-06, -6.50063157081604e-06, -5.1120296120643616e-06, -3.723427653312683e-06, -2.3348256945610046e-06, -9.462237358093262e-07, 4.423782229423523e-07, 1.8309801816940308e-06, 3.2195821404457092e-06, 4.608184099197388e-06, 5.996786057949066e-06, 7.385388016700745e-06, 8.773989975452423e-06, 1.0162591934204102e-05, 1.155119389295578e-05, 1.2939795851707458e-05, 1.4328397810459137e-05, 1.5716999769210815e-05, 1.7105601727962494e-05, 1.8494203686714172e-05, 1.988280564546585e-05, 2.127140760421753e-05, 2.2660009562969208e-05, 2.4048611521720886e-05, 2.5437213480472565e-05, 2.6825815439224243e-05, 2.821441739797592e-05, 2.96030193567276e-05, 3.099162131547928e-05, 3.238022327423096e-05, 3.3768825232982635e-05, 3.5157427191734314e-05, 3.654602915048599e-05, 3.793463110923767e-05, 3.932323306798935e-05, 4.071183502674103e-05, 4.2100436985492706e-05, 4.3489038944244385e-05, 4.487764090299606e-05, 4.626624286174774e-05, 4.765484482049942e-05, 4.90434467792511e-05, 5.043204873800278e-05, 5.1820650696754456e-05, 5.3209252655506134e-05, 5.459785461425781e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 17.0, 19.0, 24.0, 20.0, 55.0, 77.0, 109.0, 163.0, 278.0, 457.0, 719.0, 1284.0, 2438.0, 4829.0, 11388.0, 30889.0, 105186.0, 401146.0, 348920.0, 92291.0, 27955.0, 10375.0, 4570.0, 2225.0, 1269.0, 648.0, 413.0, 255.0, 173.0, 125.0, 74.0, 53.0, 35.0, 20.0, 16.0, 8.0, 9.0, 7.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0780029296875, -0.07539844512939453, -0.07279396057128906, -0.0701894760131836, -0.06758499145507812, -0.06498050689697266, -0.06237602233886719, -0.05977153778076172, -0.05716705322265625, -0.05456256866455078, -0.05195808410644531, -0.049353599548339844, -0.046749114990234375, -0.044144630432128906, -0.04154014587402344, -0.03893566131591797, -0.0363311767578125, -0.03372669219970703, -0.031122207641601562, -0.028517723083496094, -0.025913238525390625, -0.023308753967285156, -0.020704269409179688, -0.01809978485107422, -0.01549530029296875, -0.012890815734863281, -0.010286331176757812, -0.007681846618652344, -0.005077362060546875, -0.0024728775024414062, 0.0001316070556640625, 0.0027360916137695312, 0.005340576171875, 0.007945060729980469, 0.010549545288085938, 0.013154029846191406, 0.015758514404296875, 0.018362998962402344, 0.020967483520507812, 0.02357196807861328, 0.02617645263671875, 0.02878093719482422, 0.03138542175292969, 0.033989906311035156, 0.036594390869140625, 0.039198875427246094, 0.04180335998535156, 0.04440784454345703, 0.0470123291015625, 0.04961681365966797, 0.05222129821777344, 0.054825782775878906, 0.057430267333984375, 0.060034751892089844, 0.06263923645019531, 0.06524372100830078, 0.06784820556640625, 0.07045269012451172, 0.07305717468261719, 0.07566165924072266, 0.07826614379882812, 0.0808706283569336, 0.08347511291503906, 0.08607959747314453, 0.08868408203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 11.0, 15.0, 27.0, 23.0, 42.0, 52.0, 74.0, 87.0, 120.0, 148.0, 91.0, 79.0, 58.0, 54.0, 26.0, 28.0, 12.0, 14.0, 7.0, 4.0, 3.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0279541015625, -0.027162551879882812, -0.026371002197265625, -0.025579452514648438, -0.02478790283203125, -0.023996353149414062, -0.023204803466796875, -0.022413253784179688, -0.0216217041015625, -0.020830154418945312, -0.020038604736328125, -0.019247055053710938, -0.01845550537109375, -0.017663955688476562, -0.016872406005859375, -0.016080856323242188, -0.015289306640625, -0.014497756958007812, -0.013706207275390625, -0.012914657592773438, -0.01212310791015625, -0.011331558227539062, -0.010540008544921875, -0.009748458862304688, -0.0089569091796875, -0.008165359497070312, -0.007373809814453125, -0.0065822601318359375, -0.00579071044921875, -0.0049991607666015625, -0.004207611083984375, -0.0034160614013671875, -0.00262451171875, -0.0018329620361328125, -0.001041412353515625, -0.0002498626708984375, 0.00054168701171875, 0.0013332366943359375, 0.002124786376953125, 0.0029163360595703125, 0.0037078857421875, 0.0044994354248046875, 0.005290985107421875, 0.0060825347900390625, 0.00687408447265625, 0.0076656341552734375, 0.008457183837890625, 0.009248733520507812, 0.010040283203125, 0.010831832885742188, 0.011623382568359375, 0.012414932250976562, 0.01320648193359375, 0.013998031616210938, 0.014789581298828125, 0.015581130981445312, 0.0163726806640625, 0.017164230346679688, 0.017955780029296875, 0.018747329711914062, 0.01953887939453125, 0.020330429077148438, 0.021121978759765625, 0.021913528442382812, 0.022705078125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 10.0, 8.0, 10.0, 14.0, 23.0, 46.0, 45.0, 79.0, 107.0, 138.0, 118.0, 100.0, 82.0, 72.0, 49.0, 24.0, 25.0, 17.0, 13.0, 11.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9324737191200256, -0.9044672250747681, -0.8764607310295105, -0.8484541773796082, -0.8204476833343506, -0.792441189289093, -0.7644346952438354, -0.7364281415939331, -0.7084216475486755, -0.680415153503418, -0.6524086594581604, -0.6244021058082581, -0.5963956117630005, -0.5683891177177429, -0.5403826236724854, -0.512376070022583, -0.4843696057796478, -0.45636311173439026, -0.4283565878868103, -0.40035009384155273, -0.3723435699939728, -0.3443370759487152, -0.31633055210113525, -0.2883240580558777, -0.2603175640106201, -0.23231105506420135, -0.2043045461177826, -0.17629805207252502, -0.14829152822494507, -0.1202850341796875, -0.09227852523326874, -0.06427201628684998, -0.03626549243927002, -0.008258985355496407, 0.019747521728277206, 0.04775402694940567, 0.07576053589582443, 0.1037670373916626, 0.13177354633808136, 0.15978005528450012, 0.18778656423091888, 0.21579307317733765, 0.2437995821237564, 0.27180609107017517, 0.29981258511543274, 0.3278191089630127, 0.35582560300827026, 0.38383209705352783, 0.4118386209011078, 0.43984511494636536, 0.4678516387939453, 0.4958581328392029, 0.5238646268844604, 0.5518711805343628, 0.5798776745796204, 0.6078841686248779, 0.6358906626701355, 0.6638971567153931, 0.6919036507606506, 0.719910204410553, 0.7479166984558105, 0.7759231925010681, 0.8039296865463257, 0.831936240196228, 0.8599427342414856]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 4.0, 10.0, 7.0, 9.0, 15.0, 19.0, 18.0, 20.0, 18.0, 30.0, 25.0, 48.0, 43.0, 48.0, 44.0, 42.0, 49.0, 53.0, 51.0, 54.0, 47.0, 44.0, 38.0, 37.0, 25.0, 34.0, 30.0, 27.0, 22.0, 13.0, 21.0, 11.0, 13.0, 8.0, 5.0, 6.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4269494414329529, -0.41293370723724365, -0.3989179730415344, -0.3849022388458252, -0.3708864748477936, -0.35687074065208435, -0.3428550064563751, -0.3288392722606659, -0.3148235082626343, -0.30080777406692505, -0.2867920398712158, -0.2727763056755066, -0.258760541677475, -0.24474480748176575, -0.23072907328605652, -0.2167133390903473, -0.20269760489463806, -0.18868187069892883, -0.1746661216020584, -0.16065038740634918, -0.14663463830947876, -0.13261890411376953, -0.1186031699180603, -0.10458742827177048, -0.09057168662548065, -0.07655594497919083, -0.062540203332901, -0.04852446913719177, -0.03450872749090195, -0.02049298584461212, -0.006477251648902893, 0.007538489997386932, 0.021554231643676758, 0.03556997328996658, 0.04958571121096611, 0.06360144913196564, 0.07761719077825546, 0.09163293242454529, 0.10564866662025452, 0.11966440826654434, 0.13368014991283417, 0.1476958841085434, 0.16171163320541382, 0.17572736740112305, 0.18974310159683228, 0.2037588506937027, 0.21777458488941193, 0.23179033398628235, 0.24580606818199158, 0.2598218023777008, 0.27383753657341003, 0.28785330057144165, 0.3018690347671509, 0.3158847689628601, 0.32990050315856934, 0.34391623735427856, 0.3579319715499878, 0.371947705745697, 0.38596343994140625, 0.3999791741371155, 0.4139949381351471, 0.4280106723308563, 0.44202640652656555, 0.4560421407222748, 0.4700579047203064]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 11.0, 6.0, 7.0, 13.0, 21.0, 25.0, 24.0, 51.0, 63.0, 100.0, 141.0, 249.0, 406.0, 792.0, 1597.0, 3474.0, 9325.0, 28013.0, 111424.0, 589379.0, 233502.0, 46305.0, 14128.0, 4951.0, 2093.0, 1058.0, 515.0, 284.0, 197.0, 123.0, 68.0, 50.0, 37.0, 38.0, 27.0, 14.0, 10.0, 4.0, 9.0, 6.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.80419921875, -0.7771224975585938, -0.7500457763671875, -0.7229690551757812, -0.695892333984375, -0.6688156127929688, -0.6417388916015625, -0.6146621704101562, -0.58758544921875, -0.5605087280273438, -0.5334320068359375, -0.5063552856445312, -0.479278564453125, -0.45220184326171875, -0.4251251220703125, -0.39804840087890625, -0.3709716796875, -0.34389495849609375, -0.3168182373046875, -0.28974151611328125, -0.262664794921875, -0.23558807373046875, -0.2085113525390625, -0.18143463134765625, -0.15435791015625, -0.12728118896484375, -0.1002044677734375, -0.07312774658203125, -0.046051025390625, -0.01897430419921875, 0.0081024169921875, 0.03517913818359375, 0.062255859375, 0.08933258056640625, 0.1164093017578125, 0.14348602294921875, 0.170562744140625, 0.19763946533203125, 0.2247161865234375, 0.25179290771484375, 0.27886962890625, 0.30594635009765625, 0.3330230712890625, 0.36009979248046875, 0.387176513671875, 0.41425323486328125, 0.4413299560546875, 0.46840667724609375, 0.4954833984375, 0.5225601196289062, 0.5496368408203125, 0.5767135620117188, 0.603790283203125, 0.6308670043945312, 0.6579437255859375, 0.6850204467773438, 0.71209716796875, 0.7391738891601562, 0.7662506103515625, 0.7933273315429688, 0.820404052734375, 0.8474807739257812, 0.8745574951171875, 0.9016342163085938, 0.9287109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 8.0, 12.0, 14.0, 15.0, 13.0, 17.0, 22.0, 32.0, 33.0, 39.0, 49.0, 41.0, 46.0, 48.0, 44.0, 52.0, 63.0, 50.0, 60.0, 54.0, 47.0, 29.0, 21.0, 33.0, 26.0, 33.0, 25.0, 14.0, 13.0, 11.0, 6.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.076171875, -1.0451507568359375, -1.014129638671875, -0.9831085205078125, -0.95208740234375, -0.9210662841796875, -0.890045166015625, -0.8590240478515625, -0.8280029296875, -0.7969818115234375, -0.765960693359375, -0.7349395751953125, -0.70391845703125, -0.6728973388671875, -0.641876220703125, -0.6108551025390625, -0.579833984375, -0.5488128662109375, -0.517791748046875, -0.4867706298828125, -0.45574951171875, -0.4247283935546875, -0.393707275390625, -0.3626861572265625, -0.3316650390625, -0.3006439208984375, -0.269622802734375, -0.2386016845703125, -0.20758056640625, -0.1765594482421875, -0.145538330078125, -0.1145172119140625, -0.08349609375, -0.0524749755859375, -0.021453857421875, 0.0095672607421875, 0.04058837890625, 0.0716094970703125, 0.102630615234375, 0.1336517333984375, 0.1646728515625, 0.1956939697265625, 0.226715087890625, 0.2577362060546875, 0.28875732421875, 0.3197784423828125, 0.350799560546875, 0.3818206787109375, 0.412841796875, 0.4438629150390625, 0.474884033203125, 0.5059051513671875, 0.53692626953125, 0.5679473876953125, 0.598968505859375, 0.6299896240234375, 0.6610107421875, 0.6920318603515625, 0.723052978515625, 0.7540740966796875, 0.78509521484375, 0.8161163330078125, 0.847137451171875, 0.8781585693359375, 0.9091796875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 9.0, 9.0, 8.0, 12.0, 16.0, 28.0, 49.0, 97.0, 225.0, 666.0, 2245.0, 11402.0, 124511.0, 840522.0, 58967.0, 7222.0, 1652.0, 489.0, 207.0, 96.0, 40.0, 17.0, 26.0, 14.0, 7.0, 7.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3154296875, -1.2655487060546875, -1.215667724609375, -1.1657867431640625, -1.11590576171875, -1.0660247802734375, -1.016143798828125, -0.9662628173828125, -0.9163818359375, -0.8665008544921875, -0.816619873046875, -0.7667388916015625, -0.71685791015625, -0.6669769287109375, -0.617095947265625, -0.5672149658203125, -0.517333984375, -0.4674530029296875, -0.417572021484375, -0.3676910400390625, -0.31781005859375, -0.2679290771484375, -0.218048095703125, -0.1681671142578125, -0.1182861328125, -0.0684051513671875, -0.018524169921875, 0.0313568115234375, 0.08123779296875, 0.1311187744140625, 0.180999755859375, 0.2308807373046875, 0.28076171875, 0.3306427001953125, 0.380523681640625, 0.4304046630859375, 0.48028564453125, 0.5301666259765625, 0.580047607421875, 0.6299285888671875, 0.6798095703125, 0.7296905517578125, 0.779571533203125, 0.8294525146484375, 0.87933349609375, 0.9292144775390625, 0.979095458984375, 1.0289764404296875, 1.078857421875, 1.1287384033203125, 1.178619384765625, 1.2285003662109375, 1.27838134765625, 1.3282623291015625, 1.378143310546875, 1.4280242919921875, 1.4779052734375, 1.5277862548828125, 1.577667236328125, 1.6275482177734375, 1.67742919921875, 1.7273101806640625, 1.777191162109375, 1.8270721435546875, 1.876953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 9.0, 5.0, 6.0, 7.0, 8.0, 14.0, 22.0, 9.0, 27.0, 23.0, 37.0, 35.0, 37.0, 36.0, 43.0, 47.0, 63.0, 47.0, 50.0, 56.0, 58.0, 50.0, 39.0, 45.0, 40.0, 29.0, 33.0, 25.0, 27.0, 22.0, 14.0, 8.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.017578125, -0.980560302734375, -0.94354248046875, -0.906524658203125, -0.8695068359375, -0.832489013671875, -0.79547119140625, -0.758453369140625, -0.721435546875, -0.684417724609375, -0.64739990234375, -0.610382080078125, -0.5733642578125, -0.536346435546875, -0.49932861328125, -0.462310791015625, -0.42529296875, -0.388275146484375, -0.35125732421875, -0.314239501953125, -0.2772216796875, -0.240203857421875, -0.20318603515625, -0.166168212890625, -0.129150390625, -0.092132568359375, -0.05511474609375, -0.018096923828125, 0.0189208984375, 0.055938720703125, 0.09295654296875, 0.129974365234375, 0.1669921875, 0.204010009765625, 0.24102783203125, 0.278045654296875, 0.3150634765625, 0.352081298828125, 0.38909912109375, 0.426116943359375, 0.463134765625, 0.500152587890625, 0.53717041015625, 0.574188232421875, 0.6112060546875, 0.648223876953125, 0.68524169921875, 0.722259521484375, 0.75927734375, 0.796295166015625, 0.83331298828125, 0.870330810546875, 0.9073486328125, 0.944366455078125, 0.98138427734375, 1.018402099609375, 1.055419921875, 1.092437744140625, 1.12945556640625, 1.166473388671875, 1.2034912109375, 1.240509033203125, 1.27752685546875, 1.314544677734375, 1.3515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 11.0, 19.0, 20.0, 31.0, 65.0, 124.0, 190.0, 442.0, 1010.0, 2722.0, 9078.0, 47297.0, 372633.0, 533975.0, 63790.0, 11674.0, 3227.0, 1127.0, 498.0, 253.0, 137.0, 75.0, 38.0, 30.0, 14.0, 25.0, 4.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2459716796875, -0.23805809020996094, -0.23014450073242188, -0.2222309112548828, -0.21431732177734375, -0.2064037322998047, -0.19849014282226562, -0.19057655334472656, -0.1826629638671875, -0.17474937438964844, -0.16683578491210938, -0.1589221954345703, -0.15100860595703125, -0.1430950164794922, -0.13518142700195312, -0.12726783752441406, -0.119354248046875, -0.11144065856933594, -0.10352706909179688, -0.09561347961425781, -0.08769989013671875, -0.07978630065917969, -0.07187271118164062, -0.06395912170410156, -0.0560455322265625, -0.04813194274902344, -0.040218353271484375, -0.03230476379394531, -0.02439117431640625, -0.016477584838867188, -0.008563995361328125, -0.0006504058837890625, 0.00726318359375, 0.015176773071289062, 0.023090362548828125, 0.031003952026367188, 0.03891754150390625, 0.04683113098144531, 0.054744720458984375, 0.06265830993652344, 0.0705718994140625, 0.07848548889160156, 0.08639907836914062, 0.09431266784667969, 0.10222625732421875, 0.11013984680175781, 0.11805343627929688, 0.12596702575683594, 0.133880615234375, 0.14179420471191406, 0.14970779418945312, 0.1576213836669922, 0.16553497314453125, 0.1734485626220703, 0.18136215209960938, 0.18927574157714844, 0.1971893310546875, 0.20510292053222656, 0.21301651000976562, 0.2209300994873047, 0.22884368896484375, 0.2367572784423828, 0.24467086791992188, 0.25258445739746094, 0.260498046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 3.0, 9.0, 6.0, 5.0, 11.0, 13.0, 11.0, 25.0, 29.0, 32.0, 52.0, 65.0, 96.0, 134.0, 124.0, 103.0, 84.0, 51.0, 43.0, 21.0, 23.0, 15.0, 16.0, 10.0, 4.0, 4.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.13060188293457e-05, -4.012230783700943e-05, -3.893859684467316e-05, -3.7754885852336884e-05, -3.657117486000061e-05, -3.538746386766434e-05, -3.4203752875328064e-05, -3.302004188299179e-05, -3.183633089065552e-05, -3.0652619898319244e-05, -2.946890890598297e-05, -2.8285197913646698e-05, -2.7101486921310425e-05, -2.591777592897415e-05, -2.473406493663788e-05, -2.3550353944301605e-05, -2.2366642951965332e-05, -2.118293195962906e-05, -1.9999220967292786e-05, -1.8815509974956512e-05, -1.763179898262024e-05, -1.6448087990283966e-05, -1.5264376997947693e-05, -1.408066600561142e-05, -1.2896955013275146e-05, -1.1713244020938873e-05, -1.05295330286026e-05, -9.345822036266327e-06, -8.162111043930054e-06, -6.9784000515937805e-06, -5.794689059257507e-06, -4.610978066921234e-06, -3.427267074584961e-06, -2.2435560822486877e-06, -1.0598450899124146e-06, 1.2386590242385864e-07, 1.3075768947601318e-06, 2.491287887096405e-06, 3.6749988794326782e-06, 4.858709871768951e-06, 6.042420864105225e-06, 7.226131856441498e-06, 8.409842848777771e-06, 9.593553841114044e-06, 1.0777264833450317e-05, 1.196097582578659e-05, 1.3144686818122864e-05, 1.4328397810459137e-05, 1.551210880279541e-05, 1.6695819795131683e-05, 1.7879530787467957e-05, 1.906324177980423e-05, 2.0246952772140503e-05, 2.1430663764476776e-05, 2.261437475681305e-05, 2.3798085749149323e-05, 2.4981796741485596e-05, 2.616550773382187e-05, 2.7349218726158142e-05, 2.8532929718494415e-05, 2.971664071083069e-05, 3.090035170316696e-05, 3.2084062695503235e-05, 3.326777368783951e-05, 3.445148468017578e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 16.0, 11.0, 20.0, 25.0, 37.0, 61.0, 83.0, 157.0, 255.0, 386.0, 719.0, 1224.0, 2327.0, 5333.0, 15315.0, 53077.0, 221713.0, 530529.0, 157543.0, 38997.0, 11707.0, 4355.0, 1990.0, 1044.0, 617.0, 393.0, 212.0, 141.0, 78.0, 57.0, 33.0, 25.0, 21.0, 15.0, 9.0, 7.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1834716796875, -0.17743301391601562, -0.17139434814453125, -0.16535568237304688, -0.1593170166015625, -0.15327835083007812, -0.14723968505859375, -0.14120101928710938, -0.135162353515625, -0.12912368774414062, -0.12308502197265625, -0.11704635620117188, -0.1110076904296875, -0.10496902465820312, -0.09893035888671875, -0.09289169311523438, -0.08685302734375, -0.08081436157226562, -0.07477569580078125, -0.06873703002929688, -0.0626983642578125, -0.056659698486328125, -0.05062103271484375, -0.044582366943359375, -0.038543701171875, -0.032505035400390625, -0.02646636962890625, -0.020427703857421875, -0.0143890380859375, -0.008350372314453125, -0.00231170654296875, 0.003726959228515625, 0.009765625, 0.015804290771484375, 0.02184295654296875, 0.027881622314453125, 0.0339202880859375, 0.039958953857421875, 0.04599761962890625, 0.052036285400390625, 0.058074951171875, 0.06411361694335938, 0.07015228271484375, 0.07619094848632812, 0.0822296142578125, 0.08826828002929688, 0.09430694580078125, 0.10034561157226562, 0.10638427734375, 0.11242294311523438, 0.11846160888671875, 0.12450027465820312, 0.1305389404296875, 0.13657760620117188, 0.14261627197265625, 0.14865493774414062, 0.154693603515625, 0.16073226928710938, 0.16677093505859375, 0.17280960083007812, 0.1788482666015625, 0.18488693237304688, 0.19092559814453125, 0.19696426391601562, 0.2030029296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 6.0, 3.0, 8.0, 8.0, 12.0, 22.0, 18.0, 27.0, 34.0, 27.0, 41.0, 50.0, 70.0, 75.0, 76.0, 65.0, 77.0, 69.0, 54.0, 42.0, 46.0, 26.0, 24.0, 21.0, 13.0, 5.0, 15.0, 14.0, 6.0, 8.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.09027099609375, -0.08777713775634766, -0.08528327941894531, -0.08278942108154297, -0.08029556274414062, -0.07780170440673828, -0.07530784606933594, -0.0728139877319336, -0.07032012939453125, -0.0678262710571289, -0.06533241271972656, -0.06283855438232422, -0.060344696044921875, -0.05785083770751953, -0.05535697937011719, -0.052863121032714844, -0.0503692626953125, -0.047875404357910156, -0.04538154602050781, -0.04288768768310547, -0.040393829345703125, -0.03789997100830078, -0.03540611267089844, -0.032912254333496094, -0.03041839599609375, -0.027924537658691406, -0.025430679321289062, -0.02293682098388672, -0.020442962646484375, -0.01794910430908203, -0.015455245971679688, -0.012961387634277344, -0.010467529296875, -0.007973670959472656, -0.0054798126220703125, -0.0029859542846679688, -0.000492095947265625, 0.0020017623901367188, 0.0044956207275390625, 0.006989479064941406, 0.00948333740234375, 0.011977195739746094, 0.014471054077148438, 0.01696491241455078, 0.019458770751953125, 0.02195262908935547, 0.024446487426757812, 0.026940345764160156, 0.0294342041015625, 0.031928062438964844, 0.03442192077636719, 0.03691577911376953, 0.039409637451171875, 0.04190349578857422, 0.04439735412597656, 0.046891212463378906, 0.04938507080078125, 0.051878929138183594, 0.05437278747558594, 0.05686664581298828, 0.059360504150390625, 0.06185436248779297, 0.06434822082519531, 0.06684207916259766, 0.0693359375]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 13.0, 26.0, 80.0, 174.0, 241.0, 252.0, 125.0, 55.0, 20.0, 14.0, 5.0, 3.0, 1.0, 1.0], "bins": [-7.421146392822266, -7.285796165466309, -7.15044641494751, -7.015096187591553, -6.879746437072754, -6.744396209716797, -6.60904598236084, -6.473696231842041, -6.338346004486084, -6.202995777130127, -6.067646026611328, -5.932295799255371, -5.796946048736572, -5.661595821380615, -5.526246070861816, -5.390895843505859, -5.255545616149902, -5.120195388793945, -4.9848456382751465, -4.8494954109191895, -4.714145660400391, -4.578795433044434, -4.443445205688477, -4.308095455169678, -4.172745704650879, -4.037395477294922, -3.902045726776123, -3.766695499420166, -3.631345510482788, -3.49599552154541, -3.3606455326080322, -3.2252955436706543, -3.0899453163146973, -2.9545953273773193, -2.8192453384399414, -2.6838951110839844, -2.5485451221466064, -2.4131951332092285, -2.2778451442718506, -2.1424951553344727, -2.0071449279785156, -1.8717949390411377, -1.7364448308944702, -1.6010948419570923, -1.4657447338104248, -1.3303947448730469, -1.195044755935669, -1.059694766998291, -0.9243447780609131, -0.7889947295188904, -0.6536446809768677, -0.5182946920394897, -0.38294464349746704, -0.24759459495544434, -0.1122446060180664, 0.0231054425239563, 0.158455491065979, 0.2938055396080017, 0.429155558347702, 0.5645055770874023, 0.699855625629425, 0.8352056741714478, 0.9705556631088257, 1.1059057712554932, 1.241255760192871]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 5.0, 7.0, 9.0, 13.0, 13.0, 20.0, 27.0, 26.0, 26.0, 27.0, 35.0, 39.0, 29.0, 33.0, 46.0, 34.0, 49.0, 48.0, 40.0, 39.0, 41.0, 43.0, 36.0, 41.0, 35.0, 27.0, 23.0, 29.0, 25.0, 25.0, 27.0, 11.0, 12.0, 11.0, 11.0, 6.0, 7.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-1.9613538980484009, -1.9067612886428833, -1.8521686792373657, -1.7975761890411377, -1.7429835796356201, -1.6883909702301025, -1.633798360824585, -1.5792057514190674, -1.5246131420135498, -1.4700205326080322, -1.4154279232025146, -1.360835313796997, -1.306242823600769, -1.2516502141952515, -1.1970576047897339, -1.1424649953842163, -1.0878725051879883, -1.0332798957824707, -0.9786873459815979, -0.9240947365760803, -0.8695021867752075, -0.8149095773696899, -0.7603169679641724, -0.7057243585586548, -0.651131808757782, -0.5965391993522644, -0.5419466495513916, -0.487354040145874, -0.43276146054267883, -0.37816888093948364, -0.32357627153396606, -0.2689836919307709, -0.21439123153686523, -0.15979865193367004, -0.10520605742931366, -0.050613462924957275, 0.003979116678237915, 0.058571696281433105, 0.11316430568695068, 0.16775688529014587, 0.22234946489334106, 0.27694204449653625, 0.33153462409973145, 0.386127233505249, 0.4407198131084442, 0.4953123927116394, 0.549905002117157, 0.6044975519180298, 0.6590901613235474, 0.7136827707290649, 0.7682753205299377, 0.8228679299354553, 0.8774604797363281, 0.9320530891418457, 0.9866456985473633, 1.0412383079528809, 1.0958309173583984, 1.150423526763916, 1.2050161361694336, 1.2596087455749512, 1.3142012357711792, 1.3687938451766968, 1.4233864545822144, 1.477979063987732, 1.53257155418396]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 10.0, 11.0, 12.0, 19.0, 33.0, 21.0, 48.0, 60.0, 61.0, 109.0, 172.0, 236.0, 426.0, 591.0, 1204.0, 2470.0, 5441.0, 15017.0, 60319.0, 730036.0, 3096278.0, 231223.0, 32936.0, 9744.0, 3843.0, 1638.0, 876.0, 532.0, 279.0, 191.0, 116.0, 79.0, 56.0, 50.0, 28.0, 19.0, 22.0, 19.0, 10.0, 7.0, 12.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.083984375, -1.0504302978515625, -1.016876220703125, -0.9833221435546875, -0.94976806640625, -0.9162139892578125, -0.882659912109375, -0.8491058349609375, -0.8155517578125, -0.7819976806640625, -0.748443603515625, -0.7148895263671875, -0.68133544921875, -0.6477813720703125, -0.614227294921875, -0.5806732177734375, -0.547119140625, -0.5135650634765625, -0.480010986328125, -0.4464569091796875, -0.41290283203125, -0.3793487548828125, -0.345794677734375, -0.3122406005859375, -0.2786865234375, -0.2451324462890625, -0.211578369140625, -0.1780242919921875, -0.14447021484375, -0.1109161376953125, -0.077362060546875, -0.0438079833984375, -0.01025390625, 0.0233001708984375, 0.056854248046875, 0.0904083251953125, 0.12396240234375, 0.1575164794921875, 0.191070556640625, 0.2246246337890625, 0.2581787109375, 0.2917327880859375, 0.325286865234375, 0.3588409423828125, 0.39239501953125, 0.4259490966796875, 0.459503173828125, 0.4930572509765625, 0.526611328125, 0.5601654052734375, 0.593719482421875, 0.6272735595703125, 0.66082763671875, 0.6943817138671875, 0.727935791015625, 0.7614898681640625, 0.7950439453125, 0.8285980224609375, 0.862152099609375, 0.8957061767578125, 0.92926025390625, 0.9628143310546875, 0.996368408203125, 1.0299224853515625, 1.0634765625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 13.0, 13.0, 8.0, 12.0, 16.0, 34.0, 43.0, 30.0, 32.0, 37.0, 49.0, 48.0, 44.0, 46.0, 47.0, 45.0, 43.0, 56.0, 47.0, 39.0, 45.0, 41.0, 20.0, 36.0, 32.0, 14.0, 25.0, 7.0, 14.0, 10.0, 3.0, 7.0, 6.0, 6.0, 9.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.402587890625, -0.38924407958984375, -0.3759002685546875, -0.36255645751953125, -0.349212646484375, -0.33586883544921875, -0.3225250244140625, -0.30918121337890625, -0.29583740234375, -0.28249359130859375, -0.2691497802734375, -0.25580596923828125, -0.242462158203125, -0.22911834716796875, -0.2157745361328125, -0.20243072509765625, -0.1890869140625, -0.17574310302734375, -0.1623992919921875, -0.14905548095703125, -0.135711669921875, -0.12236785888671875, -0.1090240478515625, -0.09568023681640625, -0.08233642578125, -0.06899261474609375, -0.0556488037109375, -0.04230499267578125, -0.028961181640625, -0.01561737060546875, -0.0022735595703125, 0.01107025146484375, 0.0244140625, 0.03775787353515625, 0.0511016845703125, 0.06444549560546875, 0.077789306640625, 0.09113311767578125, 0.1044769287109375, 0.11782073974609375, 0.13116455078125, 0.14450836181640625, 0.1578521728515625, 0.17119598388671875, 0.184539794921875, 0.19788360595703125, 0.2112274169921875, 0.22457122802734375, 0.2379150390625, 0.25125885009765625, 0.2646026611328125, 0.27794647216796875, 0.291290283203125, 0.30463409423828125, 0.3179779052734375, 0.33132171630859375, 0.34466552734375, 0.35800933837890625, 0.3713531494140625, 0.38469696044921875, 0.398040771484375, 0.41138458251953125, 0.4247283935546875, 0.43807220458984375, 0.451416015625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 5.0, 11.0, 12.0, 17.0, 18.0, 29.0, 30.0, 35.0, 77.0, 156.0, 310.0, 728.0, 1983.0, 6450.0, 31693.0, 551010.0, 3479117.0, 103209.0, 13581.0, 3592.0, 1147.0, 486.0, 221.0, 123.0, 70.0, 34.0, 32.0, 21.0, 15.0, 15.0, 11.0, 6.0, 5.0, 4.0, 6.0, 3.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.7578125, -1.7049560546875, -1.652099609375, -1.5992431640625, -1.54638671875, -1.4935302734375, -1.440673828125, -1.3878173828125, -1.3349609375, -1.2821044921875, -1.229248046875, -1.1763916015625, -1.12353515625, -1.0706787109375, -1.017822265625, -0.9649658203125, -0.912109375, -0.8592529296875, -0.806396484375, -0.7535400390625, -0.70068359375, -0.6478271484375, -0.594970703125, -0.5421142578125, -0.4892578125, -0.4364013671875, -0.383544921875, -0.3306884765625, -0.27783203125, -0.2249755859375, -0.172119140625, -0.1192626953125, -0.06640625, -0.0135498046875, 0.039306640625, 0.0921630859375, 0.14501953125, 0.1978759765625, 0.250732421875, 0.3035888671875, 0.3564453125, 0.4093017578125, 0.462158203125, 0.5150146484375, 0.56787109375, 0.6207275390625, 0.673583984375, 0.7264404296875, 0.779296875, 0.8321533203125, 0.885009765625, 0.9378662109375, 0.99072265625, 1.0435791015625, 1.096435546875, 1.1492919921875, 1.2021484375, 1.2550048828125, 1.307861328125, 1.3607177734375, 1.41357421875, 1.4664306640625, 1.519287109375, 1.5721435546875, 1.625]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 5.0, 12.0, 8.0, 6.0, 8.0, 18.0, 16.0, 41.0, 43.0, 57.0, 74.0, 102.0, 159.0, 252.0, 413.0, 587.0, 650.0, 560.0, 338.0, 203.0, 142.0, 121.0, 66.0, 53.0, 35.0, 19.0, 14.0, 9.0, 10.0, 10.0, 5.0, 6.0, 6.0, 2.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.3583984375, -0.3485374450683594, -0.33867645263671875, -0.3288154602050781, -0.3189544677734375, -0.3090934753417969, -0.29923248291015625, -0.2893714904785156, -0.279510498046875, -0.2696495056152344, -0.25978851318359375, -0.24992752075195312, -0.2400665283203125, -0.23020553588867188, -0.22034454345703125, -0.21048355102539062, -0.20062255859375, -0.19076156616210938, -0.18090057373046875, -0.17103958129882812, -0.1611785888671875, -0.15131759643554688, -0.14145660400390625, -0.13159561157226562, -0.121734619140625, -0.11187362670898438, -0.10201263427734375, -0.09215164184570312, -0.0822906494140625, -0.07242965698242188, -0.06256866455078125, -0.052707672119140625, -0.0428466796875, -0.032985687255859375, -0.02312469482421875, -0.013263702392578125, -0.0034027099609375, 0.006458282470703125, 0.01631927490234375, 0.026180267333984375, 0.036041259765625, 0.045902252197265625, 0.05576324462890625, 0.06562423706054688, 0.0754852294921875, 0.08534622192382812, 0.09520721435546875, 0.10506820678710938, 0.11492919921875, 0.12479019165039062, 0.13465118408203125, 0.14451217651367188, 0.1543731689453125, 0.16423416137695312, 0.17409515380859375, 0.18395614624023438, 0.193817138671875, 0.20367813110351562, 0.21353912353515625, 0.22340011596679688, 0.2332611083984375, 0.24312210083007812, 0.25298309326171875, 0.2628440856933594, 0.272705078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 5.0, 13.0, 12.0, 9.0, 15.0, 11.0, 20.0, 28.0, 40.0, 50.0, 55.0, 58.0, 72.0, 98.0, 93.0, 84.0, 68.0, 71.0, 47.0, 43.0, 29.0, 20.0, 19.0, 14.0, 9.0, 0.0, 8.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.4544001817703247, -1.421303153038025, -1.388206124305725, -1.3551090955734253, -1.3220120668411255, -1.2889150381088257, -1.2558180093765259, -1.222720980644226, -1.1896239519119263, -1.1565269231796265, -1.1234298944473267, -1.0903328657150269, -1.057235836982727, -1.0241388082504272, -0.9910417795181274, -0.9579447507858276, -0.9248477816581726, -0.8917507529258728, -0.858653724193573, -0.8255566954612732, -0.7924596667289734, -0.7593626379966736, -0.7262656688690186, -0.6931686401367188, -0.660071611404419, -0.6269745826721191, -0.5938775539398193, -0.5607805252075195, -0.5276834964752197, -0.4945864677429199, -0.4614894688129425, -0.4283924400806427, -0.3952954411506653, -0.3621984124183655, -0.3291013836860657, -0.29600435495376587, -0.26290732622146606, -0.22981031239032745, -0.19671329855918884, -0.16361626982688904, -0.13051924109458923, -0.09742221236228943, -0.06432519108057022, -0.031228169798851013, 0.0018688589334487915, 0.034965887665748596, 0.06806290149688721, 0.10115993022918701, 0.13425695896148682, 0.16735398769378662, 0.20045101642608643, 0.23354803025722504, 0.26664507389068604, 0.29974210262298584, 0.33283910155296326, 0.36593613028526306, 0.39903315901756287, 0.43213018774986267, 0.4652272164821625, 0.4983242154121399, 0.5314212441444397, 0.5645182728767395, 0.5976153016090393, 0.6307123303413391, 0.6638093590736389]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 4.0, 13.0, 5.0, 5.0, 22.0, 16.0, 21.0, 25.0, 20.0, 23.0, 13.0, 26.0, 29.0, 24.0, 42.0, 41.0, 28.0, 36.0, 35.0, 40.0, 41.0, 28.0, 32.0, 42.0, 39.0, 35.0, 37.0, 37.0, 24.0, 31.0, 30.0, 20.0, 25.0, 15.0, 9.0, 13.0, 6.0, 15.0, 11.0, 4.0, 3.0, 7.0, 1.0, 5.0, 3.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.5339183211326599, -0.5166115164756775, -0.49930477142333984, -0.4819979667663574, -0.4646911919116974, -0.44738441705703735, -0.43007761240005493, -0.4127708375453949, -0.39546406269073486, -0.37815728783607483, -0.3608505129814148, -0.3435437083244324, -0.32623693346977234, -0.3089301586151123, -0.2916233539581299, -0.27431657910346985, -0.2570098042488098, -0.23970302939414978, -0.22239623963832855, -0.20508944988250732, -0.1877826750278473, -0.17047590017318726, -0.15316911041736603, -0.1358623206615448, -0.11855554580688477, -0.10124876350164413, -0.0839419811964035, -0.06663519889116287, -0.04932841658592224, -0.03202163428068161, -0.014714851975440979, 0.002591930329799652, 0.019898653030395508, 0.03720543533563614, 0.05451221764087677, 0.0718189999461174, 0.08912578225135803, 0.10643256455659866, 0.1237393468618393, 0.14104613661766052, 0.15835291147232056, 0.1756596863269806, 0.19296647608280182, 0.21027326583862305, 0.22758004069328308, 0.24488681554794312, 0.26219362020492554, 0.27950039505958557, 0.2968071699142456, 0.31411394476890564, 0.3314207196235657, 0.3487275242805481, 0.36603429913520813, 0.38334107398986816, 0.4006478786468506, 0.4179546535015106, 0.43526142835617065, 0.4525682032108307, 0.4698749780654907, 0.48718178272247314, 0.5044885873794556, 0.5217953324317932, 0.5391021370887756, 0.5564088821411133, 0.5737156867980957]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 9.0, 11.0, 12.0, 22.0, 17.0, 30.0, 37.0, 53.0, 91.0, 102.0, 148.0, 210.0, 298.0, 535.0, 817.0, 1372.0, 2498.0, 4786.0, 10147.0, 34300.0, 385357.0, 537052.0, 46647.0, 11770.0, 5364.0, 2787.0, 1541.0, 859.0, 544.0, 336.0, 228.0, 163.0, 111.0, 72.0, 53.0, 47.0, 39.0, 19.0, 14.0, 12.0, 11.0, 6.0, 3.0, 5.0, 7.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.28759765625, -0.2789039611816406, -0.27021026611328125, -0.2615165710449219, -0.2528228759765625, -0.24412918090820312, -0.23543548583984375, -0.22674179077148438, -0.218048095703125, -0.20935440063476562, -0.20066070556640625, -0.19196701049804688, -0.1832733154296875, -0.17457962036132812, -0.16588592529296875, -0.15719223022460938, -0.14849853515625, -0.13980484008789062, -0.13111114501953125, -0.12241744995117188, -0.1137237548828125, -0.10503005981445312, -0.09633636474609375, -0.08764266967773438, -0.078948974609375, -0.07025527954101562, -0.06156158447265625, -0.052867889404296875, -0.0441741943359375, -0.035480499267578125, -0.02678680419921875, -0.018093109130859375, -0.0093994140625, -0.000705718994140625, 0.00798797607421875, 0.016681671142578125, 0.0253753662109375, 0.034069061279296875, 0.04276275634765625, 0.051456451416015625, 0.060150146484375, 0.06884384155273438, 0.07753753662109375, 0.08623123168945312, 0.0949249267578125, 0.10361862182617188, 0.11231231689453125, 0.12100601196289062, 0.12969970703125, 0.13839340209960938, 0.14708709716796875, 0.15578079223632812, 0.1644744873046875, 0.17316818237304688, 0.18186187744140625, 0.19055557250976562, 0.199249267578125, 0.20794296264648438, 0.21663665771484375, 0.22533035278320312, 0.2340240478515625, 0.24271774291992188, 0.25141143798828125, 0.2601051330566406, 0.268798828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 7.0, 12.0, 4.0, 12.0, 11.0, 17.0, 25.0, 19.0, 29.0, 29.0, 28.0, 34.0, 40.0, 45.0, 37.0, 41.0, 38.0, 37.0, 50.0, 35.0, 46.0, 49.0, 41.0, 41.0, 41.0, 37.0, 36.0, 21.0, 19.0, 26.0, 20.0, 15.0, 10.0, 9.0, 9.0, 3.0, 9.0, 3.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.435546875, -0.4220542907714844, -0.40856170654296875, -0.3950691223144531, -0.3815765380859375, -0.3680839538574219, -0.35459136962890625, -0.3410987854003906, -0.327606201171875, -0.3141136169433594, -0.30062103271484375, -0.2871284484863281, -0.2736358642578125, -0.2601432800292969, -0.24665069580078125, -0.23315811157226562, -0.21966552734375, -0.20617294311523438, -0.19268035888671875, -0.17918777465820312, -0.1656951904296875, -0.15220260620117188, -0.13871002197265625, -0.12521743774414062, -0.111724853515625, -0.09823226928710938, -0.08473968505859375, -0.07124710083007812, -0.0577545166015625, -0.044261932373046875, -0.03076934814453125, -0.017276763916015625, -0.0037841796875, 0.009708404541015625, 0.02320098876953125, 0.036693572998046875, 0.0501861572265625, 0.06367874145507812, 0.07717132568359375, 0.09066390991210938, 0.104156494140625, 0.11764907836914062, 0.13114166259765625, 0.14463424682617188, 0.1581268310546875, 0.17161941528320312, 0.18511199951171875, 0.19860458374023438, 0.21209716796875, 0.22558975219726562, 0.23908233642578125, 0.2525749206542969, 0.2660675048828125, 0.2795600891113281, 0.29305267333984375, 0.3065452575683594, 0.320037841796875, 0.3335304260253906, 0.34702301025390625, 0.3605155944824219, 0.3740081787109375, 0.3875007629394531, 0.40099334716796875, 0.4144859313964844, 0.427978515625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 2.0, 4.0, 4.0, 5.0, 8.0, 19.0, 23.0, 21.0, 32.0, 51.0, 90.0, 163.0, 296.0, 597.0, 1328.0, 3540.0, 14386.0, 208907.0, 763621.0, 44753.0, 6729.0, 2139.0, 853.0, 410.0, 213.0, 130.0, 70.0, 49.0, 24.0, 26.0, 14.0, 8.0, 9.0, 9.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.301025390625, -0.29107666015625, -0.2811279296875, -0.27117919921875, -0.26123046875, -0.25128173828125, -0.2413330078125, -0.23138427734375, -0.221435546875, -0.21148681640625, -0.2015380859375, -0.19158935546875, -0.181640625, -0.17169189453125, -0.1617431640625, -0.15179443359375, -0.141845703125, -0.13189697265625, -0.1219482421875, -0.11199951171875, -0.10205078125, -0.09210205078125, -0.0821533203125, -0.07220458984375, -0.062255859375, -0.05230712890625, -0.0423583984375, -0.03240966796875, -0.0224609375, -0.01251220703125, -0.0025634765625, 0.00738525390625, 0.017333984375, 0.02728271484375, 0.0372314453125, 0.04718017578125, 0.05712890625, 0.06707763671875, 0.0770263671875, 0.08697509765625, 0.096923828125, 0.10687255859375, 0.1168212890625, 0.12677001953125, 0.13671875, 0.14666748046875, 0.1566162109375, 0.16656494140625, 0.176513671875, 0.18646240234375, 0.1964111328125, 0.20635986328125, 0.21630859375, 0.22625732421875, 0.2362060546875, 0.24615478515625, 0.256103515625, 0.26605224609375, 0.2760009765625, 0.28594970703125, 0.2958984375, 0.30584716796875, 0.3157958984375, 0.32574462890625, 0.335693359375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 7.0, 4.0, 6.0, 8.0, 9.0, 5.0, 14.0, 13.0, 9.0, 17.0, 19.0, 25.0, 19.0, 40.0, 44.0, 29.0, 37.0, 43.0, 47.0, 41.0, 41.0, 42.0, 43.0, 47.0, 50.0, 35.0, 36.0, 38.0, 29.0, 29.0, 26.0, 24.0, 16.0, 18.0, 20.0, 11.0, 10.0, 10.0, 10.0, 8.0, 5.0, 6.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.8759384155273438, -0.8451385498046875, -0.8143386840820312, -0.783538818359375, -0.7527389526367188, -0.7219390869140625, -0.6911392211914062, -0.66033935546875, -0.6295394897460938, -0.5987396240234375, -0.5679397583007812, -0.537139892578125, -0.5063400268554688, -0.4755401611328125, -0.44474029541015625, -0.4139404296875, -0.38314056396484375, -0.3523406982421875, -0.32154083251953125, -0.290740966796875, -0.25994110107421875, -0.2291412353515625, -0.19834136962890625, -0.16754150390625, -0.13674163818359375, -0.1059417724609375, -0.07514190673828125, -0.044342041015625, -0.01354217529296875, 0.0172576904296875, 0.04805755615234375, 0.078857421875, 0.10965728759765625, 0.1404571533203125, 0.17125701904296875, 0.202056884765625, 0.23285675048828125, 0.2636566162109375, 0.29445648193359375, 0.32525634765625, 0.35605621337890625, 0.3868560791015625, 0.41765594482421875, 0.448455810546875, 0.47925567626953125, 0.5100555419921875, 0.5408554077148438, 0.5716552734375, 0.6024551391601562, 0.6332550048828125, 0.6640548706054688, 0.694854736328125, 0.7256546020507812, 0.7564544677734375, 0.7872543334960938, 0.81805419921875, 0.8488540649414062, 0.8796539306640625, 0.9104537963867188, 0.941253662109375, 0.9720535278320312, 1.0028533935546875, 1.0336532592773438, 1.064453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 11.0, 10.0, 21.0, 32.0, 33.0, 53.0, 108.0, 170.0, 333.0, 619.0, 1313.0, 3360.0, 9867.0, 42922.0, 591656.0, 355355.0, 29887.0, 7724.0, 2787.0, 1092.0, 521.0, 269.0, 140.0, 102.0, 63.0, 41.0, 17.0, 16.0, 3.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12066650390625, -0.1167612075805664, -0.11285591125488281, -0.10895061492919922, -0.10504531860351562, -0.10114002227783203, -0.09723472595214844, -0.09332942962646484, -0.08942413330078125, -0.08551883697509766, -0.08161354064941406, -0.07770824432373047, -0.07380294799804688, -0.06989765167236328, -0.06599235534667969, -0.062087059020996094, -0.0581817626953125, -0.054276466369628906, -0.05037117004394531, -0.04646587371826172, -0.042560577392578125, -0.03865528106689453, -0.03474998474121094, -0.030844688415527344, -0.02693939208984375, -0.023034095764160156, -0.019128799438476562, -0.015223503112792969, -0.011318206787109375, -0.007412910461425781, -0.0035076141357421875, 0.00039768218994140625, 0.004302978515625, 0.008208274841308594, 0.012113571166992188, 0.01601886749267578, 0.019924163818359375, 0.02382946014404297, 0.027734756469726562, 0.031640052795410156, 0.03554534912109375, 0.039450645446777344, 0.04335594177246094, 0.04726123809814453, 0.051166534423828125, 0.05507183074951172, 0.05897712707519531, 0.0628824234008789, 0.0667877197265625, 0.0706930160522461, 0.07459831237792969, 0.07850360870361328, 0.08240890502929688, 0.08631420135498047, 0.09021949768066406, 0.09412479400634766, 0.09803009033203125, 0.10193538665771484, 0.10584068298339844, 0.10974597930908203, 0.11365127563476562, 0.11755657196044922, 0.12146186828613281, 0.1253671646118164, 0.1292724609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 7.0, 5.0, 8.0, 14.0, 15.0, 35.0, 24.0, 66.0, 131.0, 137.0, 191.0, 138.0, 76.0, 60.0, 29.0, 16.0, 14.0, 8.0, 9.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.88569450378418e-05, -7.655378431081772e-05, -7.425062358379364e-05, -7.194746285676956e-05, -6.964430212974548e-05, -6.73411414027214e-05, -6.503798067569733e-05, -6.273481994867325e-05, -6.043165922164917e-05, -5.812849849462509e-05, -5.582533776760101e-05, -5.3522177040576935e-05, -5.1219016313552856e-05, -4.891585558652878e-05, -4.66126948595047e-05, -4.430953413248062e-05, -4.200637340545654e-05, -3.9703212678432465e-05, -3.7400051951408386e-05, -3.509689122438431e-05, -3.279373049736023e-05, -3.049056977033615e-05, -2.8187409043312073e-05, -2.5884248316287994e-05, -2.3581087589263916e-05, -2.1277926862239838e-05, -1.897476613521576e-05, -1.667160540819168e-05, -1.4368444681167603e-05, -1.2065283954143524e-05, -9.762123227119446e-06, -7.4589625000953674e-06, -5.155801773071289e-06, -2.8526410460472107e-06, -5.494803190231323e-07, 1.753680408000946e-06, 4.056841135025024e-06, 6.360001862049103e-06, 8.663162589073181e-06, 1.096632331609726e-05, 1.3269484043121338e-05, 1.5572644770145416e-05, 1.7875805497169495e-05, 2.0178966224193573e-05, 2.248212695121765e-05, 2.478528767824173e-05, 2.7088448405265808e-05, 2.9391609132289886e-05, 3.1694769859313965e-05, 3.399793058633804e-05, 3.630109131336212e-05, 3.86042520403862e-05, 4.090741276741028e-05, 4.321057349443436e-05, 4.5513734221458435e-05, 4.7816894948482513e-05, 5.012005567550659e-05, 5.242321640253067e-05, 5.472637712955475e-05, 5.702953785657883e-05, 5.9332698583602905e-05, 6.163585931062698e-05, 6.393902003765106e-05, 6.624218076467514e-05, 6.854534149169922e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 10.0, 15.0, 26.0, 37.0, 36.0, 65.0, 97.0, 135.0, 170.0, 234.0, 364.0, 528.0, 734.0, 1068.0, 1666.0, 2500.0, 4258.0, 7005.0, 12988.0, 28993.0, 83018.0, 267915.0, 390685.0, 153618.0, 48192.0, 19566.0, 9682.0, 5531.0, 3360.0, 2008.0, 1353.0, 860.0, 555.0, 425.0, 288.0, 165.0, 135.0, 73.0, 67.0, 45.0, 24.0, 17.0, 17.0, 10.0, 2.0, 6.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0584716796875, -0.05660057067871094, -0.054729461669921875, -0.05285835266113281, -0.05098724365234375, -0.04911613464355469, -0.047245025634765625, -0.04537391662597656, -0.0435028076171875, -0.04163169860839844, -0.039760589599609375, -0.03788948059082031, -0.03601837158203125, -0.03414726257324219, -0.032276153564453125, -0.030405044555664062, -0.028533935546875, -0.026662826538085938, -0.024791717529296875, -0.022920608520507812, -0.02104949951171875, -0.019178390502929688, -0.017307281494140625, -0.015436172485351562, -0.0135650634765625, -0.011693954467773438, -0.009822845458984375, -0.007951736450195312, -0.00608062744140625, -0.0042095184326171875, -0.002338409423828125, -0.0004673004150390625, 0.00140380859375, 0.0032749176025390625, 0.005146026611328125, 0.0070171356201171875, 0.00888824462890625, 0.010759353637695312, 0.012630462646484375, 0.014501571655273438, 0.0163726806640625, 0.018243789672851562, 0.020114898681640625, 0.021986007690429688, 0.02385711669921875, 0.025728225708007812, 0.027599334716796875, 0.029470443725585938, 0.031341552734375, 0.03321266174316406, 0.035083770751953125, 0.03695487976074219, 0.03882598876953125, 0.04069709777832031, 0.042568206787109375, 0.04443931579589844, 0.0463104248046875, 0.04818153381347656, 0.050052642822265625, 0.05192375183105469, 0.05379486083984375, 0.05566596984863281, 0.057537078857421875, 0.05940818786621094, 0.061279296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 2.0, 8.0, 19.0, 12.0, 19.0, 35.0, 45.0, 57.0, 69.0, 79.0, 96.0, 106.0, 112.0, 69.0, 70.0, 45.0, 37.0, 22.0, 16.0, 15.0, 7.0, 13.0, 4.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02008056640625, -0.019389867782592773, -0.018699169158935547, -0.01800847053527832, -0.017317771911621094, -0.016627073287963867, -0.01593637466430664, -0.015245676040649414, -0.014554977416992188, -0.013864278793334961, -0.013173580169677734, -0.012482881546020508, -0.011792182922363281, -0.011101484298706055, -0.010410785675048828, -0.009720087051391602, -0.009029388427734375, -0.008338689804077148, -0.007647991180419922, -0.006957292556762695, -0.006266593933105469, -0.005575895309448242, -0.004885196685791016, -0.004194498062133789, -0.0035037994384765625, -0.002813100814819336, -0.0021224021911621094, -0.0014317035675048828, -0.0007410049438476562, -5.030632019042969e-05, 0.0006403923034667969, 0.0013310909271240234, 0.00202178955078125, 0.0027124881744384766, 0.003403186798095703, 0.00409388542175293, 0.004784584045410156, 0.005475282669067383, 0.006165981292724609, 0.006856679916381836, 0.0075473785400390625, 0.008238077163696289, 0.008928775787353516, 0.009619474411010742, 0.010310173034667969, 0.011000871658325195, 0.011691570281982422, 0.012382268905639648, 0.013072967529296875, 0.013763666152954102, 0.014454364776611328, 0.015145063400268555, 0.01583576202392578, 0.016526460647583008, 0.017217159271240234, 0.01790785789489746, 0.018598556518554688, 0.019289255142211914, 0.01997995376586914, 0.020670652389526367, 0.021361351013183594, 0.02205204963684082, 0.022742748260498047, 0.023433446884155273, 0.0241241455078125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 7.0, 4.0, 4.0, 8.0, 5.0, 10.0, 6.0, 10.0, 19.0, 21.0, 29.0, 30.0, 43.0, 62.0, 63.0, 71.0, 78.0, 95.0, 82.0, 85.0, 70.0, 48.0, 45.0, 30.0, 17.0, 24.0, 12.0, 8.0, 4.0, 5.0, 3.0, 3.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.8636022806167603, -0.8430411219596863, -0.8224799633026123, -0.8019188046455383, -0.7813576459884644, -0.7607964873313904, -0.7402353286743164, -0.7196741700172424, -0.6991130113601685, -0.6785518527030945, -0.6579906940460205, -0.6374295353889465, -0.6168683767318726, -0.5963072180747986, -0.5757460594177246, -0.5551849007606506, -0.5346237421035767, -0.5140625834465027, -0.4935014247894287, -0.47294026613235474, -0.45237910747528076, -0.4318179488182068, -0.4112567901611328, -0.39069563150405884, -0.37013453245162964, -0.34957337379455566, -0.3290122151374817, -0.3084510564804077, -0.28788989782333374, -0.26732873916625977, -0.24676759541034698, -0.226206436753273, -0.20564529299736023, -0.18508413434028625, -0.16452297568321228, -0.1439618170261383, -0.12340066581964493, -0.10283950716257095, -0.08227835595607758, -0.0617171972990036, -0.041156038641929626, -0.0205948818475008, -3.372505307197571e-05, 0.0205274298787117, 0.041088588535785675, 0.06164974719285965, 0.08221089839935303, 0.102772057056427, 0.12333321571350098, 0.14389437437057495, 0.16445553302764893, 0.1850166916847229, 0.20557785034179688, 0.22613900899887085, 0.24670015275478363, 0.2672613263130188, 0.2878224849700928, 0.30838364362716675, 0.3289448022842407, 0.3495059609413147, 0.37006711959838867, 0.39062827825546265, 0.4111894369125366, 0.4317505955696106, 0.4523117244243622]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 5.0, 5.0, 7.0, 19.0, 22.0, 16.0, 21.0, 17.0, 22.0, 23.0, 25.0, 30.0, 31.0, 35.0, 40.0, 37.0, 41.0, 37.0, 41.0, 34.0, 37.0, 46.0, 35.0, 36.0, 33.0, 46.0, 33.0, 33.0, 29.0, 27.0, 19.0, 21.0, 14.0, 11.0, 9.0, 10.0, 11.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.37475356459617615, -0.36298030614852905, -0.35120704770088196, -0.33943378925323486, -0.32766053080558777, -0.3158872723579407, -0.3041140139102936, -0.2923407554626465, -0.2805674970149994, -0.2687942385673523, -0.2570209801197052, -0.2452477216720581, -0.233474463224411, -0.22170120477676392, -0.20992794632911682, -0.19815468788146973, -0.18638142943382263, -0.17460817098617554, -0.16283491253852844, -0.15106165409088135, -0.13928839564323425, -0.12751513719558716, -0.11574187874794006, -0.10396862030029297, -0.09219536185264587, -0.08042210340499878, -0.06864884495735168, -0.05687558650970459, -0.045102328062057495, -0.0333290696144104, -0.021555811166763306, -0.009782552719116211, 0.0019907355308532715, 0.013763993978500366, 0.02553725242614746, 0.037310510873794556, 0.04908376932144165, 0.060857027769088745, 0.07263028621673584, 0.08440354466438293, 0.09617680311203003, 0.10795006155967712, 0.11972332000732422, 0.1314965784549713, 0.1432698369026184, 0.1550430953502655, 0.1668163537979126, 0.1785896122455597, 0.1903628706932068, 0.20213612914085388, 0.21390938758850098, 0.22568264603614807, 0.23745590448379517, 0.24922916293144226, 0.26100242137908936, 0.27277567982673645, 0.28454893827438354, 0.29632219672203064, 0.30809545516967773, 0.31986871361732483, 0.3316419720649719, 0.343415230512619, 0.3551884889602661, 0.3669617474079132, 0.3787350058555603]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 7.0, 13.0, 15.0, 14.0, 26.0, 19.0, 51.0, 60.0, 86.0, 142.0, 156.0, 235.0, 369.0, 573.0, 1035.0, 1714.0, 3105.0, 6436.0, 13833.0, 32418.0, 82648.0, 227756.0, 399529.0, 167917.0, 62635.0, 25269.0, 10976.0, 5093.0, 2529.0, 1443.0, 816.0, 488.0, 327.0, 236.0, 156.0, 106.0, 86.0, 63.0, 54.0, 39.0, 18.0, 21.0, 11.0, 6.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.67333984375, -0.6531524658203125, -0.632965087890625, -0.6127777099609375, -0.59259033203125, -0.5724029541015625, -0.552215576171875, -0.5320281982421875, -0.5118408203125, -0.4916534423828125, -0.471466064453125, -0.4512786865234375, -0.43109130859375, -0.4109039306640625, -0.390716552734375, -0.3705291748046875, -0.350341796875, -0.3301544189453125, -0.309967041015625, -0.2897796630859375, -0.26959228515625, -0.2494049072265625, -0.229217529296875, -0.2090301513671875, -0.1888427734375, -0.1686553955078125, -0.148468017578125, -0.1282806396484375, -0.10809326171875, -0.0879058837890625, -0.067718505859375, -0.0475311279296875, -0.02734375, -0.0071563720703125, 0.013031005859375, 0.0332183837890625, 0.05340576171875, 0.0735931396484375, 0.093780517578125, 0.1139678955078125, 0.1341552734375, 0.1543426513671875, 0.174530029296875, 0.1947174072265625, 0.21490478515625, 0.2350921630859375, 0.255279541015625, 0.2754669189453125, 0.295654296875, 0.3158416748046875, 0.336029052734375, 0.3562164306640625, 0.37640380859375, 0.3965911865234375, 0.416778564453125, 0.4369659423828125, 0.4571533203125, 0.4773406982421875, 0.497528076171875, 0.5177154541015625, 0.53790283203125, 0.5580902099609375, 0.578277587890625, 0.5984649658203125, 0.61865234375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 8.0, 10.0, 11.0, 19.0, 19.0, 21.0, 21.0, 24.0, 27.0, 28.0, 30.0, 30.0, 44.0, 42.0, 36.0, 53.0, 43.0, 54.0, 43.0, 46.0, 33.0, 51.0, 34.0, 40.0, 34.0, 36.0, 31.0, 20.0, 10.0, 22.0, 10.0, 11.0, 16.0, 7.0, 5.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.724609375, -0.7022018432617188, -0.6797943115234375, -0.6573867797851562, -0.634979248046875, -0.6125717163085938, -0.5901641845703125, -0.5677566528320312, -0.54534912109375, -0.5229415893554688, -0.5005340576171875, -0.47812652587890625, -0.455718994140625, -0.43331146240234375, -0.4109039306640625, -0.38849639892578125, -0.3660888671875, -0.34368133544921875, -0.3212738037109375, -0.29886627197265625, -0.276458740234375, -0.25405120849609375, -0.2316436767578125, -0.20923614501953125, -0.18682861328125, -0.16442108154296875, -0.1420135498046875, -0.11960601806640625, -0.097198486328125, -0.07479095458984375, -0.0523834228515625, -0.02997589111328125, -0.007568359375, 0.01483917236328125, 0.0372467041015625, 0.05965423583984375, 0.082061767578125, 0.10446929931640625, 0.1268768310546875, 0.14928436279296875, 0.17169189453125, 0.19409942626953125, 0.2165069580078125, 0.23891448974609375, 0.261322021484375, 0.28372955322265625, 0.3061370849609375, 0.32854461669921875, 0.3509521484375, 0.37335968017578125, 0.3957672119140625, 0.41817474365234375, 0.440582275390625, 0.46298980712890625, 0.4853973388671875, 0.5078048706054688, 0.53021240234375, 0.5526199340820312, 0.5750274658203125, 0.5974349975585938, 0.619842529296875, 0.6422500610351562, 0.6646575927734375, 0.6870651245117188, 0.70947265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 4.0, 11.0, 12.0, 30.0, 27.0, 48.0, 65.0, 77.0, 142.0, 171.0, 311.0, 442.0, 713.0, 1123.0, 1832.0, 3132.0, 5801.0, 11406.0, 23742.0, 53043.0, 134186.0, 351645.0, 277664.0, 101698.0, 41464.0, 18548.0, 9239.0, 4803.0, 2751.0, 1642.0, 1012.0, 621.0, 358.0, 252.0, 149.0, 116.0, 67.0, 62.0, 46.0, 28.0, 29.0, 12.0, 8.0, 1.0, 5.0, 5.0, 4.0, 1.0, 5.0], "bins": [-0.64404296875, -0.6265678405761719, -0.6090927124023438, -0.5916175842285156, -0.5741424560546875, -0.5566673278808594, -0.5391921997070312, -0.5217170715332031, -0.504241943359375, -0.4867668151855469, -0.46929168701171875, -0.4518165588378906, -0.4343414306640625, -0.4168663024902344, -0.39939117431640625, -0.3819160461425781, -0.36444091796875, -0.3469657897949219, -0.32949066162109375, -0.3120155334472656, -0.2945404052734375, -0.2770652770996094, -0.25959014892578125, -0.24211502075195312, -0.224639892578125, -0.20716476440429688, -0.18968963623046875, -0.17221450805664062, -0.1547393798828125, -0.13726425170898438, -0.11978912353515625, -0.10231399536132812, -0.0848388671875, -0.06736373901367188, -0.04988861083984375, -0.032413482666015625, -0.0149383544921875, 0.002536773681640625, 0.02001190185546875, 0.037487030029296875, 0.054962158203125, 0.07243728637695312, 0.08991241455078125, 0.10738754272460938, 0.1248626708984375, 0.14233779907226562, 0.15981292724609375, 0.17728805541992188, 0.19476318359375, 0.21223831176757812, 0.22971343994140625, 0.24718856811523438, 0.2646636962890625, 0.2821388244628906, 0.29961395263671875, 0.3170890808105469, 0.334564208984375, 0.3520393371582031, 0.36951446533203125, 0.3869895935058594, 0.4044647216796875, 0.4219398498535156, 0.43941497802734375, 0.4568901062011719, 0.474365234375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 5.0, 12.0, 5.0, 15.0, 14.0, 16.0, 22.0, 18.0, 27.0, 19.0, 25.0, 21.0, 30.0, 33.0, 40.0, 25.0, 34.0, 37.0, 41.0, 39.0, 43.0, 46.0, 47.0, 26.0, 32.0, 41.0, 31.0, 27.0, 28.0, 37.0, 32.0, 16.0, 18.0, 12.0, 12.0, 11.0, 13.0, 9.0, 9.0, 7.0, 4.0, 3.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.6298828125, -0.6074905395507812, -0.5850982666015625, -0.5627059936523438, -0.540313720703125, -0.5179214477539062, -0.4955291748046875, -0.47313690185546875, -0.45074462890625, -0.42835235595703125, -0.4059600830078125, -0.38356781005859375, -0.361175537109375, -0.33878326416015625, -0.3163909912109375, -0.29399871826171875, -0.2716064453125, -0.24921417236328125, -0.2268218994140625, -0.20442962646484375, -0.182037353515625, -0.15964508056640625, -0.1372528076171875, -0.11486053466796875, -0.09246826171875, -0.07007598876953125, -0.0476837158203125, -0.02529144287109375, -0.002899169921875, 0.01949310302734375, 0.0418853759765625, 0.06427764892578125, 0.086669921875, 0.10906219482421875, 0.1314544677734375, 0.15384674072265625, 0.176239013671875, 0.19863128662109375, 0.2210235595703125, 0.24341583251953125, 0.26580810546875, 0.28820037841796875, 0.3105926513671875, 0.33298492431640625, 0.355377197265625, 0.37776947021484375, 0.4001617431640625, 0.42255401611328125, 0.4449462890625, 0.46733856201171875, 0.4897308349609375, 0.5121231079101562, 0.534515380859375, 0.5569076538085938, 0.5792999267578125, 0.6016921997070312, 0.62408447265625, 0.6464767456054688, 0.6688690185546875, 0.6912612915039062, 0.713653564453125, 0.7360458374023438, 0.7584381103515625, 0.7808303833007812, 0.80322265625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 14.0, 17.0, 23.0, 47.0, 67.0, 98.0, 129.0, 175.0, 240.0, 356.0, 488.0, 726.0, 1101.0, 1552.0, 2481.0, 4194.0, 6886.0, 12080.0, 21556.0, 40074.0, 80922.0, 181323.0, 352796.0, 173575.0, 78117.0, 38957.0, 20653.0, 11645.0, 6798.0, 3969.0, 2555.0, 1576.0, 981.0, 717.0, 475.0, 320.0, 257.0, 176.0, 120.0, 79.0, 81.0, 45.0, 28.0, 22.0, 11.0, 15.0, 8.0, 12.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1058349609375, -0.10247230529785156, -0.09910964965820312, -0.09574699401855469, -0.09238433837890625, -0.08902168273925781, -0.08565902709960938, -0.08229637145996094, -0.0789337158203125, -0.07557106018066406, -0.07220840454101562, -0.06884574890136719, -0.06548309326171875, -0.06212043762207031, -0.058757781982421875, -0.05539512634277344, -0.052032470703125, -0.04866981506347656, -0.045307159423828125, -0.04194450378417969, -0.03858184814453125, -0.03521919250488281, -0.031856536865234375, -0.028493881225585938, -0.0251312255859375, -0.021768569946289062, -0.018405914306640625, -0.015043258666992188, -0.01168060302734375, -0.008317947387695312, -0.004955291748046875, -0.0015926361083984375, 0.00177001953125, 0.0051326751708984375, 0.008495330810546875, 0.011857986450195312, 0.01522064208984375, 0.018583297729492188, 0.021945953369140625, 0.025308609008789062, 0.0286712646484375, 0.03203392028808594, 0.035396575927734375, 0.03875923156738281, 0.04212188720703125, 0.04548454284667969, 0.048847198486328125, 0.05220985412597656, 0.055572509765625, 0.05893516540527344, 0.062297821044921875, 0.06566047668457031, 0.06902313232421875, 0.07238578796386719, 0.07574844360351562, 0.07911109924316406, 0.0824737548828125, 0.08583641052246094, 0.08919906616210938, 0.09256172180175781, 0.09592437744140625, 0.09928703308105469, 0.10264968872070312, 0.10601234436035156, 0.109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 6.0, 14.0, 9.0, 18.0, 8.0, 21.0, 22.0, 37.0, 43.0, 66.0, 62.0, 85.0, 134.0, 90.0, 74.0, 57.0, 49.0, 45.0, 35.0, 23.0, 20.0, 17.0, 13.0, 8.0, 8.0, 4.0, 4.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0471553802490234e-05, -3.93381342291832e-05, -3.820471465587616e-05, -3.707129508256912e-05, -3.5937875509262085e-05, -3.480445593595505e-05, -3.367103636264801e-05, -3.253761678934097e-05, -3.1404197216033936e-05, -3.0270777642726898e-05, -2.913735806941986e-05, -2.8003938496112823e-05, -2.6870518922805786e-05, -2.573709934949875e-05, -2.460367977619171e-05, -2.3470260202884674e-05, -2.2336840629577637e-05, -2.12034210562706e-05, -2.0070001482963562e-05, -1.8936581909656525e-05, -1.7803162336349487e-05, -1.666974276304245e-05, -1.5536323189735413e-05, -1.4402903616428375e-05, -1.3269484043121338e-05, -1.21360644698143e-05, -1.1002644896507263e-05, -9.869225323200226e-06, -8.735805749893188e-06, -7.602386176586151e-06, -6.468966603279114e-06, -5.335547029972076e-06, -4.202127456665039e-06, -3.0687078833580017e-06, -1.9352883100509644e-06, -8.01868736743927e-07, 3.3155083656311035e-07, 1.4649704098701477e-06, 2.598389983177185e-06, 3.7318095564842224e-06, 4.86522912979126e-06, 5.998648703098297e-06, 7.1320682764053345e-06, 8.265487849712372e-06, 9.39890742301941e-06, 1.0532326996326447e-05, 1.1665746569633484e-05, 1.2799166142940521e-05, 1.3932585716247559e-05, 1.5066005289554596e-05, 1.6199424862861633e-05, 1.733284443616867e-05, 1.8466264009475708e-05, 1.9599683582782745e-05, 2.0733103156089783e-05, 2.186652272939682e-05, 2.2999942302703857e-05, 2.4133361876010895e-05, 2.5266781449317932e-05, 2.640020102262497e-05, 2.7533620595932007e-05, 2.8667040169239044e-05, 2.980045974254608e-05, 3.093387931585312e-05, 3.2067298889160156e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 6.0, 10.0, 11.0, 22.0, 34.0, 38.0, 46.0, 83.0, 113.0, 152.0, 226.0, 311.0, 443.0, 668.0, 1075.0, 1728.0, 2819.0, 4978.0, 9174.0, 18070.0, 37825.0, 87496.0, 229057.0, 393591.0, 145558.0, 58443.0, 26801.0, 13156.0, 6697.0, 3769.0, 2132.0, 1352.0, 861.0, 559.0, 355.0, 236.0, 195.0, 136.0, 94.0, 72.0, 46.0, 39.0, 18.0, 10.0, 12.0, 20.0, 7.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.1473388671875, -0.14291000366210938, -0.13848114013671875, -0.13405227661132812, -0.1296234130859375, -0.12519454956054688, -0.12076568603515625, -0.11633682250976562, -0.111907958984375, -0.10747909545898438, -0.10305023193359375, -0.09862136840820312, -0.0941925048828125, -0.08976364135742188, -0.08533477783203125, -0.08090591430664062, -0.07647705078125, -0.07204818725585938, -0.06761932373046875, -0.06319046020507812, -0.0587615966796875, -0.054332733154296875, -0.04990386962890625, -0.045475006103515625, -0.041046142578125, -0.036617279052734375, -0.03218841552734375, -0.027759552001953125, -0.0233306884765625, -0.018901824951171875, -0.01447296142578125, -0.010044097900390625, -0.005615234375, -0.001186370849609375, 0.00324249267578125, 0.007671356201171875, 0.0121002197265625, 0.016529083251953125, 0.02095794677734375, 0.025386810302734375, 0.029815673828125, 0.034244537353515625, 0.03867340087890625, 0.043102264404296875, 0.0475311279296875, 0.051959991455078125, 0.05638885498046875, 0.060817718505859375, 0.06524658203125, 0.06967544555664062, 0.07410430908203125, 0.07853317260742188, 0.0829620361328125, 0.08739089965820312, 0.09181976318359375, 0.09624862670898438, 0.100677490234375, 0.10510635375976562, 0.10953521728515625, 0.11396408081054688, 0.1183929443359375, 0.12282180786132812, 0.12725067138671875, 0.13167953491210938, 0.1361083984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 8.0, 8.0, 17.0, 23.0, 16.0, 20.0, 39.0, 43.0, 60.0, 88.0, 96.0, 162.0, 100.0, 83.0, 59.0, 40.0, 36.0, 12.0, 12.0, 11.0, 8.0, 7.0, 7.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.12286376953125, -0.11893749237060547, -0.11501121520996094, -0.1110849380493164, -0.10715866088867188, -0.10323238372802734, -0.09930610656738281, -0.09537982940673828, -0.09145355224609375, -0.08752727508544922, -0.08360099792480469, -0.07967472076416016, -0.07574844360351562, -0.0718221664428711, -0.06789588928222656, -0.06396961212158203, -0.0600433349609375, -0.05611705780029297, -0.05219078063964844, -0.048264503479003906, -0.044338226318359375, -0.040411949157714844, -0.03648567199707031, -0.03255939483642578, -0.02863311767578125, -0.02470684051513672, -0.020780563354492188, -0.016854286193847656, -0.012928009033203125, -0.009001731872558594, -0.0050754547119140625, -0.0011491775512695312, 0.002777099609375, 0.006703376770019531, 0.010629653930664062, 0.014555931091308594, 0.018482208251953125, 0.022408485412597656, 0.026334762573242188, 0.03026103973388672, 0.03418731689453125, 0.03811359405517578, 0.04203987121582031, 0.045966148376464844, 0.049892425537109375, 0.053818702697753906, 0.05774497985839844, 0.06167125701904297, 0.0655975341796875, 0.06952381134033203, 0.07345008850097656, 0.0773763656616211, 0.08130264282226562, 0.08522891998291016, 0.08915519714355469, 0.09308147430419922, 0.09700775146484375, 0.10093402862548828, 0.10486030578613281, 0.10878658294677734, 0.11271286010742188, 0.1166391372680664, 0.12056541442871094, 0.12449169158935547, 0.12841796875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 9.0, 7.0, 19.0, 29.0, 45.0, 87.0, 148.0, 179.0, 168.0, 138.0, 89.0, 42.0, 21.0, 16.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.089381217956543, -4.000082492828369, -3.910783290863037, -3.8214845657348633, -3.7321856021881104, -3.6428866386413574, -3.5535879135131836, -3.4642889499664307, -3.3749899864196777, -3.285691022872925, -3.196392059326172, -3.107093334197998, -3.017794370651245, -2.928495407104492, -2.8391966819763184, -2.7498977184295654, -2.6605987548828125, -2.5712997913360596, -2.4820008277893066, -2.392702102661133, -2.30340313911438, -2.214104175567627, -2.124805450439453, -2.0355064868927, -1.9462075233459473, -1.8569085597991943, -1.767609715461731, -1.6783108711242676, -1.5890119075775146, -1.4997129440307617, -1.4104140996932983, -1.321115255355835, -1.2318161725997925, -1.142517328262329, -1.0532183647155762, -0.963919460773468, -0.8746205568313599, -0.7853216528892517, -0.6960227489471436, -0.6067238450050354, -0.5174249410629272, -0.4281260371208191, -0.33882713317871094, -0.24952822923660278, -0.16022932529449463, -0.07093042135238647, 0.01836848258972168, 0.10766738653182983, 0.196966290473938, 0.28626519441604614, 0.3755640983581543, 0.46486300230026245, 0.5541619062423706, 0.6434608101844788, 0.7327597141265869, 0.8220586180686951, 0.9113575220108032, 1.0006563663482666, 1.0899553298950195, 1.1792542934417725, 1.2685531377792358, 1.3578519821166992, 1.4471509456634521, 1.536449909210205, 1.6257487535476685]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 5.0, 6.0, 3.0, 14.0, 15.0, 16.0, 15.0, 10.0, 24.0, 29.0, 27.0, 30.0, 29.0, 39.0, 33.0, 44.0, 64.0, 35.0, 42.0, 55.0, 42.0, 45.0, 52.0, 44.0, 28.0, 34.0, 39.0, 24.0, 32.0, 23.0, 18.0, 19.0, 13.0, 8.0, 9.0, 4.0, 7.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.47878098487854, -1.4324082136154175, -1.3860353231430054, -1.3396625518798828, -1.2932897806167603, -1.2469170093536377, -1.2005441188812256, -1.154171347618103, -1.1077985763549805, -1.061425805091858, -1.0150529146194458, -0.9686801433563232, -0.9223073720932007, -0.8759345412254333, -0.829561710357666, -0.7831889390945435, -0.7368161082267761, -0.6904432773590088, -0.6440705060958862, -0.5976976752281189, -0.5513249039649963, -0.504952073097229, -0.45857927203178406, -0.4122064709663391, -0.36583366990089417, -0.3194608688354492, -0.2730880677700043, -0.22671525180339813, -0.18034245073795319, -0.13396964967250824, -0.0875968337059021, -0.04122403264045715, 0.005148768424987793, 0.05152157321572304, 0.09789437800645828, 0.14426718652248383, 0.19063998758792877, 0.23701278865337372, 0.28338560461997986, 0.3297584056854248, 0.37613120675086975, 0.4225040078163147, 0.46887680888175964, 0.5152496099472046, 0.5616224408149719, 0.6079952120780945, 0.6543680429458618, 0.7007408142089844, 0.7471136450767517, 0.793486475944519, 0.8398592472076416, 0.8862320780754089, 0.9326048493385315, 0.9789776802062988, 1.0253504514694214, 1.071723222732544, 1.118096113204956, 1.1644688844680786, 1.2108417749404907, 1.2572145462036133, 1.3035873174667358, 1.3499600887298584, 1.3963329792022705, 1.442705750465393, 1.4890785217285156]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 5.0, 5.0, 5.0, 5.0, 12.0, 6.0, 17.0, 22.0, 20.0, 26.0, 42.0, 49.0, 55.0, 94.0, 148.0, 209.0, 368.0, 567.0, 831.0, 1248.0, 1969.0, 1035770.0, 4267.0, 1635.0, 981.0, 714.0, 496.0, 318.0, 227.0, 132.0, 84.0, 64.0, 45.0, 35.0, 29.0, 27.0, 9.0, 18.0, 8.0, 7.0, 7.0, 6.0, 1.0, 9.0, 2.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3435776233673096, -2.269963264465332, -2.1963489055633545, -2.122734546661377, -2.0491201877593994, -1.9755058288574219, -1.9018913507461548, -1.8282769918441772, -1.7546626329421997, -1.6810482740402222, -1.6074339151382446, -1.533819556236267, -1.460205078125, -1.3865907192230225, -1.312976360321045, -1.2393620014190674, -1.1657476425170898, -1.0921332836151123, -1.0185189247131348, -0.9449045062065125, -0.8712901473045349, -0.7976757884025574, -0.7240613698959351, -0.6504470109939575, -0.57683265209198, -0.5032182931900024, -0.4296039044857025, -0.3559895157814026, -0.28237515687942505, -0.2087607979774475, -0.13514640927314758, -0.061532020568847656, 0.012082576751708984, 0.08569695055484772, 0.15931132435798645, 0.23292569816112518, 0.3065400719642639, 0.38015443086624146, 0.4537688195705414, 0.5273832082748413, 0.6009975671768188, 0.6746119260787964, 0.7482262849807739, 0.8218407034873962, 0.8954550623893738, 0.9690694212913513, 1.0426838397979736, 1.1162981986999512, 1.1899125576019287, 1.2635269165039062, 1.3371412754058838, 1.4107556343078613, 1.4843699932098389, 1.5579843521118164, 1.6315988302230835, 1.705213189125061, 1.7788275480270386, 1.8524419069290161, 1.9260562658309937, 1.9996706247329712, 2.0732851028442383, 2.146899461746216, 2.2205138206481934, 2.294128179550171, 2.3677425384521484]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 8.0, 28.0, 20.0, 31.0, 46.0, 131.0, 287.0, 811.0, 2492.0, 8143.0, 65199.0, 51378640.0, 10276.0, 3360.0, 1152.0, 397.0, 151.0, 64.0, 43.0, 26.0, 11.0, 12.0, 7.0, 8.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.265235900878906, -7.999208450317383, -7.733180522918701, -7.4671525955200195, -7.201125144958496, -6.935097694396973, -6.669069766998291, -6.403041839599609, -6.137014389038086, -5.8709869384765625, -5.604959011077881, -5.338931083679199, -5.072903633117676, -4.806876182556152, -4.540848255157471, -4.274820327758789, -4.008792877197266, -3.742765188217163, -3.4767374992370605, -3.210709810256958, -2.9446821212768555, -2.678654432296753, -2.4126267433166504, -2.146599054336548, -1.8805713653564453, -1.6145436763763428, -1.3485159873962402, -1.0824882984161377, -0.8164606094360352, -0.5504329204559326, -0.2844052314758301, -0.01837754249572754, 0.2476511001586914, 0.513678789138794, 0.7797064781188965, 1.045734167098999, 1.3117618560791016, 1.577789545059204, 1.8438172340393066, 2.109844923019409, 2.3758726119995117, 2.6419003009796143, 2.907927989959717, 3.1739556789398193, 3.439983367919922, 3.7060110569000244, 3.972038745880127, 4.238066673278809, 4.504094123840332, 4.7701215744018555, 5.036149501800537, 5.302177429199219, 5.568204879760742, 5.834232330322266, 6.100260257720947, 6.366288185119629, 6.632315635681152, 6.898343086242676, 7.164371013641357, 7.430398941040039, 7.6964263916015625, 7.962453842163086, 8.22848129272461, 8.49450969696045, 8.760537147521973]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 6.0, 4.0, 6.0, 9.0, 13.0, 21.0, 28.0, 38.0, 63.0, 117.0, 170.0, 290.0, 502.0, 847.0, 1466.0, 2551.0, 4666.0, 8858.0, 17318.0, 34980.0, 72950.0, 157547.0, 329999.0, 686433.0, 3570371.0, 738085.0, 346004.0, 166383.0, 77157.0, 36397.0, 17848.0, 9175.0, 4828.0, 2604.0, 1523.0, 863.0, 511.0, 281.0, 191.0, 110.0, 87.0, 51.0, 35.0, 22.0, 17.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.62646484375, -0.609771728515625, -0.59307861328125, -0.576385498046875, -0.5596923828125, -0.542999267578125, -0.52630615234375, -0.509613037109375, -0.492919921875, -0.476226806640625, -0.45953369140625, -0.442840576171875, -0.4261474609375, -0.409454345703125, -0.39276123046875, -0.376068115234375, -0.359375, -0.342681884765625, -0.32598876953125, -0.309295654296875, -0.2926025390625, -0.275909423828125, -0.25921630859375, -0.242523193359375, -0.225830078125, -0.209136962890625, -0.19244384765625, -0.175750732421875, -0.1590576171875, -0.142364501953125, -0.12567138671875, -0.108978271484375, -0.09228515625, -0.075592041015625, -0.05889892578125, -0.042205810546875, -0.0255126953125, -0.008819580078125, 0.00787353515625, 0.024566650390625, 0.041259765625, 0.057952880859375, 0.07464599609375, 0.091339111328125, 0.1080322265625, 0.124725341796875, 0.14141845703125, 0.158111572265625, 0.1748046875, 0.191497802734375, 0.20819091796875, 0.224884033203125, 0.2415771484375, 0.258270263671875, 0.27496337890625, 0.291656494140625, 0.308349609375, 0.325042724609375, 0.34173583984375, 0.358428955078125, 0.3751220703125, 0.391815185546875, 0.40850830078125, 0.425201416015625, 0.44189453125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 10.0, 7.0, 5.0, 12.0, 14.0, 19.0, 11.0, 27.0, 23.0, 20.0, 31.0, 27.0, 30.0, 40.0, 42.0, 47.0, 51.0, 54.0, 107.0, 852.0, 218.0, 59.0, 31.0, 25.0, 38.0, 30.0, 32.0, 36.0, 14.0, 20.0, 22.0, 11.0, 8.0, 12.0, 9.0, 4.0, 4.0, 8.0, 4.0, 2.0, 6.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0], "bins": [-5.7578125, -5.60089111328125, -5.4439697265625, -5.28704833984375, -5.130126953125, -4.97320556640625, -4.8162841796875, -4.65936279296875, -4.50244140625, -4.34552001953125, -4.1885986328125, -4.03167724609375, -3.874755859375, -3.71783447265625, -3.5609130859375, -3.40399169921875, -3.2470703125, -3.09014892578125, -2.9332275390625, -2.77630615234375, -2.619384765625, -2.46246337890625, -2.3055419921875, -2.14862060546875, -1.99169921875, -1.83477783203125, -1.6778564453125, -1.52093505859375, -1.364013671875, -1.20709228515625, -1.0501708984375, -0.89324951171875, -0.736328125, -0.57940673828125, -0.4224853515625, -0.26556396484375, -0.108642578125, 0.04827880859375, 0.2052001953125, 0.36212158203125, 0.51904296875, 0.67596435546875, 0.8328857421875, 0.98980712890625, 1.146728515625, 1.30364990234375, 1.4605712890625, 1.61749267578125, 1.7744140625, 1.93133544921875, 2.0882568359375, 2.24517822265625, 2.402099609375, 2.55902099609375, 2.7159423828125, 2.87286376953125, 3.02978515625, 3.18670654296875, 3.3436279296875, 3.50054931640625, 3.657470703125, 3.81439208984375, 3.9713134765625, 4.12823486328125, 4.28515625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 9.0, 9.0, 17.0, 9.0, 38.0, 47.0, 84.0, 165.0, 270.0, 508.0, 994.0, 2012.0, 4163.0, 9339.0, 20727.0, 47141.0, 106174.0, 221777.0, 401480.0, 859006.0, 3486288.0, 521064.0, 313499.0, 162427.0, 74419.0, 32842.0, 14346.0, 6408.0, 3147.0, 1457.0, 734.0, 362.0, 203.0, 124.0, 70.0, 29.0, 23.0, 12.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3046875, -0.29351806640625, -0.2823486328125, -0.27117919921875, -0.260009765625, -0.24884033203125, -0.2376708984375, -0.22650146484375, -0.21533203125, -0.20416259765625, -0.1929931640625, -0.18182373046875, -0.170654296875, -0.15948486328125, -0.1483154296875, -0.13714599609375, -0.1259765625, -0.11480712890625, -0.1036376953125, -0.09246826171875, -0.081298828125, -0.07012939453125, -0.0589599609375, -0.04779052734375, -0.03662109375, -0.02545166015625, -0.0142822265625, -0.00311279296875, 0.008056640625, 0.01922607421875, 0.0303955078125, 0.04156494140625, 0.052734375, 0.06390380859375, 0.0750732421875, 0.08624267578125, 0.097412109375, 0.10858154296875, 0.1197509765625, 0.13092041015625, 0.14208984375, 0.15325927734375, 0.1644287109375, 0.17559814453125, 0.186767578125, 0.19793701171875, 0.2091064453125, 0.22027587890625, 0.2314453125, 0.24261474609375, 0.2537841796875, 0.26495361328125, 0.276123046875, 0.28729248046875, 0.2984619140625, 0.30963134765625, 0.32080078125, 0.33197021484375, 0.3431396484375, 0.35430908203125, 0.365478515625, 0.37664794921875, 0.3878173828125, 0.39898681640625, 0.41015625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 9.0, 5.0, 11.0, 13.0, 14.0, 20.0, 16.0, 26.0, 45.0, 34.0, 30.0, 48.0, 50.0, 48.0, 50.0, 181.0, 956.0, 59.0, 49.0, 69.0, 38.0, 34.0, 48.0, 38.0, 26.0, 24.0, 25.0, 13.0, 14.0, 12.0, 5.0, 4.0, 5.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.16741943359375, -4.0028076171875, -3.83819580078125, -3.673583984375, -3.50897216796875, -3.3443603515625, -3.17974853515625, -3.01513671875, -2.85052490234375, -2.6859130859375, -2.52130126953125, -2.356689453125, -2.19207763671875, -2.0274658203125, -1.86285400390625, -1.6982421875, -1.53363037109375, -1.3690185546875, -1.20440673828125, -1.039794921875, -0.87518310546875, -0.7105712890625, -0.54595947265625, -0.38134765625, -0.21673583984375, -0.0521240234375, 0.11248779296875, 0.277099609375, 0.44171142578125, 0.6063232421875, 0.77093505859375, 0.935546875, 1.10015869140625, 1.2647705078125, 1.42938232421875, 1.593994140625, 1.75860595703125, 1.9232177734375, 2.08782958984375, 2.25244140625, 2.41705322265625, 2.5816650390625, 2.74627685546875, 2.910888671875, 3.07550048828125, 3.2401123046875, 3.40472412109375, 3.5693359375, 3.73394775390625, 3.8985595703125, 4.06317138671875, 4.227783203125, 4.39239501953125, 4.5570068359375, 4.72161865234375, 4.88623046875, 5.05084228515625, 5.2154541015625, 5.38006591796875, 5.544677734375, 5.70928955078125, 5.8739013671875, 6.03851318359375, 6.203125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 8.0, 3.0, 7.0, 12.0, 16.0, 35.0, 24.0, 22.0, 47.0, 48.0, 74.0, 96.0, 125.0, 222.0, 293.0, 450.0, 596.0, 899.0, 1343.0, 2065.0, 3662.0, 7548.0, 17473.0, 48489.0, 145048.0, 418803.0, 1885747.0, 3049575.0, 456438.0, 159781.0, 53776.0, 19576.0, 8243.0, 4106.0, 2305.0, 1332.0, 965.0, 663.0, 415.0, 272.0, 213.0, 159.0, 119.0, 89.0, 68.0, 50.0, 35.0, 35.0, 25.0, 12.0, 7.0, 6.0, 7.0, 4.0, 4.0, 3.0], "bins": [-0.57177734375, -0.5554618835449219, -0.5391464233398438, -0.5228309631347656, -0.5065155029296875, -0.4902000427246094, -0.47388458251953125, -0.4575691223144531, -0.441253662109375, -0.4249382019042969, -0.40862274169921875, -0.3923072814941406, -0.3759918212890625, -0.3596763610839844, -0.34336090087890625, -0.3270454406738281, -0.31072998046875, -0.2944145202636719, -0.27809906005859375, -0.2617835998535156, -0.2454681396484375, -0.22915267944335938, -0.21283721923828125, -0.19652175903320312, -0.180206298828125, -0.16389083862304688, -0.14757537841796875, -0.13125991821289062, -0.1149444580078125, -0.09862899780273438, -0.08231353759765625, -0.06599807739257812, -0.0496826171875, -0.033367156982421875, -0.01705169677734375, -0.000736236572265625, 0.0155792236328125, 0.031894683837890625, 0.04821014404296875, 0.06452560424804688, 0.080841064453125, 0.09715652465820312, 0.11347198486328125, 0.12978744506835938, 0.1461029052734375, 0.16241836547851562, 0.17873382568359375, 0.19504928588867188, 0.21136474609375, 0.22768020629882812, 0.24399566650390625, 0.2603111267089844, 0.2766265869140625, 0.2929420471191406, 0.30925750732421875, 0.3255729675292969, 0.341888427734375, 0.3582038879394531, 0.37451934814453125, 0.3908348083496094, 0.4071502685546875, 0.4234657287597656, 0.43978118896484375, 0.4560966491699219, 0.472412109375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 5.0, 11.0, 4.0, 18.0, 10.0, 16.0, 24.0, 26.0, 37.0, 36.0, 37.0, 35.0, 35.0, 43.0, 41.0, 36.0, 378.0, 739.0, 51.0, 32.0, 46.0, 50.0, 31.0, 37.0, 30.0, 29.0, 25.0, 30.0, 21.0, 16.0, 13.0, 8.0, 12.0, 5.0, 15.0, 4.0, 9.0, 3.0, 4.0, 6.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.71484375, -4.5634765625, -4.412109375, -4.2607421875, -4.109375, -3.9580078125, -3.806640625, -3.6552734375, -3.50390625, -3.3525390625, -3.201171875, -3.0498046875, -2.8984375, -2.7470703125, -2.595703125, -2.4443359375, -2.29296875, -2.1416015625, -1.990234375, -1.8388671875, -1.6875, -1.5361328125, -1.384765625, -1.2333984375, -1.08203125, -0.9306640625, -0.779296875, -0.6279296875, -0.4765625, -0.3251953125, -0.173828125, -0.0224609375, 0.12890625, 0.2802734375, 0.431640625, 0.5830078125, 0.734375, 0.8857421875, 1.037109375, 1.1884765625, 1.33984375, 1.4912109375, 1.642578125, 1.7939453125, 1.9453125, 2.0966796875, 2.248046875, 2.3994140625, 2.55078125, 2.7021484375, 2.853515625, 3.0048828125, 3.15625, 3.3076171875, 3.458984375, 3.6103515625, 3.76171875, 3.9130859375, 4.064453125, 4.2158203125, 4.3671875, 4.5185546875, 4.669921875, 4.8212890625, 4.97265625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 10.0, 27.0, 106.0, 455.0, 317.0, 61.0, 18.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.797701835632324, -11.989340782165527, -11.180978775024414, -10.372617721557617, -9.56425666809082, -8.755895614624023, -7.94753360748291, -7.139172554016113, -6.330811023712158, -5.522449493408203, -4.714088439941406, -3.905726909637451, -3.097365617752075, -2.289004325866699, -1.4806427955627441, -0.6722817420959473, 0.1360797882080078, 0.9444411396980286, 1.7528024911880493, 2.561163902282715, 3.369525194168091, 4.177886486053467, 4.986248016357422, 5.794609069824219, 6.602970600128174, 7.411332130432129, 8.219693183898926, 9.028055191040039, 9.836416244506836, 10.644777297973633, 11.45313835144043, 12.261499404907227, 13.069860458374023, 13.87822151184082, 14.686583518981934, 15.49494457244873, 16.303306579589844, 17.11166763305664, 17.920028686523438, 18.728389739990234, 19.53675079345703, 20.345111846923828, 21.153472900390625, 21.961833953857422, 22.77019691467285, 23.57855796813965, 24.386919021606445, 25.195280075073242, 26.003643035888672, 26.81200408935547, 27.620365142822266, 28.428726196289062, 29.237089157104492, 30.04545021057129, 30.853811264038086, 31.662172317504883, 32.47053146362305, 33.278892517089844, 34.08725357055664, 34.89561462402344, 35.703975677490234, 36.51233673095703, 37.320701599121094, 38.129058837890625, 38.93742370605469]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 7.0, 4.0, 7.0, 18.0, 15.0, 23.0, 39.0, 34.0, 42.0, 48.0, 69.0, 64.0, 74.0, 72.0, 71.0, 62.0, 71.0, 57.0, 44.0, 41.0, 34.0, 23.0, 23.0, 13.0, 13.0, 6.0, 9.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.216602325439453, -20.588478088378906, -19.96035385131836, -19.33222770690918, -18.704103469848633, -18.075979232788086, -17.447853088378906, -16.81972885131836, -16.191604614257812, -15.563480377197266, -14.935355186462402, -14.307229995727539, -13.679105758666992, -13.050981521606445, -12.422856330871582, -11.794731140136719, -11.166606903076172, -10.538482666015625, -9.910357475280762, -9.282232284545898, -8.654108047485352, -8.025983810424805, -7.397858619689941, -6.769733905792236, -6.141609191894531, -5.513484477996826, -4.885359764099121, -4.257235050201416, -3.629110336303711, -3.000985622406006, -2.372860908508301, -1.7447361946105957, -1.1166114807128906, -0.48848676681518555, 0.13963794708251953, 0.7677626609802246, 1.3958873748779297, 2.0240120887756348, 2.65213680267334, 3.280261516571045, 3.90838623046875, 4.536510944366455, 5.16463565826416, 5.792760372161865, 6.42088508605957, 7.049009799957275, 7.6771345138549805, 8.305259704589844, 8.93338394165039, 9.561508178710938, 10.1896333694458, 10.817758560180664, 11.445882797241211, 12.074007034301758, 12.702132225036621, 13.330257415771484, 13.958381652832031, 14.586505889892578, 15.214631080627441, 15.842756271362305, 16.47088050842285, 17.0990047454834, 17.727130889892578, 18.355255126953125, 18.983379364013672]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 7.0, 21.0, 35.0, 49.0, 58.0, 107.0, 201.0, 366.0, 802.0, 2352.0, 11965.0, 213660.0, 3923127.0, 34155.0, 4959.0, 1252.0, 534.0, 269.0, 138.0, 74.0, 60.0, 26.0, 20.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.44091796875, -0.42874908447265625, -0.4165802001953125, -0.40441131591796875, -0.392242431640625, -0.38007354736328125, -0.3679046630859375, -0.35573577880859375, -0.34356689453125, -0.33139801025390625, -0.3192291259765625, -0.30706024169921875, -0.294891357421875, -0.28272247314453125, -0.2705535888671875, -0.25838470458984375, -0.2462158203125, -0.23404693603515625, -0.2218780517578125, -0.20970916748046875, -0.197540283203125, -0.18537139892578125, -0.1732025146484375, -0.16103363037109375, -0.14886474609375, -0.13669586181640625, -0.1245269775390625, -0.11235809326171875, -0.100189208984375, -0.08802032470703125, -0.0758514404296875, -0.06368255615234375, -0.051513671875, -0.03934478759765625, -0.0271759033203125, -0.01500701904296875, -0.002838134765625, 0.00933074951171875, 0.0214996337890625, 0.03366851806640625, 0.04583740234375, 0.05800628662109375, 0.0701751708984375, 0.08234405517578125, 0.094512939453125, 0.10668182373046875, 0.1188507080078125, 0.13101959228515625, 0.1431884765625, 0.15535736083984375, 0.1675262451171875, 0.17969512939453125, 0.191864013671875, 0.20403289794921875, 0.2162017822265625, 0.22837066650390625, 0.24053955078125, 0.25270843505859375, 0.2648773193359375, 0.27704620361328125, 0.289215087890625, 0.30138397216796875, 0.3135528564453125, 0.32572174072265625, 0.337890625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 10.0, 11.0, 10.0, 23.0, 39.0, 44.0, 57.0, 79.0, 68.0, 63.0, 101.0, 99.0, 76.0, 74.0, 60.0, 49.0, 32.0, 28.0, 18.0, 20.0, 12.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.07818603515625, -0.07593345642089844, -0.07368087768554688, -0.07142829895019531, -0.06917572021484375, -0.06692314147949219, -0.06467056274414062, -0.06241798400878906, -0.0601654052734375, -0.05791282653808594, -0.055660247802734375, -0.05340766906738281, -0.05115509033203125, -0.04890251159667969, -0.046649932861328125, -0.04439735412597656, -0.042144775390625, -0.03989219665527344, -0.037639617919921875, -0.03538703918457031, -0.03313446044921875, -0.030881881713867188, -0.028629302978515625, -0.026376724243164062, -0.0241241455078125, -0.021871566772460938, -0.019618988037109375, -0.017366409301757812, -0.01511383056640625, -0.012861251831054688, -0.010608673095703125, -0.008356094360351562, -0.006103515625, -0.0038509368896484375, -0.001598358154296875, 0.0006542205810546875, 0.00290679931640625, 0.0051593780517578125, 0.007411956787109375, 0.009664535522460938, 0.0119171142578125, 0.014169692993164062, 0.016422271728515625, 0.018674850463867188, 0.02092742919921875, 0.023180007934570312, 0.025432586669921875, 0.027685165405273438, 0.029937744140625, 0.03219032287597656, 0.034442901611328125, 0.03669548034667969, 0.03894805908203125, 0.04120063781738281, 0.043453216552734375, 0.04570579528808594, 0.0479583740234375, 0.05021095275878906, 0.052463531494140625, 0.05471611022949219, 0.05696868896484375, 0.05922126770019531, 0.061473846435546875, 0.06372642517089844, 0.06597900390625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 17.0, 7.0, 10.0, 16.0, 12.0, 14.0, 29.0, 31.0, 26.0, 58.0, 86.0, 248.0, 1891.0, 514699.0, 3673858.0, 2735.0, 273.0, 95.0, 48.0, 29.0, 16.0, 19.0, 13.0, 7.0, 5.0, 3.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33984375, -0.32924652099609375, -0.3186492919921875, -0.30805206298828125, -0.297454833984375, -0.28685760498046875, -0.2762603759765625, -0.26566314697265625, -0.25506591796875, -0.24446868896484375, -0.2338714599609375, -0.22327423095703125, -0.212677001953125, -0.20207977294921875, -0.1914825439453125, -0.18088531494140625, -0.1702880859375, -0.15969085693359375, -0.1490936279296875, -0.13849639892578125, -0.127899169921875, -0.11730194091796875, -0.1067047119140625, -0.09610748291015625, -0.08551025390625, -0.07491302490234375, -0.0643157958984375, -0.05371856689453125, -0.043121337890625, -0.03252410888671875, -0.0219268798828125, -0.01132965087890625, -0.000732421875, 0.00986480712890625, 0.0204620361328125, 0.03105926513671875, 0.041656494140625, 0.05225372314453125, 0.0628509521484375, 0.07344818115234375, 0.08404541015625, 0.09464263916015625, 0.1052398681640625, 0.11583709716796875, 0.126434326171875, 0.13703155517578125, 0.1476287841796875, 0.15822601318359375, 0.1688232421875, 0.17942047119140625, 0.1900177001953125, 0.20061492919921875, 0.211212158203125, 0.22180938720703125, 0.2324066162109375, 0.24300384521484375, 0.25360107421875, 0.26419830322265625, 0.2747955322265625, 0.28539276123046875, 0.295989990234375, 0.30658721923828125, 0.3171844482421875, 0.32778167724609375, 0.33837890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 8.0, 4.0, 5.0, 9.0, 18.0, 35.0, 38.0, 80.0, 162.0, 323.0, 806.0, 1227.0, 679.0, 251.0, 130.0, 72.0, 45.0, 30.0, 26.0, 22.0, 12.0, 6.0, 19.0, 8.0, 14.0, 5.0, 3.0, 8.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.07855224609375, -0.07578372955322266, -0.07301521301269531, -0.07024669647216797, -0.06747817993164062, -0.06470966339111328, -0.06194114685058594, -0.059172630310058594, -0.05640411376953125, -0.053635597229003906, -0.05086708068847656, -0.04809856414794922, -0.045330047607421875, -0.04256153106689453, -0.03979301452636719, -0.037024497985839844, -0.0342559814453125, -0.031487464904785156, -0.028718948364257812, -0.02595043182373047, -0.023181915283203125, -0.02041339874267578, -0.017644882202148438, -0.014876365661621094, -0.01210784912109375, -0.009339332580566406, -0.0065708160400390625, -0.0038022994995117188, -0.001033782958984375, 0.0017347335815429688, 0.0045032501220703125, 0.007271766662597656, 0.010040283203125, 0.012808799743652344, 0.015577316284179688, 0.01834583282470703, 0.021114349365234375, 0.02388286590576172, 0.026651382446289062, 0.029419898986816406, 0.03218841552734375, 0.034956932067871094, 0.03772544860839844, 0.04049396514892578, 0.043262481689453125, 0.04603099822998047, 0.04879951477050781, 0.051568031311035156, 0.0543365478515625, 0.057105064392089844, 0.05987358093261719, 0.06264209747314453, 0.06541061401367188, 0.06817913055419922, 0.07094764709472656, 0.0737161636352539, 0.07648468017578125, 0.0792531967163086, 0.08202171325683594, 0.08479022979736328, 0.08755874633789062, 0.09032726287841797, 0.09309577941894531, 0.09586429595947266, 0.0986328125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 489.0, 524.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8784648776054382, -0.7690642476081848, -0.6596636772155762, -0.5502630472183228, -0.44086241722106934, -0.3314617872238159, -0.22206121683120728, -0.11266058683395386, -0.0032599568367004395, 0.10614065825939178, 0.215541273355484, 0.32494187355041504, 0.43434250354766846, 0.5437431335449219, 0.6531437039375305, 0.7625443339347839, 0.8719449639320374, 0.9813455939292908, 1.0907461643218994, 1.2001467943191528, 1.3095474243164062, 1.4189480543136597, 1.528348684310913, 1.637749195098877, 1.74714994430542, 1.8565505743026733, 1.9659512042999268, 2.0753517150878906, 2.1847524642944336, 2.2941529750823975, 2.4035534858703613, 2.5129542350769043, 2.6223549842834473, 2.731755495071411, 2.841156244277954, 2.950556755065918, 3.059957504272461, 3.169358015060425, 3.2787585258483887, 3.3881592750549316, 3.4975600242614746, 3.6069605350494385, 3.7163612842559814, 3.8257617950439453, 3.9351625442504883, 4.044563293457031, 4.153963565826416, 4.263364315032959, 4.372764587402344, 4.482165336608887, 4.5915656089782715, 4.7009663581848145, 4.810367107391357, 4.9197678565979, 5.029168128967285, 5.138568878173828, 5.247969627380371, 5.357370376586914, 5.466770648956299, 5.576171398162842, 5.685572147369385, 5.794972896575928, 5.9043731689453125, 6.0137739181518555, 6.123174667358398]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 8.0, 4.0, 17.0, 5.0, 10.0, 14.0, 16.0, 24.0, 20.0, 25.0, 35.0, 37.0, 42.0, 46.0, 54.0, 55.0, 61.0, 51.0, 59.0, 64.0, 44.0, 42.0, 49.0, 52.0, 32.0, 25.0, 31.0, 23.0, 16.0, 13.0, 9.0, 4.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3013148903846741, -0.2894304096698761, -0.2775459587574005, -0.26566147804260254, -0.25377699732780457, -0.24189253151416779, -0.230008065700531, -0.21812358498573303, -0.20623910427093506, -0.19435463845729828, -0.1824701577425003, -0.17058569192886353, -0.15870121121406555, -0.14681674540042877, -0.134932279586792, -0.12304779887199402, -0.11116333305835724, -0.09927885979413986, -0.08739438652992249, -0.0755099207162857, -0.06362544000148773, -0.051740970462560654, -0.039856500923633575, -0.0279720276594162, -0.016087554395198822, -0.00420308206230402, 0.007681390270590782, 0.01956586167216301, 0.031450334936380386, 0.04333480820059776, 0.05521927773952484, 0.06710375100374222, 0.0789882242679596, 0.09087269753217697, 0.10275717079639435, 0.11464163661003113, 0.1265261173248291, 0.13841058313846588, 0.15029504895210266, 0.16217952966690063, 0.1740640103816986, 0.1859484761953354, 0.19783295691013336, 0.20971742272377014, 0.22160190343856812, 0.2334863692522049, 0.24537083506584167, 0.25725531578063965, 0.26913976669311523, 0.2810242474079132, 0.2929086983203888, 0.30479317903518677, 0.31667765974998474, 0.3285621404647827, 0.3404465913772583, 0.3523310720920563, 0.36421555280685425, 0.3761000335216522, 0.3879844844341278, 0.3998689651489258, 0.41175344586372375, 0.42363792657852173, 0.4355223774909973, 0.4474068582057953, 0.45929133892059326]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 10.0, 10.0, 9.0, 24.0, 17.0, 34.0, 52.0, 68.0, 111.0, 189.0, 360.0, 762.0, 1465.0, 3828.0, 14165.0, 580735.0, 426698.0, 13242.0, 3802.0, 1456.0, 635.0, 364.0, 196.0, 99.0, 66.0, 48.0, 26.0, 21.0, 17.0, 17.0, 1.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.44287109375, -0.42758941650390625, -0.4123077392578125, -0.39702606201171875, -0.381744384765625, -0.36646270751953125, -0.3511810302734375, -0.33589935302734375, -0.32061767578125, -0.30533599853515625, -0.2900543212890625, -0.27477264404296875, -0.259490966796875, -0.24420928955078125, -0.2289276123046875, -0.21364593505859375, -0.1983642578125, -0.18308258056640625, -0.1678009033203125, -0.15251922607421875, -0.137237548828125, -0.12195587158203125, -0.1066741943359375, -0.09139251708984375, -0.07611083984375, -0.06082916259765625, -0.0455474853515625, -0.03026580810546875, -0.014984130859375, 0.00029754638671875, 0.0155792236328125, 0.03086090087890625, 0.046142578125, 0.06142425537109375, 0.0767059326171875, 0.09198760986328125, 0.107269287109375, 0.12255096435546875, 0.1378326416015625, 0.15311431884765625, 0.16839599609375, 0.18367767333984375, 0.1989593505859375, 0.21424102783203125, 0.229522705078125, 0.24480438232421875, 0.2600860595703125, 0.27536773681640625, 0.2906494140625, 0.30593109130859375, 0.3212127685546875, 0.33649444580078125, 0.351776123046875, 0.36705780029296875, 0.3823394775390625, 0.39762115478515625, 0.41290283203125, 0.42818450927734375, 0.4434661865234375, 0.45874786376953125, 0.474029541015625, 0.48931121826171875, 0.5045928955078125, 0.5198745727539062, 0.53515625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 13.0, 13.0, 19.0, 26.0, 48.0, 61.0, 59.0, 75.0, 86.0, 94.0, 77.0, 85.0, 79.0, 64.0, 49.0, 40.0, 28.0, 24.0, 15.0, 12.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0791015625, -0.07683181762695312, -0.07456207275390625, -0.07229232788085938, -0.0700225830078125, -0.06775283813476562, -0.06548309326171875, -0.06321334838867188, -0.060943603515625, -0.058673858642578125, -0.05640411376953125, -0.054134368896484375, -0.0518646240234375, -0.049594879150390625, -0.04732513427734375, -0.045055389404296875, -0.04278564453125, -0.040515899658203125, -0.03824615478515625, -0.035976409912109375, -0.0337066650390625, -0.031436920166015625, -0.02916717529296875, -0.026897430419921875, -0.024627685546875, -0.022357940673828125, -0.02008819580078125, -0.017818450927734375, -0.0155487060546875, -0.013278961181640625, -0.01100921630859375, -0.008739471435546875, -0.0064697265625, -0.004199981689453125, -0.00193023681640625, 0.000339508056640625, 0.0026092529296875, 0.004878997802734375, 0.00714874267578125, 0.009418487548828125, 0.011688232421875, 0.013957977294921875, 0.01622772216796875, 0.018497467041015625, 0.0207672119140625, 0.023036956787109375, 0.02530670166015625, 0.027576446533203125, 0.02984619140625, 0.032115936279296875, 0.03438568115234375, 0.036655426025390625, 0.0389251708984375, 0.041194915771484375, 0.04346466064453125, 0.045734405517578125, 0.048004150390625, 0.050273895263671875, 0.05254364013671875, 0.054813385009765625, 0.0570831298828125, 0.059352874755859375, 0.06162261962890625, 0.06389236450195312, 0.066162109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 3.0, 4.0, 5.0, 5.0, 12.0, 10.0, 13.0, 22.0, 22.0, 32.0, 41.0, 70.0, 91.0, 108.0, 239.0, 451.0, 1476.0, 9939.0, 154845.0, 810867.0, 62844.0, 5412.0, 1041.0, 345.0, 155.0, 101.0, 78.0, 71.0, 50.0, 42.0, 36.0, 30.0, 15.0, 13.0, 16.0, 10.0, 10.0, 10.0, 7.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10418701171875, -0.10037899017333984, -0.09657096862792969, -0.09276294708251953, -0.08895492553710938, -0.08514690399169922, -0.08133888244628906, -0.0775308609008789, -0.07372283935546875, -0.0699148178100586, -0.06610679626464844, -0.06229877471923828, -0.058490753173828125, -0.05468273162841797, -0.05087471008300781, -0.047066688537597656, -0.0432586669921875, -0.039450645446777344, -0.03564262390136719, -0.03183460235595703, -0.028026580810546875, -0.02421855926513672, -0.020410537719726562, -0.016602516174316406, -0.01279449462890625, -0.008986473083496094, -0.0051784515380859375, -0.0013704299926757812, 0.002437591552734375, 0.006245613098144531, 0.010053634643554688, 0.013861656188964844, 0.017669677734375, 0.021477699279785156, 0.025285720825195312, 0.02909374237060547, 0.032901763916015625, 0.03670978546142578, 0.04051780700683594, 0.044325828552246094, 0.04813385009765625, 0.051941871643066406, 0.05574989318847656, 0.05955791473388672, 0.06336593627929688, 0.06717395782470703, 0.07098197937011719, 0.07479000091552734, 0.0785980224609375, 0.08240604400634766, 0.08621406555175781, 0.09002208709716797, 0.09383010864257812, 0.09763813018798828, 0.10144615173339844, 0.1052541732788086, 0.10906219482421875, 0.1128702163696289, 0.11667823791503906, 0.12048625946044922, 0.12429428100585938, 0.12810230255126953, 0.1319103240966797, 0.13571834564208984, 0.1395263671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 5.0, 3.0, 5.0, 8.0, 9.0, 14.0, 12.0, 11.0, 14.0, 12.0, 14.0, 25.0, 26.0, 21.0, 32.0, 24.0, 21.0, 18.0, 25.0, 36.0, 38.0, 42.0, 39.0, 28.0, 30.0, 39.0, 33.0, 49.0, 45.0, 31.0, 34.0, 34.0, 30.0, 32.0, 25.0, 21.0, 13.0, 13.0, 10.0, 19.0, 9.0, 14.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.08453369140625, -0.081939697265625, -0.079345703125, -0.076751708984375, -0.07415771484375, -0.071563720703125, -0.0689697265625, -0.066375732421875, -0.06378173828125, -0.061187744140625, -0.05859375, -0.055999755859375, -0.05340576171875, -0.050811767578125, -0.0482177734375, -0.045623779296875, -0.04302978515625, -0.040435791015625, -0.037841796875, -0.035247802734375, -0.03265380859375, -0.030059814453125, -0.0274658203125, -0.024871826171875, -0.02227783203125, -0.019683837890625, -0.01708984375, -0.014495849609375, -0.01190185546875, -0.009307861328125, -0.0067138671875, -0.004119873046875, -0.00152587890625, 0.001068115234375, 0.003662109375, 0.006256103515625, 0.00885009765625, 0.011444091796875, 0.0140380859375, 0.016632080078125, 0.01922607421875, 0.021820068359375, 0.0244140625, 0.027008056640625, 0.02960205078125, 0.032196044921875, 0.0347900390625, 0.037384033203125, 0.03997802734375, 0.042572021484375, 0.045166015625, 0.047760009765625, 0.05035400390625, 0.052947998046875, 0.0555419921875, 0.058135986328125, 0.06072998046875, 0.063323974609375, 0.06591796875, 0.068511962890625, 0.07110595703125, 0.073699951171875, 0.0762939453125, 0.078887939453125, 0.08148193359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 11.0, 18.0, 28.0, 30.0, 36.0, 47.0, 75.0, 107.0, 140.0, 202.0, 250.0, 499.0, 802.0, 1467.0, 2954.0, 6829.0, 23453.0, 225150.0, 696561.0, 67993.0, 12479.0, 4531.0, 2106.0, 1070.0, 584.0, 361.0, 238.0, 154.0, 96.0, 64.0, 56.0, 40.0, 26.0, 21.0, 19.0, 11.0, 9.0, 9.0, 4.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02032470703125, -0.0196533203125, -0.01898193359375, -0.018310546875, -0.01763916015625, -0.0169677734375, -0.01629638671875, -0.015625, -0.01495361328125, -0.0142822265625, -0.01361083984375, -0.012939453125, -0.01226806640625, -0.0115966796875, -0.01092529296875, -0.01025390625, -0.00958251953125, -0.0089111328125, -0.00823974609375, -0.007568359375, -0.00689697265625, -0.0062255859375, -0.00555419921875, -0.0048828125, -0.00421142578125, -0.0035400390625, -0.00286865234375, -0.002197265625, -0.00152587890625, -0.0008544921875, -0.00018310546875, 0.00048828125, 0.00115966796875, 0.0018310546875, 0.00250244140625, 0.003173828125, 0.00384521484375, 0.0045166015625, 0.00518798828125, 0.005859375, 0.00653076171875, 0.0072021484375, 0.00787353515625, 0.008544921875, 0.00921630859375, 0.0098876953125, 0.01055908203125, 0.01123046875, 0.01190185546875, 0.0125732421875, 0.01324462890625, 0.013916015625, 0.01458740234375, 0.0152587890625, 0.01593017578125, 0.0166015625, 0.01727294921875, 0.0179443359375, 0.01861572265625, 0.019287109375, 0.01995849609375, 0.0206298828125, 0.02130126953125, 0.02197265625, 0.02264404296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 8.0, 11.0, 13.0, 6.0, 25.0, 30.0, 53.0, 37.0, 57.0, 68.0, 66.0, 74.0, 76.0, 70.0, 74.0, 60.0, 51.0, 47.0, 50.0, 29.0, 28.0, 18.0, 9.0, 10.0, 6.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.364418029785156e-06, -5.188398063182831e-06, -5.012378096580505e-06, -4.83635812997818e-06, -4.6603381633758545e-06, -4.484318196773529e-06, -4.308298230171204e-06, -4.132278263568878e-06, -3.956258296966553e-06, -3.7802383303642273e-06, -3.604218363761902e-06, -3.4281983971595764e-06, -3.252178430557251e-06, -3.0761584639549255e-06, -2.9001384973526e-06, -2.7241185307502747e-06, -2.5480985641479492e-06, -2.3720785975456238e-06, -2.1960586309432983e-06, -2.020038664340973e-06, -1.8440186977386475e-06, -1.667998731136322e-06, -1.4919787645339966e-06, -1.3159587979316711e-06, -1.1399388313293457e-06, -9.639188647270203e-07, -7.878988981246948e-07, -6.118789315223694e-07, -4.3585896492004395e-07, -2.598389983177185e-07, -8.381903171539307e-08, 9.220093488693237e-08, 2.682209014892578e-07, 4.4424086809158325e-07, 6.202608346939087e-07, 7.962808012962341e-07, 9.723007678985596e-07, 1.148320734500885e-06, 1.3243407011032104e-06, 1.5003606677055359e-06, 1.6763806343078613e-06, 1.8524006009101868e-06, 2.028420567512512e-06, 2.2044405341148376e-06, 2.380460500717163e-06, 2.5564804673194885e-06, 2.732500433921814e-06, 2.9085204005241394e-06, 3.084540367126465e-06, 3.2605603337287903e-06, 3.4365803003311157e-06, 3.612600266933441e-06, 3.7886202335357666e-06, 3.964640200138092e-06, 4.1406601667404175e-06, 4.316680133342743e-06, 4.492700099945068e-06, 4.668720066547394e-06, 4.844740033149719e-06, 5.020759999752045e-06, 5.19677996635437e-06, 5.3727999329566956e-06, 5.548819899559021e-06, 5.7248398661613464e-06, 5.900859832763672e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 6.0, 0.0, 2.0, 2.0, 6.0, 7.0, 8.0, 13.0, 17.0, 18.0, 37.0, 57.0, 130.0, 226.0, 627.0, 1509.0, 3609.0, 12377.0, 834510.0, 182668.0, 7831.0, 2779.0, 1196.0, 464.0, 196.0, 93.0, 48.0, 32.0, 16.0, 13.0, 12.0, 5.0, 9.0, 3.0, 6.0, 4.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.06866455078125, -0.06674957275390625, -0.0648345947265625, -0.06291961669921875, -0.061004638671875, -0.05908966064453125, -0.0571746826171875, -0.05525970458984375, -0.0533447265625, -0.05142974853515625, -0.0495147705078125, -0.04759979248046875, -0.045684814453125, -0.04376983642578125, -0.0418548583984375, -0.03993988037109375, -0.03802490234375, -0.03610992431640625, -0.0341949462890625, -0.03227996826171875, -0.030364990234375, -0.02845001220703125, -0.0265350341796875, -0.02462005615234375, -0.022705078125, -0.02079010009765625, -0.0188751220703125, -0.01696014404296875, -0.015045166015625, -0.01313018798828125, -0.0112152099609375, -0.00930023193359375, -0.00738525390625, -0.00547027587890625, -0.0035552978515625, -0.00164031982421875, 0.000274658203125, 0.00218963623046875, 0.0041046142578125, 0.00601959228515625, 0.0079345703125, 0.00984954833984375, 0.0117645263671875, 0.01367950439453125, 0.015594482421875, 0.01750946044921875, 0.0194244384765625, 0.02133941650390625, 0.02325439453125, 0.02516937255859375, 0.0270843505859375, 0.02899932861328125, 0.030914306640625, 0.03282928466796875, 0.0347442626953125, 0.03665924072265625, 0.03857421875, 0.04048919677734375, 0.0424041748046875, 0.04431915283203125, 0.046234130859375, 0.04814910888671875, 0.0500640869140625, 0.05197906494140625, 0.05389404296875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 8.0, 3.0, 2.0, 7.0, 4.0, 6.0, 13.0, 15.0, 18.0, 29.0, 41.0, 58.0, 109.0, 156.0, 148.0, 126.0, 70.0, 46.0, 29.0, 22.0, 12.0, 15.0, 8.0, 9.0, 9.0, 7.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.031341552734375, -0.030189990997314453, -0.029038429260253906, -0.02788686752319336, -0.026735305786132812, -0.025583744049072266, -0.02443218231201172, -0.023280620574951172, -0.022129058837890625, -0.020977497100830078, -0.01982593536376953, -0.018674373626708984, -0.017522811889648438, -0.01637125015258789, -0.015219688415527344, -0.014068126678466797, -0.01291656494140625, -0.011765003204345703, -0.010613441467285156, -0.00946187973022461, -0.008310317993164062, -0.007158756256103516, -0.006007194519042969, -0.004855632781982422, -0.003704071044921875, -0.002552509307861328, -0.0014009475708007812, -0.0002493858337402344, 0.0009021759033203125, 0.0020537376403808594, 0.0032052993774414062, 0.004356861114501953, 0.0055084228515625, 0.006659984588623047, 0.007811546325683594, 0.00896310806274414, 0.010114669799804688, 0.011266231536865234, 0.012417793273925781, 0.013569355010986328, 0.014720916748046875, 0.015872478485107422, 0.01702404022216797, 0.018175601959228516, 0.019327163696289062, 0.02047872543334961, 0.021630287170410156, 0.022781848907470703, 0.02393341064453125, 0.025084972381591797, 0.026236534118652344, 0.02738809585571289, 0.028539657592773438, 0.029691219329833984, 0.03084278106689453, 0.03199434280395508, 0.033145904541015625, 0.03429746627807617, 0.03544902801513672, 0.036600589752197266, 0.03775215148925781, 0.03890371322631836, 0.040055274963378906, 0.04120683670043945, 0.0423583984375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 13.0, 433.0, 564.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.60697603225708, -6.486982345581055, -6.366988182067871, -6.246994495391846, -6.127000331878662, -6.007006645202637, -5.887012481689453, -5.767018795013428, -5.647024631500244, -5.527030944824219, -5.407036781311035, -5.28704309463501, -5.167048931121826, -5.047055244445801, -4.927061080932617, -4.807067394256592, -4.687073707580566, -4.567080020904541, -4.447085857391357, -4.327092170715332, -4.207098007202148, -4.087104320526123, -3.9671101570129395, -3.847116470336914, -3.7271223068237305, -3.607128381729126, -3.4871344566345215, -3.367140531539917, -3.2471466064453125, -3.127152681350708, -3.0071587562561035, -2.887165069580078, -2.7671709060668945, -2.64717698097229, -2.5271830558776855, -2.407189130783081, -2.2871952056884766, -2.167201280593872, -2.0472073554992676, -1.9272135496139526, -1.8072196245193481, -1.6872256994247437, -1.5672317743301392, -1.4472379684448242, -1.3272440433502197, -1.2072501182556152, -1.0872561931610107, -0.9672622680664062, -0.8472683429718018, -0.7272744178771973, -0.6072804927825928, -0.48728662729263306, -0.36729270219802856, -0.24729877710342407, -0.12730491161346436, -0.007310986518859863, 0.11268293857574463, 0.23267684876918793, 0.3526707589626312, 0.47266465425491333, 0.5926585793495178, 0.7126525044441223, 0.832646369934082, 0.9526402950286865, 1.072634220123291]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 5.0, 13.0, 15.0, 8.0, 11.0, 13.0, 18.0, 18.0, 35.0, 29.0, 34.0, 36.0, 42.0, 43.0, 41.0, 54.0, 43.0, 47.0, 49.0, 47.0, 59.0, 40.0, 40.0, 38.0, 34.0, 35.0, 26.0, 24.0, 27.0, 24.0, 18.0, 9.0, 11.0, 6.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.7185108065605164, -0.6992398500442505, -0.6799688339233398, -0.660697877407074, -0.6414268612861633, -0.6221559047698975, -0.6028848886489868, -0.583613932132721, -0.5643429756164551, -0.5450720191001892, -0.5258010029792786, -0.5065300464630127, -0.48725903034210205, -0.4679880738258362, -0.4487170875072479, -0.42944610118865967, -0.410175085067749, -0.39090409874916077, -0.3716331124305725, -0.35236212611198425, -0.333091139793396, -0.3138201832771301, -0.29454919695854187, -0.2752782106399536, -0.25600722432136536, -0.2367362380027771, -0.21746525168418884, -0.19819428026676178, -0.17892329394817352, -0.15965230762958527, -0.1403813362121582, -0.12111034989356995, -0.10183936357498169, -0.08256837725639343, -0.06329739838838577, -0.044026415795087814, -0.024755433201789856, -0.005484446883201599, 0.01378653198480606, 0.03305751085281372, 0.05232849717140198, 0.07159948348999023, 0.0908704623579979, 0.11014144122600555, 0.1294124275445938, 0.14868341386318207, 0.16795438528060913, 0.1872253715991974, 0.20649635791778564, 0.2257673442363739, 0.24503833055496216, 0.2643093168735504, 0.28358030319213867, 0.30285125970840454, 0.3221222460269928, 0.34139323234558105, 0.3606642186641693, 0.37993520498275757, 0.3992061913013458, 0.4184771776199341, 0.43774813413619995, 0.4570191502571106, 0.47629010677337646, 0.4955610930919647, 0.514832079410553]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 5.0, 8.0, 9.0, 20.0, 29.0, 43.0, 70.0, 89.0, 176.0, 722.0, 9915.0, 4178131.0, 4245.0, 440.0, 136.0, 66.0, 57.0, 41.0, 15.0, 24.0, 16.0, 7.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0136032104492188, -0.9822845458984375, -0.9509658813476562, -0.919647216796875, -0.8883285522460938, -0.8570098876953125, -0.8256912231445312, -0.79437255859375, -0.7630538940429688, -0.7317352294921875, -0.7004165649414062, -0.669097900390625, -0.6377792358398438, -0.6064605712890625, -0.5751419067382812, -0.5438232421875, -0.5125045776367188, -0.4811859130859375, -0.44986724853515625, -0.418548583984375, -0.38722991943359375, -0.3559112548828125, -0.32459259033203125, -0.29327392578125, -0.26195526123046875, -0.2306365966796875, -0.19931793212890625, -0.167999267578125, -0.13668060302734375, -0.1053619384765625, -0.07404327392578125, -0.042724609375, -0.01140594482421875, 0.0199127197265625, 0.05123138427734375, 0.082550048828125, 0.11386871337890625, 0.1451873779296875, 0.17650604248046875, 0.20782470703125, 0.23914337158203125, 0.2704620361328125, 0.30178070068359375, 0.333099365234375, 0.36441802978515625, 0.3957366943359375, 0.42705535888671875, 0.4583740234375, 0.48969268798828125, 0.5210113525390625, 0.5523300170898438, 0.583648681640625, 0.6149673461914062, 0.6462860107421875, 0.6776046752929688, 0.70892333984375, 0.7402420043945312, 0.7715606689453125, 0.8028793334960938, 0.834197998046875, 0.8655166625976562, 0.8968353271484375, 0.9281539916992188, 0.95947265625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 11.0, 10.0, 17.0, 37.0, 42.0, 55.0, 75.0, 72.0, 72.0, 85.0, 75.0, 100.0, 78.0, 76.0, 51.0, 34.0, 31.0, 21.0, 16.0, 12.0, 10.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07470703125, -0.07243919372558594, -0.07017135620117188, -0.06790351867675781, -0.06563568115234375, -0.06336784362792969, -0.061100006103515625, -0.05883216857910156, -0.0565643310546875, -0.05429649353027344, -0.052028656005859375, -0.04976081848144531, -0.04749298095703125, -0.04522514343261719, -0.042957305908203125, -0.04068946838378906, -0.038421630859375, -0.03615379333496094, -0.033885955810546875, -0.03161811828613281, -0.02935028076171875, -0.027082443237304688, -0.024814605712890625, -0.022546768188476562, -0.0202789306640625, -0.018011093139648438, -0.015743255615234375, -0.013475418090820312, -0.01120758056640625, -0.008939743041992188, -0.006671905517578125, -0.0044040679931640625, -0.00213623046875, 0.0001316070556640625, 0.002399444580078125, 0.0046672821044921875, 0.00693511962890625, 0.009202957153320312, 0.011470794677734375, 0.013738632202148438, 0.0160064697265625, 0.018274307250976562, 0.020542144775390625, 0.022809982299804688, 0.02507781982421875, 0.027345657348632812, 0.029613494873046875, 0.03188133239746094, 0.034149169921875, 0.03641700744628906, 0.038684844970703125, 0.04095268249511719, 0.04322052001953125, 0.04548835754394531, 0.047756195068359375, 0.05002403259277344, 0.0522918701171875, 0.05455970764160156, 0.056827545166015625, 0.05909538269042969, 0.06136322021484375, 0.06363105773925781, 0.06589889526367188, 0.06816673278808594, 0.0704345703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 10.0, 20.0, 17.0, 26.0, 36.0, 70.0, 142.0, 408.0, 1456.0, 8904.0, 122006.0, 3558997.0, 478844.0, 19748.0, 2513.0, 672.0, 180.0, 73.0, 38.0, 28.0, 13.0, 21.0, 7.0, 9.0, 8.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1182861328125, -0.11385345458984375, -0.1094207763671875, -0.10498809814453125, -0.100555419921875, -0.09612274169921875, -0.0916900634765625, -0.08725738525390625, -0.08282470703125, -0.07839202880859375, -0.0739593505859375, -0.06952667236328125, -0.065093994140625, -0.06066131591796875, -0.0562286376953125, -0.05179595947265625, -0.04736328125, -0.04293060302734375, -0.0384979248046875, -0.03406524658203125, -0.029632568359375, -0.02519989013671875, -0.0207672119140625, -0.01633453369140625, -0.01190185546875, -0.00746917724609375, -0.0030364990234375, 0.00139617919921875, 0.005828857421875, 0.01026153564453125, 0.0146942138671875, 0.01912689208984375, 0.0235595703125, 0.02799224853515625, 0.0324249267578125, 0.03685760498046875, 0.041290283203125, 0.04572296142578125, 0.0501556396484375, 0.05458831787109375, 0.05902099609375, 0.06345367431640625, 0.0678863525390625, 0.07231903076171875, 0.076751708984375, 0.08118438720703125, 0.0856170654296875, 0.09004974365234375, 0.094482421875, 0.09891510009765625, 0.1033477783203125, 0.10778045654296875, 0.112213134765625, 0.11664581298828125, 0.1210784912109375, 0.12551116943359375, 0.12994384765625, 0.13437652587890625, 0.1388092041015625, 0.14324188232421875, 0.147674560546875, 0.15210723876953125, 0.1565399169921875, 0.16097259521484375, 0.1654052734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 3.0, 6.0, 6.0, 18.0, 15.0, 25.0, 45.0, 50.0, 72.0, 129.0, 193.0, 326.0, 514.0, 783.0, 720.0, 440.0, 253.0, 139.0, 71.0, 70.0, 46.0, 37.0, 22.0, 22.0, 9.0, 12.0, 12.0, 6.0, 6.0, 7.0, 7.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04388427734375, -0.042401790618896484, -0.04091930389404297, -0.03943681716918945, -0.03795433044433594, -0.03647184371948242, -0.034989356994628906, -0.03350687026977539, -0.032024383544921875, -0.03054189682006836, -0.029059410095214844, -0.027576923370361328, -0.026094436645507812, -0.024611949920654297, -0.02312946319580078, -0.021646976470947266, -0.02016448974609375, -0.018682003021240234, -0.01719951629638672, -0.015717029571533203, -0.014234542846679688, -0.012752056121826172, -0.011269569396972656, -0.00978708267211914, -0.008304595947265625, -0.006822109222412109, -0.005339622497558594, -0.003857135772705078, -0.0023746490478515625, -0.0008921623229980469, 0.0005903244018554688, 0.0020728111267089844, 0.0035552978515625, 0.005037784576416016, 0.006520271301269531, 0.008002758026123047, 0.009485244750976562, 0.010967731475830078, 0.012450218200683594, 0.01393270492553711, 0.015415191650390625, 0.01689767837524414, 0.018380165100097656, 0.019862651824951172, 0.021345138549804688, 0.022827625274658203, 0.02431011199951172, 0.025792598724365234, 0.02727508544921875, 0.028757572174072266, 0.03024005889892578, 0.0317225456237793, 0.03320503234863281, 0.03468751907348633, 0.036170005798339844, 0.03765249252319336, 0.039134979248046875, 0.04061746597290039, 0.042099952697753906, 0.04358243942260742, 0.04506492614746094, 0.04654741287231445, 0.04802989959716797, 0.049512386322021484, 0.050994873046875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 18.0, 88.0, 543.0, 317.0, 37.0, 8.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4997001886367798, -1.4696202278137207, -1.4395402669906616, -1.4094603061676025, -1.379380464553833, -1.349300503730774, -1.3192205429077148, -1.2891405820846558, -1.2590606212615967, -1.2289806604385376, -1.1989006996154785, -1.168820858001709, -1.13874089717865, -1.1086609363555908, -1.0785809755325317, -1.0485010147094727, -1.0184211730957031, -0.988341212272644, -0.9582613110542297, -0.9281813502311707, -0.8981013894081116, -0.8680214881896973, -0.8379415273666382, -0.8078615665435791, -0.77778160572052, -0.7477016448974609, -0.7176217436790466, -0.6875417828559875, -0.6574618220329285, -0.6273819208145142, -0.5973019599914551, -0.567221999168396, -0.5371420383453369, -0.5070620775222778, -0.47698214650154114, -0.44690221548080444, -0.41682228446006775, -0.38674235343933105, -0.356662392616272, -0.3265824615955353, -0.2965025305747986, -0.2664225995540619, -0.236342653632164, -0.2062627077102661, -0.17618277668952942, -0.14610283076763153, -0.11602288484573364, -0.08594295382499695, -0.055863022804260254, -0.025783082470297813, 0.004296857863664627, 0.03437680006027222, 0.06445673853158951, 0.0945366770029068, 0.12461662292480469, 0.15469655394554138, 0.18477649986743927, 0.21485644578933716, 0.24493637681007385, 0.27501630783081055, 0.30509626865386963, 0.3351761996746063, 0.365256130695343, 0.3953360915184021, 0.4254160225391388]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 3.0, 5.0, 3.0, 7.0, 13.0, 15.0, 14.0, 17.0, 22.0, 20.0, 23.0, 28.0, 29.0, 36.0, 35.0, 42.0, 41.0, 44.0, 60.0, 51.0, 54.0, 45.0, 59.0, 46.0, 33.0, 41.0, 40.0, 21.0, 19.0, 29.0, 25.0, 25.0, 16.0, 9.0, 6.0, 9.0, 9.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16625726222991943, -0.1611109972000122, -0.15596474707126617, -0.15081848204135895, -0.14567223191261292, -0.1405259668827057, -0.13537971675395966, -0.13023345172405243, -0.1250872015953064, -0.11994094401597977, -0.11479468643665314, -0.10964842885732651, -0.10450217127799988, -0.09935590624809265, -0.09420964866876602, -0.08906339108943939, -0.08391712605953217, -0.07877086848020554, -0.0736246109008789, -0.06847835332155228, -0.06333209574222565, -0.05818583443760872, -0.05303957313299179, -0.04789331555366516, -0.04274705797433853, -0.0376008003950119, -0.03245454281568527, -0.027308281511068344, -0.022162023931741714, -0.017015766352415085, -0.011869506910443306, -0.006723247468471527, -0.0015769898891448975, 0.003569268621504307, 0.008715527132153511, 0.013861785642802715, 0.01900804415345192, 0.02415430173277855, 0.029300561174750328, 0.03444682061672211, 0.03959307819604874, 0.044739335775375366, 0.049885593354701996, 0.055031854659318924, 0.060178112238645554, 0.06532436609268188, 0.07047063112258911, 0.07561688870191574, 0.08076314628124237, 0.085909403860569, 0.09105566143989563, 0.09620191901922226, 0.10134817659854889, 0.10649444162845612, 0.11164069920778275, 0.11678695678710938, 0.121933214366436, 0.12707947194576263, 0.13222573697566986, 0.1373719871044159, 0.14251825213432312, 0.14766450226306915, 0.15281076729297638, 0.1579570174217224, 0.16310328245162964]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 6.0, 1.0, 13.0, 17.0, 12.0, 30.0, 41.0, 85.0, 124.0, 182.0, 312.0, 616.0, 1190.0, 2953.0, 8789.0, 43468.0, 547729.0, 397096.0, 33496.0, 7356.0, 2571.0, 1065.0, 547.0, 325.0, 203.0, 120.0, 58.0, 40.0, 34.0, 17.0, 18.0, 5.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.259521484375, -0.2520923614501953, -0.24466323852539062, -0.23723411560058594, -0.22980499267578125, -0.22237586975097656, -0.21494674682617188, -0.2075176239013672, -0.2000885009765625, -0.1926593780517578, -0.18523025512695312, -0.17780113220214844, -0.17037200927734375, -0.16294288635253906, -0.15551376342773438, -0.1480846405029297, -0.140655517578125, -0.1332263946533203, -0.12579727172851562, -0.11836814880371094, -0.11093902587890625, -0.10350990295410156, -0.09608078002929688, -0.08865165710449219, -0.0812225341796875, -0.07379341125488281, -0.06636428833007812, -0.05893516540527344, -0.05150604248046875, -0.04407691955566406, -0.036647796630859375, -0.029218673706054688, -0.02178955078125, -0.014360427856445312, -0.006931304931640625, 0.0004978179931640625, 0.00792694091796875, 0.015356063842773438, 0.022785186767578125, 0.030214309692382812, 0.0376434326171875, 0.04507255554199219, 0.052501678466796875, 0.05993080139160156, 0.06735992431640625, 0.07478904724121094, 0.08221817016601562, 0.08964729309082031, 0.097076416015625, 0.10450553894042969, 0.11193466186523438, 0.11936378479003906, 0.12679290771484375, 0.13422203063964844, 0.14165115356445312, 0.1490802764892578, 0.1565093994140625, 0.1639385223388672, 0.17136764526367188, 0.17879676818847656, 0.18622589111328125, 0.19365501403808594, 0.20108413696289062, 0.2085132598876953, 0.2159423828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 6.0, 7.0, 12.0, 14.0, 29.0, 47.0, 60.0, 58.0, 88.0, 86.0, 76.0, 100.0, 80.0, 76.0, 87.0, 53.0, 27.0, 29.0, 19.0, 18.0, 12.0, 7.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.081787109375, -0.07944679260253906, -0.07710647583007812, -0.07476615905761719, -0.07242584228515625, -0.07008552551269531, -0.06774520874023438, -0.06540489196777344, -0.0630645751953125, -0.06072425842285156, -0.058383941650390625, -0.05604362487792969, -0.05370330810546875, -0.05136299133300781, -0.049022674560546875, -0.04668235778808594, -0.044342041015625, -0.04200172424316406, -0.039661407470703125, -0.03732109069824219, -0.03498077392578125, -0.03264045715332031, -0.030300140380859375, -0.027959823608398438, -0.0256195068359375, -0.023279190063476562, -0.020938873291015625, -0.018598556518554688, -0.01625823974609375, -0.013917922973632812, -0.011577606201171875, -0.009237289428710938, -0.00689697265625, -0.0045566558837890625, -0.002216339111328125, 0.0001239776611328125, 0.00246429443359375, 0.0048046112060546875, 0.007144927978515625, 0.009485244750976562, 0.0118255615234375, 0.014165878295898438, 0.016506195068359375, 0.018846511840820312, 0.02118682861328125, 0.023527145385742188, 0.025867462158203125, 0.028207778930664062, 0.030548095703125, 0.03288841247558594, 0.035228729248046875, 0.03756904602050781, 0.03990936279296875, 0.04224967956542969, 0.044589996337890625, 0.04693031311035156, 0.0492706298828125, 0.05161094665527344, 0.053951263427734375, 0.05629158020019531, 0.05863189697265625, 0.06097221374511719, 0.06331253051757812, 0.06565284729003906, 0.0679931640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 9.0, 5.0, 6.0, 13.0, 11.0, 21.0, 21.0, 26.0, 48.0, 44.0, 66.0, 110.0, 193.0, 511.0, 4129.0, 206181.0, 819056.0, 16326.0, 1048.0, 276.0, 118.0, 90.0, 41.0, 40.0, 31.0, 21.0, 18.0, 16.0, 14.0, 15.0, 8.0, 13.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3037109375, -0.29508399963378906, -0.2864570617675781, -0.2778301239013672, -0.26920318603515625, -0.2605762481689453, -0.2519493103027344, -0.24332237243652344, -0.2346954345703125, -0.22606849670410156, -0.21744155883789062, -0.2088146209716797, -0.20018768310546875, -0.1915607452392578, -0.18293380737304688, -0.17430686950683594, -0.165679931640625, -0.15705299377441406, -0.14842605590820312, -0.1397991180419922, -0.13117218017578125, -0.12254524230957031, -0.11391830444335938, -0.10529136657714844, -0.0966644287109375, -0.08803749084472656, -0.07941055297851562, -0.07078361511230469, -0.06215667724609375, -0.05352973937988281, -0.044902801513671875, -0.03627586364746094, -0.02764892578125, -0.019021987915039062, -0.010395050048828125, -0.0017681121826171875, 0.00685882568359375, 0.015485763549804688, 0.024112701416015625, 0.03273963928222656, 0.0413665771484375, 0.04999351501464844, 0.058620452880859375, 0.06724739074707031, 0.07587432861328125, 0.08450126647949219, 0.09312820434570312, 0.10175514221191406, 0.110382080078125, 0.11900901794433594, 0.12763595581054688, 0.1362628936767578, 0.14488983154296875, 0.1535167694091797, 0.16214370727539062, 0.17077064514160156, 0.1793975830078125, 0.18802452087402344, 0.19665145874023438, 0.2052783966064453, 0.21390533447265625, 0.2225322723388672, 0.23115921020507812, 0.23978614807128906, 0.2484130859375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 5.0, 5.0, 4.0, 7.0, 13.0, 11.0, 16.0, 15.0, 16.0, 34.0, 41.0, 45.0, 39.0, 52.0, 58.0, 55.0, 44.0, 51.0, 48.0, 52.0, 40.0, 44.0, 43.0, 42.0, 33.0, 37.0, 24.0, 25.0, 19.0, 17.0, 14.0, 7.0, 13.0, 9.0, 5.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0845947265625, -0.0819234848022461, -0.07925224304199219, -0.07658100128173828, -0.07390975952148438, -0.07123851776123047, -0.06856727600097656, -0.06589603424072266, -0.06322479248046875, -0.060553550720214844, -0.05788230895996094, -0.05521106719970703, -0.052539825439453125, -0.04986858367919922, -0.04719734191894531, -0.044526100158691406, -0.0418548583984375, -0.039183616638183594, -0.03651237487792969, -0.03384113311767578, -0.031169891357421875, -0.02849864959716797, -0.025827407836914062, -0.023156166076660156, -0.02048492431640625, -0.017813682556152344, -0.015142440795898438, -0.012471199035644531, -0.009799957275390625, -0.007128715515136719, -0.0044574737548828125, -0.0017862319946289062, 0.000885009765625, 0.0035562515258789062, 0.0062274932861328125, 0.008898735046386719, 0.011569976806640625, 0.014241218566894531, 0.016912460327148438, 0.019583702087402344, 0.02225494384765625, 0.024926185607910156, 0.027597427368164062, 0.03026866912841797, 0.032939910888671875, 0.03561115264892578, 0.03828239440917969, 0.040953636169433594, 0.0436248779296875, 0.046296119689941406, 0.04896736145019531, 0.05163860321044922, 0.054309844970703125, 0.05698108673095703, 0.05965232849121094, 0.062323570251464844, 0.06499481201171875, 0.06766605377197266, 0.07033729553222656, 0.07300853729248047, 0.07567977905273438, 0.07835102081298828, 0.08102226257324219, 0.0836935043334961, 0.08636474609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 10.0, 3.0, 8.0, 14.0, 15.0, 22.0, 34.0, 38.0, 87.0, 123.0, 191.0, 338.0, 589.0, 1278.0, 2609.0, 5668.0, 13016.0, 32644.0, 89472.0, 251354.0, 379538.0, 170613.0, 60221.0, 22793.0, 9568.0, 4181.0, 1884.0, 966.0, 536.0, 248.0, 174.0, 93.0, 63.0, 49.0, 30.0, 27.0, 11.0, 9.0, 12.0, 9.0, 3.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01910400390625, -0.018512725830078125, -0.01792144775390625, -0.017330169677734375, -0.0167388916015625, -0.016147613525390625, -0.01555633544921875, -0.014965057373046875, -0.014373779296875, -0.013782501220703125, -0.01319122314453125, -0.012599945068359375, -0.0120086669921875, -0.011417388916015625, -0.01082611083984375, -0.010234832763671875, -0.0096435546875, -0.009052276611328125, -0.00846099853515625, -0.007869720458984375, -0.0072784423828125, -0.006687164306640625, -0.00609588623046875, -0.005504608154296875, -0.004913330078125, -0.004322052001953125, -0.00373077392578125, -0.003139495849609375, -0.0025482177734375, -0.001956939697265625, -0.00136566162109375, -0.000774383544921875, -0.00018310546875, 0.000408172607421875, 0.00099945068359375, 0.001590728759765625, 0.0021820068359375, 0.002773284912109375, 0.00336456298828125, 0.003955841064453125, 0.004547119140625, 0.005138397216796875, 0.00572967529296875, 0.006320953369140625, 0.0069122314453125, 0.007503509521484375, 0.00809478759765625, 0.008686065673828125, 0.00927734375, 0.009868621826171875, 0.01045989990234375, 0.011051177978515625, 0.0116424560546875, 0.012233734130859375, 0.01282501220703125, 0.013416290283203125, 0.014007568359375, 0.014598846435546875, 0.01519012451171875, 0.015781402587890625, 0.0163726806640625, 0.016963958740234375, 0.01755523681640625, 0.018146514892578125, 0.01873779296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 9.0, 5.0, 10.0, 10.0, 10.0, 10.0, 10.0, 21.0, 21.0, 27.0, 44.0, 44.0, 49.0, 75.0, 77.0, 67.0, 69.0, 64.0, 66.0, 46.0, 46.0, 34.0, 38.0, 26.0, 27.0, 16.0, 18.0, 15.0, 8.0, 12.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.000301361083984e-06, -8.72090458869934e-06, -8.441507816314697e-06, -8.162111043930054e-06, -7.88271427154541e-06, -7.603317499160767e-06, -7.323920726776123e-06, -7.0445239543914795e-06, -6.765127182006836e-06, -6.485730409622192e-06, -6.206333637237549e-06, -5.926936864852905e-06, -5.647540092468262e-06, -5.368143320083618e-06, -5.088746547698975e-06, -4.809349775314331e-06, -4.5299530029296875e-06, -4.250556230545044e-06, -3.9711594581604e-06, -3.691762685775757e-06, -3.4123659133911133e-06, -3.1329691410064697e-06, -2.853572368621826e-06, -2.5741755962371826e-06, -2.294778823852539e-06, -2.0153820514678955e-06, -1.735985279083252e-06, -1.4565885066986084e-06, -1.1771917343139648e-06, -8.977949619293213e-07, -6.183981895446777e-07, -3.390014171600342e-07, -5.960464477539063e-08, 2.1979212760925293e-07, 4.991888999938965e-07, 7.7858567237854e-07, 1.0579824447631836e-06, 1.3373792171478271e-06, 1.6167759895324707e-06, 1.8961727619171143e-06, 2.175569534301758e-06, 2.4549663066864014e-06, 2.734363079071045e-06, 3.0137598514556885e-06, 3.293156623840332e-06, 3.5725533962249756e-06, 3.851950168609619e-06, 4.131346940994263e-06, 4.410743713378906e-06, 4.69014048576355e-06, 4.969537258148193e-06, 5.248934030532837e-06, 5.5283308029174805e-06, 5.807727575302124e-06, 6.087124347686768e-06, 6.366521120071411e-06, 6.645917892456055e-06, 6.925314664840698e-06, 7.204711437225342e-06, 7.484108209609985e-06, 7.763504981994629e-06, 8.042901754379272e-06, 8.322298526763916e-06, 8.60169529914856e-06, 8.881092071533203e-06]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 3.0, 18.0, 19.0, 18.0, 26.0, 31.0, 37.0, 58.0, 99.0, 183.0, 742.0, 10988.0, 544258.0, 481136.0, 9682.0, 757.0, 194.0, 88.0, 53.0, 38.0, 29.0, 18.0, 18.0, 15.0, 11.0, 6.0, 6.0, 7.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05389404296875, -0.05209636688232422, -0.05029869079589844, -0.048501014709472656, -0.046703338623046875, -0.044905662536621094, -0.04310798645019531, -0.04131031036376953, -0.03951263427734375, -0.03771495819091797, -0.03591728210449219, -0.034119606018066406, -0.032321929931640625, -0.030524253845214844, -0.028726577758789062, -0.02692890167236328, -0.0251312255859375, -0.02333354949951172, -0.021535873413085938, -0.019738197326660156, -0.017940521240234375, -0.016142845153808594, -0.014345169067382812, -0.012547492980957031, -0.01074981689453125, -0.008952140808105469, -0.0071544647216796875, -0.005356788635253906, -0.003559112548828125, -0.0017614364624023438, 3.62396240234375e-05, 0.0018339157104492188, 0.003631591796875, 0.005429267883300781, 0.0072269439697265625, 0.009024620056152344, 0.010822296142578125, 0.012619972229003906, 0.014417648315429688, 0.01621532440185547, 0.01801300048828125, 0.01981067657470703, 0.021608352661132812, 0.023406028747558594, 0.025203704833984375, 0.027001380920410156, 0.028799057006835938, 0.03059673309326172, 0.0323944091796875, 0.03419208526611328, 0.03598976135253906, 0.037787437438964844, 0.039585113525390625, 0.041382789611816406, 0.04318046569824219, 0.04497814178466797, 0.04677581787109375, 0.04857349395751953, 0.05037117004394531, 0.052168846130371094, 0.053966522216796875, 0.055764198303222656, 0.05756187438964844, 0.05935955047607422, 0.0611572265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 5.0, 12.0, 12.0, 14.0, 27.0, 21.0, 35.0, 34.0, 41.0, 43.0, 63.0, 74.0, 73.0, 85.0, 75.0, 72.0, 57.0, 50.0, 37.0, 31.0, 23.0, 21.0, 20.0, 10.0, 16.0, 12.0, 4.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0137939453125, -0.013353943824768066, -0.012913942337036133, -0.0124739408493042, -0.012033939361572266, -0.011593937873840332, -0.011153936386108398, -0.010713934898376465, -0.010273933410644531, -0.009833931922912598, -0.009393930435180664, -0.00895392894744873, -0.008513927459716797, -0.008073925971984863, -0.00763392448425293, -0.007193922996520996, -0.0067539215087890625, -0.006313920021057129, -0.005873918533325195, -0.005433917045593262, -0.004993915557861328, -0.0045539140701293945, -0.004113912582397461, -0.0036739110946655273, -0.0032339096069335938, -0.00279390811920166, -0.0023539066314697266, -0.001913905143737793, -0.0014739036560058594, -0.0010339021682739258, -0.0005939006805419922, -0.0001538991928100586, 0.000286102294921875, 0.0007261037826538086, 0.0011661052703857422, 0.0016061067581176758, 0.0020461082458496094, 0.002486109733581543, 0.0029261112213134766, 0.00336611270904541, 0.0038061141967773438, 0.004246115684509277, 0.004686117172241211, 0.0051261186599731445, 0.005566120147705078, 0.006006121635437012, 0.006446123123168945, 0.006886124610900879, 0.0073261260986328125, 0.007766127586364746, 0.00820612907409668, 0.008646130561828613, 0.009086132049560547, 0.00952613353729248, 0.009966135025024414, 0.010406136512756348, 0.010846138000488281, 0.011286139488220215, 0.011726140975952148, 0.012166142463684082, 0.012606143951416016, 0.01304614543914795, 0.013486146926879883, 0.013926148414611816, 0.01436614990234375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 48.0, 264.0, 479.0, 180.0, 32.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3462444543838501, -0.32376745343208313, -0.30129048228263855, -0.2788134813308716, -0.256336510181427, -0.23385950922966003, -0.21138252317905426, -0.1889055371284485, -0.1664285510778427, -0.14395156502723694, -0.12147457897663116, -0.0989975854754448, -0.07652059942483902, -0.054043613374233246, -0.031566619873046875, -0.009089633822441101, 0.013387352228164673, 0.03586433827877045, 0.05834132805466652, 0.08081831783056259, 0.10329530388116837, 0.12577229738235474, 0.1482492834329605, 0.17072626948356628, 0.19320325553417206, 0.21568024158477783, 0.2381572276353836, 0.2606342136859894, 0.28311121463775635, 0.3055881857872009, 0.3280651867389679, 0.35054218769073486, 0.37301915884017944, 0.3954961597919464, 0.417973130941391, 0.44045013189315796, 0.46292710304260254, 0.4854041039943695, 0.5078811049461365, 0.530358076095581, 0.5528350472450256, 0.5753120183944702, 0.5977890491485596, 0.6202660202980042, 0.6427429914474487, 0.6652199625968933, 0.6876969933509827, 0.7101739645004272, 0.7326509952545166, 0.7551279664039612, 0.7776049971580505, 0.8000819683074951, 0.8225589394569397, 0.8450359106063843, 0.8675129413604736, 0.8899899125099182, 0.9124668836593628, 0.9349438548088074, 0.9574208855628967, 0.9798978567123413, 1.0023748874664307, 1.0248517990112305, 1.0473288297653198, 1.0698058605194092, 1.092282772064209]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 5.0, 7.0, 6.0, 9.0, 13.0, 11.0, 16.0, 17.0, 22.0, 18.0, 15.0, 20.0, 30.0, 46.0, 40.0, 35.0, 29.0, 42.0, 45.0, 43.0, 44.0, 56.0, 44.0, 43.0, 45.0, 52.0, 24.0, 27.0, 27.0, 35.0, 18.0, 17.0, 13.0, 15.0, 21.0, 10.0, 12.0, 4.0, 6.0, 7.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2666276693344116, -0.2581077218055725, -0.249587744474411, -0.2410677820444107, -0.2325478196144104, -0.2240278571844101, -0.2155078947544098, -0.20698793232440948, -0.19846796989440918, -0.18994800746440887, -0.18142804503440857, -0.17290808260440826, -0.16438812017440796, -0.15586815774440765, -0.14734819531440735, -0.13882823288440704, -0.13030827045440674, -0.12178830802440643, -0.11326834559440613, -0.10474838316440582, -0.09622842073440552, -0.08770845830440521, -0.07918849587440491, -0.0706685334444046, -0.0621485710144043, -0.05362860858440399, -0.045108646154403687, -0.03658868372440338, -0.028068721294403076, -0.01954875886440277, -0.011028796434402466, -0.0025088340044021606, 0.0060111284255981445, 0.01453109085559845, 0.023051053285598755, 0.03157101571559906, 0.040090978145599365, 0.04861094057559967, 0.057130903005599976, 0.06565086543560028, 0.07417082786560059, 0.08269079029560089, 0.0912107527256012, 0.0997307151556015, 0.1082506775856018, 0.11677064001560211, 0.12529060244560242, 0.13381056487560272, 0.14233052730560303, 0.15085048973560333, 0.15937045216560364, 0.16789041459560394, 0.17641037702560425, 0.18493033945560455, 0.19345030188560486, 0.20197026431560516, 0.21049022674560547, 0.21901018917560577, 0.22753015160560608, 0.23605011403560638, 0.2445700764656067, 0.2530900239944458, 0.2616100013256073, 0.2701299786567688, 0.2786499261856079]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 3.0, 8.0, 6.0, 20.0, 14.0, 35.0, 48.0, 92.0, 156.0, 296.0, 587.0, 1429.0, 6688.0, 883379.0, 3286974.0, 11356.0, 1796.0, 648.0, 323.0, 174.0, 101.0, 54.0, 31.0, 24.0, 13.0, 13.0, 3.0, 3.0, 4.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.321533203125, -0.3128662109375, -0.30419921875, -0.2955322265625, -0.286865234375, -0.2781982421875, -0.26953125, -0.2608642578125, -0.252197265625, -0.2435302734375, -0.23486328125, -0.2261962890625, -0.217529296875, -0.2088623046875, -0.2001953125, -0.1915283203125, -0.182861328125, -0.1741943359375, -0.16552734375, -0.1568603515625, -0.148193359375, -0.1395263671875, -0.130859375, -0.1221923828125, -0.113525390625, -0.1048583984375, -0.09619140625, -0.0875244140625, -0.078857421875, -0.0701904296875, -0.0615234375, -0.0528564453125, -0.044189453125, -0.0355224609375, -0.02685546875, -0.0181884765625, -0.009521484375, -0.0008544921875, 0.0078125, 0.0164794921875, 0.025146484375, 0.0338134765625, 0.04248046875, 0.0511474609375, 0.059814453125, 0.0684814453125, 0.0771484375, 0.0858154296875, 0.094482421875, 0.1031494140625, 0.11181640625, 0.1204833984375, 0.129150390625, 0.1378173828125, 0.146484375, 0.1551513671875, 0.163818359375, 0.1724853515625, 0.18115234375, 0.1898193359375, 0.198486328125, 0.2071533203125, 0.2158203125, 0.2244873046875, 0.233154296875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 10.0, 15.0, 19.0, 31.0, 43.0, 58.0, 59.0, 80.0, 69.0, 76.0, 83.0, 68.0, 84.0, 72.0, 71.0, 46.0, 19.0, 29.0, 20.0, 10.0, 13.0, 9.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06695556640625, -0.06487751007080078, -0.06279945373535156, -0.060721397399902344, -0.058643341064453125, -0.056565284729003906, -0.05448722839355469, -0.05240917205810547, -0.05033111572265625, -0.04825305938720703, -0.04617500305175781, -0.044096946716308594, -0.042018890380859375, -0.039940834045410156, -0.03786277770996094, -0.03578472137451172, -0.0337066650390625, -0.03162860870361328, -0.029550552368164062, -0.027472496032714844, -0.025394439697265625, -0.023316383361816406, -0.021238327026367188, -0.01916027069091797, -0.01708221435546875, -0.015004158020019531, -0.012926101684570312, -0.010848045349121094, -0.008769989013671875, -0.006691932678222656, -0.0046138763427734375, -0.0025358200073242188, -0.000457763671875, 0.0016202926635742188, 0.0036983489990234375, 0.005776405334472656, 0.007854461669921875, 0.009932518005371094, 0.012010574340820312, 0.014088630676269531, 0.01616668701171875, 0.01824474334716797, 0.020322799682617188, 0.022400856018066406, 0.024478912353515625, 0.026556968688964844, 0.028635025024414062, 0.03071308135986328, 0.0327911376953125, 0.03486919403076172, 0.03694725036621094, 0.039025306701660156, 0.041103363037109375, 0.043181419372558594, 0.04525947570800781, 0.04733753204345703, 0.04941558837890625, 0.05149364471435547, 0.05357170104980469, 0.055649757385253906, 0.057727813720703125, 0.059805870056152344, 0.06188392639160156, 0.06396198272705078, 0.0660400390625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 8.0, 12.0, 9.0, 16.0, 24.0, 24.0, 48.0, 66.0, 109.0, 179.0, 358.0, 944.0, 4052.0, 33990.0, 697811.0, 3211883.0, 226110.0, 14897.0, 2316.0, 700.0, 281.0, 133.0, 77.0, 52.0, 45.0, 33.0, 25.0, 17.0, 15.0, 10.0, 6.0, 4.0, 10.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10235595703125, -0.09796810150146484, -0.09358024597167969, -0.08919239044189453, -0.08480453491210938, -0.08041667938232422, -0.07602882385253906, -0.0716409683227539, -0.06725311279296875, -0.0628652572631836, -0.05847740173339844, -0.05408954620361328, -0.049701690673828125, -0.04531383514404297, -0.04092597961425781, -0.036538124084472656, -0.0321502685546875, -0.027762413024902344, -0.023374557495117188, -0.01898670196533203, -0.014598846435546875, -0.010210990905761719, -0.0058231353759765625, -0.0014352798461914062, 0.00295257568359375, 0.007340431213378906, 0.011728286743164062, 0.01611614227294922, 0.020503997802734375, 0.02489185333251953, 0.029279708862304688, 0.033667564392089844, 0.038055419921875, 0.042443275451660156, 0.04683113098144531, 0.05121898651123047, 0.055606842041015625, 0.05999469757080078, 0.06438255310058594, 0.0687704086303711, 0.07315826416015625, 0.0775461196899414, 0.08193397521972656, 0.08632183074951172, 0.09070968627929688, 0.09509754180908203, 0.09948539733886719, 0.10387325286865234, 0.1082611083984375, 0.11264896392822266, 0.11703681945800781, 0.12142467498779297, 0.12581253051757812, 0.13020038604736328, 0.13458824157714844, 0.1389760971069336, 0.14336395263671875, 0.1477518081665039, 0.15213966369628906, 0.15652751922607422, 0.16091537475585938, 0.16530323028564453, 0.1696910858154297, 0.17407894134521484, 0.178466796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 9.0, 5.0, 12.0, 16.0, 15.0, 24.0, 31.0, 61.0, 52.0, 71.0, 123.0, 160.0, 197.0, 279.0, 352.0, 475.0, 565.0, 442.0, 306.0, 223.0, 157.0, 123.0, 83.0, 62.0, 55.0, 45.0, 38.0, 22.0, 17.0, 12.0, 11.0, 6.0, 3.0, 4.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.05499267578125, -0.05346822738647461, -0.05194377899169922, -0.05041933059692383, -0.04889488220214844, -0.04737043380737305, -0.045845985412597656, -0.044321537017822266, -0.042797088623046875, -0.041272640228271484, -0.039748191833496094, -0.0382237434387207, -0.03669929504394531, -0.03517484664916992, -0.03365039825439453, -0.03212594985961914, -0.03060150146484375, -0.02907705307006836, -0.02755260467529297, -0.026028156280517578, -0.024503707885742188, -0.022979259490966797, -0.021454811096191406, -0.019930362701416016, -0.018405914306640625, -0.016881465911865234, -0.015357017517089844, -0.013832569122314453, -0.012308120727539062, -0.010783672332763672, -0.009259223937988281, -0.007734775543212891, -0.0062103271484375, -0.004685878753662109, -0.0031614303588867188, -0.0016369819641113281, -0.0001125335693359375, 0.0014119148254394531, 0.0029363632202148438, 0.004460811614990234, 0.005985260009765625, 0.007509708404541016, 0.009034156799316406, 0.010558605194091797, 0.012083053588867188, 0.013607501983642578, 0.015131950378417969, 0.01665639877319336, 0.01818084716796875, 0.01970529556274414, 0.02122974395751953, 0.022754192352294922, 0.024278640747070312, 0.025803089141845703, 0.027327537536621094, 0.028851985931396484, 0.030376434326171875, 0.031900882720947266, 0.033425331115722656, 0.03494977951049805, 0.03647422790527344, 0.03799867630004883, 0.03952312469482422, 0.04104757308959961, 0.042572021484375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 12.0, 650.0, 347.0, 9.0, 1.0, 0.0, 1.0], "bins": [-3.672536849975586, -3.6101274490356445, -3.547718048095703, -3.4853084087371826, -3.422899007797241, -3.3604896068573, -3.2980802059173584, -3.235670566558838, -3.1732611656188965, -3.110851764678955, -3.0484423637390137, -2.986032724380493, -2.9236233234405518, -2.8612139225006104, -2.798804521560669, -2.7363948822021484, -2.673985481262207, -2.6115760803222656, -2.549166679382324, -2.4867570400238037, -2.4243476390838623, -2.361938238143921, -2.2995288372039795, -2.237119197845459, -2.1747097969055176, -2.112300395965576, -2.0498909950256348, -1.9874814748764038, -1.9250719547271729, -1.8626625537872314, -1.8002530336380005, -1.737843632698059, -1.6754341125488281, -1.6130247116088867, -1.5506151914596558, -1.4882057905197144, -1.4257962703704834, -1.363386869430542, -1.300977349281311, -1.2385679483413696, -1.1761585474014282, -1.1137491464614868, -1.0513396263122559, -0.9889301657676697, -0.9265207052230835, -0.8641113042831421, -0.8017017841339111, -0.7392923831939697, -0.6768828630447388, -0.6144734025001526, -0.5520639419555664, -0.4896544814109802, -0.42724502086639404, -0.36483559012413025, -0.30242612957954407, -0.24001666903495789, -0.1776072084903717, -0.11519774794578552, -0.05278829485177994, 0.009621158242225647, 0.07203061878681183, 0.13444006443023682, 0.196849524974823, 0.2592589855194092, 0.32166844606399536]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 1.0, 5.0, 4.0, 10.0, 9.0, 15.0, 14.0, 15.0, 19.0, 34.0, 39.0, 42.0, 56.0, 61.0, 37.0, 42.0, 57.0, 60.0, 47.0, 52.0, 43.0, 70.0, 45.0, 45.0, 32.0, 29.0, 20.0, 18.0, 21.0, 19.0, 14.0, 7.0, 5.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18857109546661377, -0.18238410353660583, -0.1761971265077591, -0.17001013457775116, -0.16382314264774323, -0.15763616561889648, -0.15144917368888855, -0.14526218175888062, -0.13907518982887268, -0.13288819789886475, -0.126701220870018, -0.12051422894001007, -0.11432723701000214, -0.1081402525305748, -0.10195326805114746, -0.09576627612113953, -0.08957929909229279, -0.08339231461286545, -0.07720532268285751, -0.07101833820343018, -0.06483134627342224, -0.058644361793994904, -0.052457377314567566, -0.04627038910984993, -0.040083400905132294, -0.03389641270041466, -0.02770942635834217, -0.021522440016269684, -0.015335451811552048, -0.009148463606834412, -0.002961479127407074, 0.003225509077310562, 0.009412497282028198, 0.01559948455542326, 0.02178647182881832, 0.027973458170890808, 0.034160446375608444, 0.04034743458032608, 0.04653441905975342, 0.052721407264471054, 0.05890839546918869, 0.06509537994861603, 0.07128237187862396, 0.0774693563580513, 0.08365634083747864, 0.08984333276748657, 0.09603031724691391, 0.10221730172634125, 0.10840429365634918, 0.11459127813577652, 0.12077827006578445, 0.1269652545452118, 0.13315224647521973, 0.13933923840522766, 0.1455262154340744, 0.15171320736408234, 0.15790018439292908, 0.164087176322937, 0.17027415335178375, 0.1764611452817917, 0.18264813721179962, 0.18883511424064636, 0.1950221061706543, 0.20120909810066223, 0.20739609003067017]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 3.0, 4.0, 8.0, 6.0, 8.0, 8.0, 13.0, 22.0, 21.0, 43.0, 53.0, 83.0, 139.0, 247.0, 421.0, 729.0, 1471.0, 3258.0, 7660.0, 20446.0, 69036.0, 307271.0, 464055.0, 122057.0, 31686.0, 11121.0, 4507.0, 1965.0, 955.0, 485.0, 296.0, 151.0, 87.0, 69.0, 53.0, 25.0, 17.0, 14.0, 16.0, 9.0, 9.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1309814453125, -0.12691307067871094, -0.12284469604492188, -0.11877632141113281, -0.11470794677734375, -0.11063957214355469, -0.10657119750976562, -0.10250282287597656, -0.0984344482421875, -0.09436607360839844, -0.09029769897460938, -0.08622932434082031, -0.08216094970703125, -0.07809257507324219, -0.07402420043945312, -0.06995582580566406, -0.065887451171875, -0.06181907653808594, -0.057750701904296875, -0.05368232727050781, -0.04961395263671875, -0.04554557800292969, -0.041477203369140625, -0.03740882873535156, -0.0333404541015625, -0.029272079467773438, -0.025203704833984375, -0.021135330200195312, -0.01706695556640625, -0.012998580932617188, -0.008930206298828125, -0.0048618316650390625, -0.00079345703125, 0.0032749176025390625, 0.007343292236328125, 0.011411666870117188, 0.01548004150390625, 0.019548416137695312, 0.023616790771484375, 0.027685165405273438, 0.0317535400390625, 0.03582191467285156, 0.039890289306640625, 0.04395866394042969, 0.04802703857421875, 0.05209541320800781, 0.056163787841796875, 0.06023216247558594, 0.064300537109375, 0.06836891174316406, 0.07243728637695312, 0.07650566101074219, 0.08057403564453125, 0.08464241027832031, 0.08871078491210938, 0.09277915954589844, 0.0968475341796875, 0.10091590881347656, 0.10498428344726562, 0.10905265808105469, 0.11312103271484375, 0.11718940734863281, 0.12125778198242188, 0.12532615661621094, 0.12939453125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 7.0, 9.0, 19.0, 25.0, 30.0, 53.0, 65.0, 61.0, 74.0, 92.0, 83.0, 90.0, 76.0, 88.0, 72.0, 49.0, 34.0, 18.0, 15.0, 19.0, 11.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07733154296875, -0.07509613037109375, -0.0728607177734375, -0.07062530517578125, -0.068389892578125, -0.06615447998046875, -0.0639190673828125, -0.06168365478515625, -0.0594482421875, -0.05721282958984375, -0.0549774169921875, -0.05274200439453125, -0.050506591796875, -0.04827117919921875, -0.0460357666015625, -0.04380035400390625, -0.04156494140625, -0.03932952880859375, -0.0370941162109375, -0.03485870361328125, -0.032623291015625, -0.03038787841796875, -0.0281524658203125, -0.02591705322265625, -0.023681640625, -0.02144622802734375, -0.0192108154296875, -0.01697540283203125, -0.014739990234375, -0.01250457763671875, -0.0102691650390625, -0.00803375244140625, -0.00579833984375, -0.00356292724609375, -0.0013275146484375, 0.00090789794921875, 0.003143310546875, 0.00537872314453125, 0.0076141357421875, 0.00984954833984375, 0.0120849609375, 0.01432037353515625, 0.0165557861328125, 0.01879119873046875, 0.021026611328125, 0.02326202392578125, 0.0254974365234375, 0.02773284912109375, 0.02996826171875, 0.03220367431640625, 0.0344390869140625, 0.03667449951171875, 0.038909912109375, 0.04114532470703125, 0.0433807373046875, 0.04561614990234375, 0.0478515625, 0.05008697509765625, 0.0523223876953125, 0.05455780029296875, 0.056793212890625, 0.05902862548828125, 0.0612640380859375, 0.06349945068359375, 0.06573486328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 5.0, 6.0, 9.0, 12.0, 22.0, 30.0, 37.0, 53.0, 65.0, 145.0, 322.0, 997.0, 4539.0, 26888.0, 314871.0, 628674.0, 60613.0, 8628.0, 1723.0, 430.0, 165.0, 105.0, 68.0, 32.0, 24.0, 25.0, 17.0, 7.0, 9.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.22509765625, -0.21870040893554688, -0.21230316162109375, -0.20590591430664062, -0.1995086669921875, -0.19311141967773438, -0.18671417236328125, -0.18031692504882812, -0.173919677734375, -0.16752243041992188, -0.16112518310546875, -0.15472793579101562, -0.1483306884765625, -0.14193344116210938, -0.13553619384765625, -0.12913894653320312, -0.12274169921875, -0.11634445190429688, -0.10994720458984375, -0.10354995727539062, -0.0971527099609375, -0.09075546264648438, -0.08435821533203125, -0.07796096801757812, -0.071563720703125, -0.06516647338867188, -0.05876922607421875, -0.052371978759765625, -0.0459747314453125, -0.039577484130859375, -0.03318023681640625, -0.026782989501953125, -0.0203857421875, -0.013988494873046875, -0.00759124755859375, -0.001194000244140625, 0.0052032470703125, 0.011600494384765625, 0.01799774169921875, 0.024394989013671875, 0.030792236328125, 0.037189483642578125, 0.04358673095703125, 0.049983978271484375, 0.0563812255859375, 0.06277847290039062, 0.06917572021484375, 0.07557296752929688, 0.08197021484375, 0.08836746215820312, 0.09476470947265625, 0.10116195678710938, 0.1075592041015625, 0.11395645141601562, 0.12035369873046875, 0.12675094604492188, 0.133148193359375, 0.13954544067382812, 0.14594268798828125, 0.15233993530273438, 0.1587371826171875, 0.16513442993164062, 0.17153167724609375, 0.17792892456054688, 0.184326171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 5.0, 12.0, 8.0, 7.0, 17.0, 14.0, 20.0, 32.0, 26.0, 25.0, 31.0, 44.0, 57.0, 34.0, 49.0, 59.0, 52.0, 49.0, 53.0, 53.0, 36.0, 49.0, 43.0, 27.0, 31.0, 18.0, 30.0, 20.0, 24.0, 11.0, 9.0, 11.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07806015014648438, -0.07524871826171875, -0.07243728637695312, -0.0696258544921875, -0.06681442260742188, -0.06400299072265625, -0.061191558837890625, -0.058380126953125, -0.055568695068359375, -0.05275726318359375, -0.049945831298828125, -0.0471343994140625, -0.044322967529296875, -0.04151153564453125, -0.038700103759765625, -0.035888671875, -0.033077239990234375, -0.03026580810546875, -0.027454376220703125, -0.0246429443359375, -0.021831512451171875, -0.01902008056640625, -0.016208648681640625, -0.013397216796875, -0.010585784912109375, -0.00777435302734375, -0.004962921142578125, -0.0021514892578125, 0.000659942626953125, 0.00347137451171875, 0.006282806396484375, 0.00909423828125, 0.011905670166015625, 0.01471710205078125, 0.017528533935546875, 0.0203399658203125, 0.023151397705078125, 0.02596282958984375, 0.028774261474609375, 0.031585693359375, 0.034397125244140625, 0.03720855712890625, 0.040019989013671875, 0.0428314208984375, 0.045642852783203125, 0.04845428466796875, 0.051265716552734375, 0.0540771484375, 0.056888580322265625, 0.05970001220703125, 0.06251144409179688, 0.0653228759765625, 0.06813430786132812, 0.07094573974609375, 0.07375717163085938, 0.076568603515625, 0.07938003540039062, 0.08219146728515625, 0.08500289916992188, 0.0878143310546875, 0.09062576293945312, 0.09343719482421875, 0.09624862670898438, 0.09906005859375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 14.0, 8.0, 28.0, 24.0, 55.0, 83.0, 136.0, 207.0, 338.0, 621.0, 1123.0, 2348.0, 5783.0, 16584.0, 86521.0, 683047.0, 210064.0, 27126.0, 8020.0, 3095.0, 1501.0, 770.0, 428.0, 239.0, 142.0, 82.0, 58.0, 28.0, 17.0, 12.0, 8.0, 12.0, 4.0, 3.0, 2.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06805419921875, -0.06517982482910156, -0.062305450439453125, -0.05943107604980469, -0.05655670166015625, -0.05368232727050781, -0.050807952880859375, -0.04793357849121094, -0.0450592041015625, -0.04218482971191406, -0.039310455322265625, -0.03643608093261719, -0.03356170654296875, -0.030687332153320312, -0.027812957763671875, -0.024938583374023438, -0.022064208984375, -0.019189834594726562, -0.016315460205078125, -0.013441085815429688, -0.01056671142578125, -0.0076923370361328125, -0.004817962646484375, -0.0019435882568359375, 0.0009307861328125, 0.0038051605224609375, 0.006679534912109375, 0.009553909301757812, 0.01242828369140625, 0.015302658081054688, 0.018177032470703125, 0.021051406860351562, 0.02392578125, 0.026800155639648438, 0.029674530029296875, 0.03254890441894531, 0.03542327880859375, 0.03829765319824219, 0.041172027587890625, 0.04404640197753906, 0.0469207763671875, 0.04979515075683594, 0.052669525146484375, 0.05554389953613281, 0.05841827392578125, 0.06129264831542969, 0.06416702270507812, 0.06704139709472656, 0.069915771484375, 0.07279014587402344, 0.07566452026367188, 0.07853889465332031, 0.08141326904296875, 0.08428764343261719, 0.08716201782226562, 0.09003639221191406, 0.0929107666015625, 0.09578514099121094, 0.09865951538085938, 0.10153388977050781, 0.10440826416015625, 0.10728263854980469, 0.11015701293945312, 0.11303138732910156, 0.11590576171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 5.0, 12.0, 20.0, 43.0, 159.0, 300.0, 257.0, 118.0, 35.0, 16.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5822391510009766e-05, -3.443937748670578e-05, -3.3056363463401794e-05, -3.167334944009781e-05, -3.0290335416793823e-05, -2.8907321393489838e-05, -2.7524307370185852e-05, -2.6141293346881866e-05, -2.475827932357788e-05, -2.3375265300273895e-05, -2.199225127696991e-05, -2.0609237253665924e-05, -1.922622323036194e-05, -1.7843209207057953e-05, -1.6460195183753967e-05, -1.5077181160449982e-05, -1.3694167137145996e-05, -1.231115311384201e-05, -1.0928139090538025e-05, -9.54512506723404e-06, -8.162111043930054e-06, -6.779097020626068e-06, -5.3960829973220825e-06, -4.013068974018097e-06, -2.6300549507141113e-06, -1.2470409274101257e-06, 1.3597309589385986e-07, 1.5189871191978455e-06, 2.902001142501831e-06, 4.285015165805817e-06, 5.668029189109802e-06, 7.051043212413788e-06, 8.434057235717773e-06, 9.817071259021759e-06, 1.1200085282325745e-05, 1.258309930562973e-05, 1.3966113328933716e-05, 1.53491273522377e-05, 1.6732141375541687e-05, 1.8115155398845673e-05, 1.9498169422149658e-05, 2.0881183445453644e-05, 2.226419746875763e-05, 2.3647211492061615e-05, 2.50302255153656e-05, 2.6413239538669586e-05, 2.7796253561973572e-05, 2.9179267585277557e-05, 3.056228160858154e-05, 3.194529563188553e-05, 3.3328309655189514e-05, 3.47113236784935e-05, 3.6094337701797485e-05, 3.747735172510147e-05, 3.8860365748405457e-05, 4.024337977170944e-05, 4.162639379501343e-05, 4.300940781831741e-05, 4.43924218416214e-05, 4.5775435864925385e-05, 4.715844988822937e-05, 4.8541463911533356e-05, 4.992447793483734e-05, 5.130749195814133e-05, 5.269050598144531e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 10.0, 11.0, 19.0, 18.0, 33.0, 63.0, 119.0, 310.0, 1176.0, 5384.0, 33584.0, 476827.0, 489041.0, 34598.0, 5569.0, 1168.0, 296.0, 110.0, 67.0, 47.0, 21.0, 16.0, 10.0, 6.0, 7.0, 8.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.107177734375, -0.10435771942138672, -0.10153770446777344, -0.09871768951416016, -0.09589767456054688, -0.0930776596069336, -0.09025764465332031, -0.08743762969970703, -0.08461761474609375, -0.08179759979248047, -0.07897758483886719, -0.0761575698852539, -0.07333755493164062, -0.07051753997802734, -0.06769752502441406, -0.06487751007080078, -0.0620574951171875, -0.05923748016357422, -0.05641746520996094, -0.053597450256347656, -0.050777435302734375, -0.047957420349121094, -0.04513740539550781, -0.04231739044189453, -0.03949737548828125, -0.03667736053466797, -0.03385734558105469, -0.031037330627441406, -0.028217315673828125, -0.025397300720214844, -0.022577285766601562, -0.01975727081298828, -0.016937255859375, -0.014117240905761719, -0.011297225952148438, -0.008477210998535156, -0.005657196044921875, -0.0028371810913085938, -1.71661376953125e-05, 0.0028028488159179688, 0.00562286376953125, 0.008442878723144531, 0.011262893676757812, 0.014082908630371094, 0.016902923583984375, 0.019722938537597656, 0.022542953491210938, 0.02536296844482422, 0.0281829833984375, 0.03100299835205078, 0.03382301330566406, 0.036643028259277344, 0.039463043212890625, 0.042283058166503906, 0.04510307312011719, 0.04792308807373047, 0.05074310302734375, 0.05356311798095703, 0.05638313293457031, 0.059203147888183594, 0.062023162841796875, 0.06484317779541016, 0.06766319274902344, 0.07048320770263672, 0.07330322265625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 12.0, 17.0, 14.0, 29.0, 21.0, 40.0, 39.0, 70.0, 60.0, 75.0, 113.0, 84.0, 80.0, 70.0, 67.0, 40.0, 30.0, 28.0, 34.0, 19.0, 11.0, 6.0, 9.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.033111572265625, -0.032111406326293945, -0.03111124038696289, -0.030111074447631836, -0.02911090850830078, -0.028110742568969727, -0.027110576629638672, -0.026110410690307617, -0.025110244750976562, -0.024110078811645508, -0.023109912872314453, -0.0221097469329834, -0.021109580993652344, -0.02010941505432129, -0.019109249114990234, -0.01810908317565918, -0.017108917236328125, -0.01610875129699707, -0.015108585357666016, -0.014108419418334961, -0.013108253479003906, -0.012108087539672852, -0.011107921600341797, -0.010107755661010742, -0.009107589721679688, -0.008107423782348633, -0.007107257843017578, -0.0061070919036865234, -0.005106925964355469, -0.004106760025024414, -0.0031065940856933594, -0.0021064281463623047, -0.00110626220703125, -0.00010609626770019531, 0.0008940696716308594, 0.001894235610961914, 0.0028944015502929688, 0.0038945674896240234, 0.004894733428955078, 0.005894899368286133, 0.0068950653076171875, 0.007895231246948242, 0.008895397186279297, 0.009895563125610352, 0.010895729064941406, 0.011895895004272461, 0.012896060943603516, 0.01389622688293457, 0.014896392822265625, 0.01589655876159668, 0.016896724700927734, 0.01789689064025879, 0.018897056579589844, 0.0198972225189209, 0.020897388458251953, 0.021897554397583008, 0.022897720336914062, 0.023897886276245117, 0.024898052215576172, 0.025898218154907227, 0.02689838409423828, 0.027898550033569336, 0.02889871597290039, 0.029898881912231445, 0.0308990478515625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 32.0, 195.0, 417.0, 289.0, 58.0, 11.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.580330729484558, -1.5491642951965332, -1.5179978609085083, -1.4868314266204834, -1.4556649923324585, -1.4244985580444336, -1.3933320045471191, -1.3621655702590942, -1.3309991359710693, -1.2998327016830444, -1.2686662673950195, -1.2374998331069946, -1.2063333988189697, -1.1751668453216553, -1.14400053024292, -1.1128339767456055, -1.0816676616668701, -1.0505012273788452, -1.0193347930908203, -0.9881683588027954, -0.9570018649101257, -0.9258354306221008, -0.8946689963340759, -0.863502562046051, -0.8323360681533813, -0.8011696338653564, -0.7700031995773315, -0.7388367652893066, -0.707670271396637, -0.6765038371086121, -0.6453374028205872, -0.6141709685325623, -0.5830044746398926, -0.5518380403518677, -0.5206716060638428, -0.4895051419734955, -0.4583386778831482, -0.4271722435951233, -0.3960058093070984, -0.3648393750190735, -0.3336729109287262, -0.3025064766407013, -0.271340012550354, -0.2401735782623291, -0.209007129073143, -0.1778406798839569, -0.146674245595932, -0.11550779640674591, -0.08434134721755981, -0.05317490175366402, -0.02200845628976822, 0.00915798544883728, 0.040324434638023376, 0.07149088382720947, 0.10265731811523438, 0.13382376730442047, 0.16499021649360657, 0.19615666568279266, 0.22732311487197876, 0.25848954916000366, 0.28965598344802856, 0.32082244753837585, 0.35198888182640076, 0.38315534591674805, 0.41432178020477295]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 9.0, 12.0, 13.0, 17.0, 12.0, 21.0, 18.0, 27.0, 33.0, 41.0, 34.0, 41.0, 42.0, 42.0, 42.0, 35.0, 44.0, 31.0, 32.0, 50.0, 40.0, 49.0, 37.0, 38.0, 30.0, 36.0, 16.0, 24.0, 20.0, 18.0, 9.0, 14.0, 8.0, 10.0, 14.0, 11.0, 10.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0], "bins": [-0.2713168263435364, -0.26379385590553284, -0.2562708854675293, -0.24874791502952576, -0.24122492969036102, -0.23370195925235748, -0.22617898881435394, -0.2186560183763504, -0.21113303303718567, -0.20361006259918213, -0.1960870921611786, -0.18856412172317505, -0.18104113638401031, -0.17351816594600677, -0.16599519550800323, -0.1584722250699997, -0.15094925463199615, -0.14342628419399261, -0.13590331375598907, -0.12838032841682434, -0.1208573579788208, -0.11333438754081726, -0.10581141710281372, -0.09828844666481018, -0.09076546877622604, -0.0832424983382225, -0.07571952044963837, -0.06819655001163483, -0.06067357584834099, -0.05315060168504715, -0.04562763124704361, -0.03810465708374977, -0.030581682920455933, -0.023058708757162094, -0.015535736456513405, -0.008012764155864716, -0.0004897899925708771, 0.007033184170722961, 0.014556154608726501, 0.02207912877202034, 0.02960210293531418, 0.03712507709860802, 0.044648051261901855, 0.052171021699905396, 0.059693995863199234, 0.06721697002649307, 0.07473994046449661, 0.08226291835308075, 0.08978588879108429, 0.09730885922908783, 0.10483183711767197, 0.1123548075556755, 0.11987778544425964, 0.12740075588226318, 0.13492372632026672, 0.14244669675827026, 0.1499696671962738, 0.15749263763427734, 0.16501560807228088, 0.17253857851028442, 0.18006156384944916, 0.1875845342874527, 0.19510750472545624, 0.20263047516345978, 0.2101534605026245]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 9.0, 9.0, 18.0, 37.0, 54.0, 70.0, 134.0, 224.0, 456.0, 905.0, 2384.0, 8410.0, 53574.0, 1293810.0, 2690956.0, 122830.0, 14588.0, 3543.0, 1182.0, 471.0, 252.0, 138.0, 76.0, 54.0, 25.0, 23.0, 11.0, 6.0, 10.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10699462890625, -0.1036672592163086, -0.10033988952636719, -0.09701251983642578, -0.09368515014648438, -0.09035778045654297, -0.08703041076660156, -0.08370304107666016, -0.08037567138671875, -0.07704830169677734, -0.07372093200683594, -0.07039356231689453, -0.06706619262695312, -0.06373882293701172, -0.06041145324707031, -0.057084083557128906, -0.0537567138671875, -0.050429344177246094, -0.04710197448730469, -0.04377460479736328, -0.040447235107421875, -0.03711986541748047, -0.03379249572753906, -0.030465126037597656, -0.02713775634765625, -0.023810386657714844, -0.020483016967773438, -0.01715564727783203, -0.013828277587890625, -0.010500907897949219, -0.0071735382080078125, -0.0038461685180664062, -0.000518798828125, 0.0028085708618164062, 0.0061359405517578125, 0.009463310241699219, 0.012790679931640625, 0.01611804962158203, 0.019445419311523438, 0.022772789001464844, 0.02610015869140625, 0.029427528381347656, 0.03275489807128906, 0.03608226776123047, 0.039409637451171875, 0.04273700714111328, 0.04606437683105469, 0.049391746520996094, 0.0527191162109375, 0.056046485900878906, 0.05937385559082031, 0.06270122528076172, 0.06602859497070312, 0.06935596466064453, 0.07268333435058594, 0.07601070404052734, 0.07933807373046875, 0.08266544342041016, 0.08599281311035156, 0.08932018280029297, 0.09264755249023438, 0.09597492218017578, 0.09930229187011719, 0.1026296615600586, 0.10595703125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 10.0, 13.0, 16.0, 22.0, 44.0, 65.0, 65.0, 82.0, 86.0, 94.0, 105.0, 102.0, 83.0, 62.0, 50.0, 35.0, 23.0, 21.0, 10.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08477783203125, -0.08234500885009766, -0.07991218566894531, -0.07747936248779297, -0.07504653930664062, -0.07261371612548828, -0.07018089294433594, -0.0677480697631836, -0.06531524658203125, -0.0628824234008789, -0.06044960021972656, -0.05801677703857422, -0.055583953857421875, -0.05315113067626953, -0.05071830749511719, -0.048285484313964844, -0.0458526611328125, -0.043419837951660156, -0.04098701477050781, -0.03855419158935547, -0.036121368408203125, -0.03368854522705078, -0.03125572204589844, -0.028822898864746094, -0.02639007568359375, -0.023957252502441406, -0.021524429321289062, -0.01909160614013672, -0.016658782958984375, -0.014225959777832031, -0.011793136596679688, -0.009360313415527344, -0.006927490234375, -0.004494667053222656, -0.0020618438720703125, 0.00037097930908203125, 0.002803802490234375, 0.005236625671386719, 0.0076694488525390625, 0.010102272033691406, 0.01253509521484375, 0.014967918395996094, 0.017400741577148438, 0.01983356475830078, 0.022266387939453125, 0.02469921112060547, 0.027132034301757812, 0.029564857482910156, 0.0319976806640625, 0.034430503845214844, 0.03686332702636719, 0.03929615020751953, 0.041728973388671875, 0.04416179656982422, 0.04659461975097656, 0.049027442932128906, 0.05146026611328125, 0.053893089294433594, 0.05632591247558594, 0.05875873565673828, 0.061191558837890625, 0.06362438201904297, 0.06605720520019531, 0.06849002838134766, 0.0709228515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 11.0, 8.0, 21.0, 29.0, 62.0, 109.0, 210.0, 422.0, 1032.0, 4002.0, 63795.0, 2590939.0, 1496631.0, 32578.0, 2882.0, 806.0, 364.0, 162.0, 101.0, 55.0, 30.0, 17.0, 12.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.142578125, -0.13780975341796875, -0.1330413818359375, -0.12827301025390625, -0.123504638671875, -0.11873626708984375, -0.1139678955078125, -0.10919952392578125, -0.10443115234375, -0.09966278076171875, -0.0948944091796875, -0.09012603759765625, -0.085357666015625, -0.08058929443359375, -0.0758209228515625, -0.07105255126953125, -0.0662841796875, -0.06151580810546875, -0.0567474365234375, -0.05197906494140625, -0.047210693359375, -0.04244232177734375, -0.0376739501953125, -0.03290557861328125, -0.02813720703125, -0.02336883544921875, -0.0186004638671875, -0.01383209228515625, -0.009063720703125, -0.00429534912109375, 0.0004730224609375, 0.00524139404296875, 0.010009765625, 0.01477813720703125, 0.0195465087890625, 0.02431488037109375, 0.029083251953125, 0.03385162353515625, 0.0386199951171875, 0.04338836669921875, 0.04815673828125, 0.05292510986328125, 0.0576934814453125, 0.06246185302734375, 0.067230224609375, 0.07199859619140625, 0.0767669677734375, 0.08153533935546875, 0.0863037109375, 0.09107208251953125, 0.0958404541015625, 0.10060882568359375, 0.105377197265625, 0.11014556884765625, 0.1149139404296875, 0.11968231201171875, 0.12445068359375, 0.12921905517578125, 0.1339874267578125, 0.13875579833984375, 0.143524169921875, 0.14829254150390625, 0.1530609130859375, 0.15782928466796875, 0.16259765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 10.0, 9.0, 24.0, 30.0, 38.0, 69.0, 91.0, 150.0, 211.0, 261.0, 340.0, 455.0, 461.0, 448.0, 412.0, 311.0, 254.0, 181.0, 99.0, 85.0, 38.0, 29.0, 20.0, 12.0, 12.0, 8.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07855224609375, -0.0762186050415039, -0.07388496398925781, -0.07155132293701172, -0.06921768188476562, -0.06688404083251953, -0.06455039978027344, -0.062216758728027344, -0.05988311767578125, -0.057549476623535156, -0.05521583557128906, -0.05288219451904297, -0.050548553466796875, -0.04821491241455078, -0.04588127136230469, -0.043547630310058594, -0.0412139892578125, -0.038880348205566406, -0.03654670715332031, -0.03421306610107422, -0.031879425048828125, -0.02954578399658203, -0.027212142944335938, -0.024878501892089844, -0.02254486083984375, -0.020211219787597656, -0.017877578735351562, -0.015543937683105469, -0.013210296630859375, -0.010876655578613281, -0.008543014526367188, -0.006209373474121094, -0.003875732421875, -0.0015420913696289062, 0.0007915496826171875, 0.0031251907348632812, 0.005458831787109375, 0.007792472839355469, 0.010126113891601562, 0.012459754943847656, 0.01479339599609375, 0.017127037048339844, 0.019460678100585938, 0.02179431915283203, 0.024127960205078125, 0.02646160125732422, 0.028795242309570312, 0.031128883361816406, 0.0334625244140625, 0.035796165466308594, 0.03812980651855469, 0.04046344757080078, 0.042797088623046875, 0.04513072967529297, 0.04746437072753906, 0.049798011779785156, 0.05213165283203125, 0.054465293884277344, 0.05679893493652344, 0.05913257598876953, 0.061466217041015625, 0.06379985809326172, 0.06613349914550781, 0.0684671401977539, 0.07080078125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 10.0, 36.0, 117.0, 276.0, 333.0, 171.0, 48.0, 13.0, 6.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.2687463760375977, -1.2457294464111328, -1.222712516784668, -1.1996957063674927, -1.1766787767410278, -1.153661847114563, -1.1306449174880981, -1.1076281070709229, -1.084611177444458, -1.0615942478179932, -1.0385773181915283, -1.015560507774353, -0.9925435781478882, -0.9695266485214233, -0.9465097188949585, -0.9234928488731384, -0.9004759192466736, -0.8774589896202087, -0.8544421195983887, -0.8314251899719238, -0.8084083199501038, -0.7853913903236389, -0.7623745203018188, -0.739357590675354, -0.7163406610488892, -0.6933237314224243, -0.6703068614006042, -0.6472899317741394, -0.6242730617523193, -0.6012561321258545, -0.5782392024993896, -0.5552223324775696, -0.5322054624557495, -0.5091885328292847, -0.4861716628074646, -0.46315473318099976, -0.4401378631591797, -0.41712093353271484, -0.3941040337085724, -0.37108713388442993, -0.3480702340602875, -0.325053334236145, -0.30203643441200256, -0.2790195345878601, -0.25600260496139526, -0.232985720038414, -0.20996880531311035, -0.1869519054889679, -0.16393500566482544, -0.14091810584068298, -0.11790119856595993, -0.09488429129123688, -0.07186739146709442, -0.048850491642951965, -0.025833576917648315, -0.0028166770935058594, 0.020200222730636597, 0.04321712628006935, 0.0662340298295021, 0.08925093710422516, 0.11226783692836761, 0.13528473675251007, 0.15830165147781372, 0.18131855130195618, 0.20433545112609863]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 11.0, 5.0, 13.0, 16.0, 17.0, 23.0, 29.0, 37.0, 38.0, 40.0, 34.0, 32.0, 49.0, 40.0, 50.0, 41.0, 37.0, 48.0, 46.0, 42.0, 50.0, 39.0, 47.0, 30.0, 39.0, 24.0, 20.0, 18.0, 19.0, 8.0, 13.0, 9.0, 7.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2681151032447815, -0.26059675216674805, -0.2530784010887146, -0.24556006491184235, -0.2380417287349701, -0.23052337765693665, -0.2230050265789032, -0.21548667550086975, -0.2079683393239975, -0.20044998824596405, -0.1929316520690918, -0.18541330099105835, -0.1778949499130249, -0.17037661373615265, -0.1628582626581192, -0.15533992648124695, -0.1478215754032135, -0.14030322432518005, -0.1327848881483078, -0.12526653707027435, -0.1177481934428215, -0.11022984981536865, -0.1027114987373352, -0.09519315510988235, -0.0876748114824295, -0.08015646785497665, -0.0726381242275238, -0.06511977314949036, -0.057601429522037506, -0.050083085894584656, -0.04256473854184151, -0.03504639118909836, -0.027528047561645508, -0.020009702071547508, -0.012491356581449509, -0.004973011091351509, 0.0025453343987464905, 0.01006367802619934, 0.01758202537894249, 0.02510037273168564, 0.03261871635913849, 0.04013705998659134, 0.04765540733933449, 0.05517375469207764, 0.06269209831953049, 0.07021044194698334, 0.07772879302501678, 0.08524713665246964, 0.09276548027992249, 0.10028382390737534, 0.10780216753482819, 0.11532051861286163, 0.12283886224031448, 0.13035720586776733, 0.13787555694580078, 0.14539390802383423, 0.15291224420070648, 0.16043059527873993, 0.16794893145561218, 0.17546728253364563, 0.18298563361167908, 0.19050396978855133, 0.19802232086658478, 0.20554065704345703, 0.21305900812149048]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 9.0, 10.0, 20.0, 42.0, 54.0, 80.0, 112.0, 195.0, 347.0, 713.0, 1669.0, 4227.0, 12585.0, 40164.0, 139926.0, 389784.0, 315565.0, 99090.0, 28934.0, 9139.0, 3224.0, 1256.0, 613.0, 300.0, 180.0, 99.0, 58.0, 42.0, 29.0, 21.0, 19.0, 12.0, 8.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.09939861297607422, -0.09583091735839844, -0.09226322174072266, -0.08869552612304688, -0.0851278305053711, -0.08156013488769531, -0.07799243927001953, -0.07442474365234375, -0.07085704803466797, -0.06728935241699219, -0.0637216567993164, -0.060153961181640625, -0.056586265563964844, -0.05301856994628906, -0.04945087432861328, -0.0458831787109375, -0.04231548309326172, -0.03874778747558594, -0.035180091857910156, -0.031612396240234375, -0.028044700622558594, -0.024477005004882812, -0.02090930938720703, -0.01734161376953125, -0.013773918151855469, -0.010206222534179688, -0.006638526916503906, -0.003070831298828125, 0.0004968643188476562, 0.0040645599365234375, 0.007632255554199219, 0.011199951171875, 0.014767646789550781, 0.018335342407226562, 0.021903038024902344, 0.025470733642578125, 0.029038429260253906, 0.03260612487792969, 0.03617382049560547, 0.03974151611328125, 0.04330921173095703, 0.04687690734863281, 0.050444602966308594, 0.054012298583984375, 0.057579994201660156, 0.06114768981933594, 0.06471538543701172, 0.0682830810546875, 0.07185077667236328, 0.07541847229003906, 0.07898616790771484, 0.08255386352539062, 0.0861215591430664, 0.08968925476074219, 0.09325695037841797, 0.09682464599609375, 0.10039234161376953, 0.10396003723144531, 0.1075277328491211, 0.11109542846679688, 0.11466312408447266, 0.11823081970214844, 0.12179851531982422, 0.1253662109375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 14.0, 20.0, 31.0, 54.0, 62.0, 73.0, 86.0, 113.0, 109.0, 95.0, 95.0, 82.0, 57.0, 42.0, 21.0, 19.0, 15.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0894775390625, -0.08694171905517578, -0.08440589904785156, -0.08187007904052734, -0.07933425903320312, -0.0767984390258789, -0.07426261901855469, -0.07172679901123047, -0.06919097900390625, -0.06665515899658203, -0.06411933898925781, -0.061583518981933594, -0.059047698974609375, -0.056511878967285156, -0.05397605895996094, -0.05144023895263672, -0.0489044189453125, -0.04636859893798828, -0.04383277893066406, -0.041296958923339844, -0.038761138916015625, -0.036225318908691406, -0.03368949890136719, -0.03115367889404297, -0.02861785888671875, -0.02608203887939453, -0.023546218872070312, -0.021010398864746094, -0.018474578857421875, -0.015938758850097656, -0.013402938842773438, -0.010867118835449219, -0.008331298828125, -0.005795478820800781, -0.0032596588134765625, -0.0007238388061523438, 0.001811981201171875, 0.004347801208496094, 0.0068836212158203125, 0.009419441223144531, 0.01195526123046875, 0.014491081237792969, 0.017026901245117188, 0.019562721252441406, 0.022098541259765625, 0.024634361267089844, 0.027170181274414062, 0.02970600128173828, 0.0322418212890625, 0.03477764129638672, 0.03731346130371094, 0.039849281311035156, 0.042385101318359375, 0.044920921325683594, 0.04745674133300781, 0.04999256134033203, 0.05252838134765625, 0.05506420135498047, 0.05760002136230469, 0.060135841369628906, 0.06267166137695312, 0.06520748138427734, 0.06774330139160156, 0.07027912139892578, 0.07281494140625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 4.0, 7.0, 3.0, 15.0, 14.0, 20.0, 33.0, 40.0, 54.0, 79.0, 118.0, 227.0, 516.0, 1114.0, 3052.0, 9675.0, 31187.0, 107322.0, 314981.0, 372717.0, 144823.0, 43203.0, 12670.0, 4035.0, 1385.0, 562.0, 243.0, 145.0, 94.0, 56.0, 36.0, 32.0, 21.0, 22.0, 13.0, 11.0, 9.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.135986328125, -0.13232421875, -0.128662109375, -0.125, -0.121337890625, -0.11767578125, -0.114013671875, -0.1103515625, -0.106689453125, -0.10302734375, -0.099365234375, -0.095703125, -0.092041015625, -0.08837890625, -0.084716796875, -0.0810546875, -0.077392578125, -0.07373046875, -0.070068359375, -0.06640625, -0.062744140625, -0.05908203125, -0.055419921875, -0.0517578125, -0.048095703125, -0.04443359375, -0.040771484375, -0.037109375, -0.033447265625, -0.02978515625, -0.026123046875, -0.0224609375, -0.018798828125, -0.01513671875, -0.011474609375, -0.0078125, -0.004150390625, -0.00048828125, 0.003173828125, 0.0068359375, 0.010498046875, 0.01416015625, 0.017822265625, 0.021484375, 0.025146484375, 0.02880859375, 0.032470703125, 0.0361328125, 0.039794921875, 0.04345703125, 0.047119140625, 0.05078125, 0.054443359375, 0.05810546875, 0.061767578125, 0.0654296875, 0.069091796875, 0.07275390625, 0.076416015625, 0.080078125, 0.083740234375, 0.08740234375, 0.091064453125, 0.0947265625, 0.098388671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 10.0, 7.0, 10.0, 7.0, 8.0, 12.0, 15.0, 16.0, 16.0, 35.0, 31.0, 32.0, 30.0, 35.0, 42.0, 40.0, 50.0, 35.0, 47.0, 47.0, 48.0, 47.0, 60.0, 42.0, 32.0, 38.0, 28.0, 27.0, 26.0, 18.0, 20.0, 17.0, 13.0, 17.0, 8.0, 10.0, 9.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08538818359375, -0.08251380920410156, -0.07963943481445312, -0.07676506042480469, -0.07389068603515625, -0.07101631164550781, -0.06814193725585938, -0.06526756286621094, -0.0623931884765625, -0.05951881408691406, -0.056644439697265625, -0.05377006530761719, -0.05089569091796875, -0.04802131652832031, -0.045146942138671875, -0.04227256774902344, -0.039398193359375, -0.03652381896972656, -0.033649444580078125, -0.030775070190429688, -0.02790069580078125, -0.025026321411132812, -0.022151947021484375, -0.019277572631835938, -0.0164031982421875, -0.013528823852539062, -0.010654449462890625, -0.0077800750732421875, -0.00490570068359375, -0.0020313262939453125, 0.000843048095703125, 0.0037174224853515625, 0.006591796875, 0.009466171264648438, 0.012340545654296875, 0.015214920043945312, 0.01808929443359375, 0.020963668823242188, 0.023838043212890625, 0.026712417602539062, 0.0295867919921875, 0.03246116638183594, 0.035335540771484375, 0.03820991516113281, 0.04108428955078125, 0.04395866394042969, 0.046833038330078125, 0.04970741271972656, 0.052581787109375, 0.05545616149902344, 0.058330535888671875, 0.06120491027832031, 0.06407928466796875, 0.06695365905761719, 0.06982803344726562, 0.07270240783691406, 0.0755767822265625, 0.07845115661621094, 0.08132553100585938, 0.08419990539550781, 0.08707427978515625, 0.08994865417480469, 0.09282302856445312, 0.09569740295410156, 0.09857177734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 9.0, 15.0, 19.0, 21.0, 30.0, 44.0, 70.0, 92.0, 145.0, 248.0, 444.0, 943.0, 2192.0, 6104.0, 21072.0, 99000.0, 412260.0, 387606.0, 89074.0, 19562.0, 5575.0, 1999.0, 891.0, 438.0, 234.0, 167.0, 94.0, 66.0, 41.0, 28.0, 26.0, 16.0, 11.0, 4.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07415771484375, -0.0717630386352539, -0.06936836242675781, -0.06697368621826172, -0.06457901000976562, -0.06218433380126953, -0.05978965759277344, -0.057394981384277344, -0.05500030517578125, -0.052605628967285156, -0.05021095275878906, -0.04781627655029297, -0.045421600341796875, -0.04302692413330078, -0.04063224792480469, -0.038237571716308594, -0.0358428955078125, -0.033448219299316406, -0.031053543090820312, -0.02865886688232422, -0.026264190673828125, -0.02386951446533203, -0.021474838256835938, -0.019080162048339844, -0.01668548583984375, -0.014290809631347656, -0.011896133422851562, -0.009501457214355469, -0.007106781005859375, -0.004712104797363281, -0.0023174285888671875, 7.724761962890625e-05, 0.002471923828125, 0.004866600036621094, 0.0072612762451171875, 0.009655952453613281, 0.012050628662109375, 0.014445304870605469, 0.016839981079101562, 0.019234657287597656, 0.02162933349609375, 0.024024009704589844, 0.026418685913085938, 0.02881336212158203, 0.031208038330078125, 0.03360271453857422, 0.03599739074707031, 0.038392066955566406, 0.0407867431640625, 0.043181419372558594, 0.04557609558105469, 0.04797077178955078, 0.050365447998046875, 0.05276012420654297, 0.05515480041503906, 0.057549476623535156, 0.05994415283203125, 0.062338829040527344, 0.06473350524902344, 0.06712818145751953, 0.06952285766601562, 0.07191753387451172, 0.07431221008300781, 0.0767068862915039, 0.0791015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 7.0, 13.0, 33.0, 111.0, 266.0, 291.0, 169.0, 52.0, 31.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2034854888916016e-05, -5.012284964323044e-05, -4.821084439754486e-05, -4.6298839151859283e-05, -4.4386833906173706e-05, -4.247482866048813e-05, -4.056282341480255e-05, -3.8650818169116974e-05, -3.6738812923431396e-05, -3.482680767774582e-05, -3.291480243206024e-05, -3.1002797186374664e-05, -2.9090791940689087e-05, -2.717878669500351e-05, -2.5266781449317932e-05, -2.3354776203632355e-05, -2.1442770957946777e-05, -1.95307657122612e-05, -1.7618760466575623e-05, -1.5706755220890045e-05, -1.3794749975204468e-05, -1.188274472951889e-05, -9.970739483833313e-06, -8.058734238147736e-06, -6.146728992462158e-06, -4.234723746776581e-06, -2.3227185010910034e-06, -4.10713255405426e-07, 1.5012919902801514e-06, 3.4132972359657288e-06, 5.325302481651306e-06, 7.2373077273368835e-06, 9.149312973022461e-06, 1.1061318218708038e-05, 1.2973323464393616e-05, 1.4885328710079193e-05, 1.679733395576477e-05, 1.8709339201450348e-05, 2.0621344447135925e-05, 2.2533349692821503e-05, 2.444535493850708e-05, 2.6357360184192657e-05, 2.8269365429878235e-05, 3.0181370675563812e-05, 3.209337592124939e-05, 3.400538116693497e-05, 3.5917386412620544e-05, 3.782939165830612e-05, 3.97413969039917e-05, 4.1653402149677277e-05, 4.3565407395362854e-05, 4.547741264104843e-05, 4.738941788673401e-05, 4.9301423132419586e-05, 5.1213428378105164e-05, 5.312543362379074e-05, 5.503743886947632e-05, 5.6949444115161896e-05, 5.886144936084747e-05, 6.077345460653305e-05, 6.268545985221863e-05, 6.45974650979042e-05, 6.650947034358978e-05, 6.842147558927536e-05, 7.033348083496094e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 7.0, 8.0, 10.0, 27.0, 21.0, 38.0, 62.0, 69.0, 118.0, 216.0, 421.0, 939.0, 2361.0, 6780.0, 21524.0, 83120.0, 298424.0, 414880.0, 160860.0, 40400.0, 11700.0, 3824.0, 1436.0, 571.0, 303.0, 141.0, 102.0, 71.0, 32.0, 24.0, 16.0, 18.0, 9.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.062469482421875, -0.060835838317871094, -0.05920219421386719, -0.05756855010986328, -0.055934906005859375, -0.05430126190185547, -0.05266761779785156, -0.051033973693847656, -0.04940032958984375, -0.047766685485839844, -0.04613304138183594, -0.04449939727783203, -0.042865753173828125, -0.04123210906982422, -0.03959846496582031, -0.037964820861816406, -0.0363311767578125, -0.034697532653808594, -0.03306388854980469, -0.03143024444580078, -0.029796600341796875, -0.02816295623779297, -0.026529312133789062, -0.024895668029785156, -0.02326202392578125, -0.021628379821777344, -0.019994735717773438, -0.01836109161376953, -0.016727447509765625, -0.015093803405761719, -0.013460159301757812, -0.011826515197753906, -0.01019287109375, -0.008559226989746094, -0.0069255828857421875, -0.005291938781738281, -0.003658294677734375, -0.0020246505737304688, -0.0003910064697265625, 0.0012426376342773438, 0.00287628173828125, 0.004509925842285156, 0.0061435699462890625, 0.007777214050292969, 0.009410858154296875, 0.011044502258300781, 0.012678146362304688, 0.014311790466308594, 0.0159454345703125, 0.017579078674316406, 0.019212722778320312, 0.02084636688232422, 0.022480010986328125, 0.02411365509033203, 0.025747299194335938, 0.027380943298339844, 0.02901458740234375, 0.030648231506347656, 0.03228187561035156, 0.03391551971435547, 0.035549163818359375, 0.03718280792236328, 0.03881645202636719, 0.040450096130371094, 0.042083740234375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 3.0, 7.0, 11.0, 10.0, 11.0, 13.0, 12.0, 17.0, 17.0, 23.0, 36.0, 43.0, 36.0, 46.0, 47.0, 62.0, 49.0, 56.0, 67.0, 50.0, 59.0, 56.0, 50.0, 38.0, 30.0, 32.0, 23.0, 22.0, 12.0, 16.0, 15.0, 9.0, 8.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.026153564453125, -0.025241851806640625, -0.02433013916015625, -0.023418426513671875, -0.0225067138671875, -0.021595001220703125, -0.02068328857421875, -0.019771575927734375, -0.01885986328125, -0.017948150634765625, -0.01703643798828125, -0.016124725341796875, -0.0152130126953125, -0.014301300048828125, -0.01338958740234375, -0.012477874755859375, -0.011566162109375, -0.010654449462890625, -0.00974273681640625, -0.008831024169921875, -0.0079193115234375, -0.007007598876953125, -0.00609588623046875, -0.005184173583984375, -0.0042724609375, -0.003360748291015625, -0.00244903564453125, -0.001537322998046875, -0.0006256103515625, 0.000286102294921875, 0.00119781494140625, 0.002109527587890625, 0.003021240234375, 0.003932952880859375, 0.00484466552734375, 0.005756378173828125, 0.0066680908203125, 0.007579803466796875, 0.00849151611328125, 0.009403228759765625, 0.01031494140625, 0.011226654052734375, 0.01213836669921875, 0.013050079345703125, 0.0139617919921875, 0.014873504638671875, 0.01578521728515625, 0.016696929931640625, 0.017608642578125, 0.018520355224609375, 0.01943206787109375, 0.020343780517578125, 0.0212554931640625, 0.022167205810546875, 0.02307891845703125, 0.023990631103515625, 0.02490234375, 0.025814056396484375, 0.02672576904296875, 0.027637481689453125, 0.0285491943359375, 0.029460906982421875, 0.03037261962890625, 0.031284332275390625, 0.032196044921875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 1.0, 11.0, 31.0, 67.0, 125.0, 180.0, 202.0, 199.0, 108.0, 47.0, 22.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24090297520160675, -0.22256381809711456, -0.20422464609146118, -0.185885488986969, -0.1675463318824768, -0.14920717477798462, -0.13086801767349243, -0.11252884566783905, -0.09418968856334686, -0.07585053145885468, -0.05751136690378189, -0.039172206073999405, -0.02083304524421692, -0.0024938881397247314, 0.015845276415348053, 0.03418444097042084, 0.052523598074913025, 0.07086275517940521, 0.089201919734478, 0.10754108428955078, 0.12588024139404297, 0.14421939849853516, 0.16255855560302734, 0.18089772760868073, 0.1992368847131729, 0.2175760418176651, 0.23591521382331848, 0.25425437092781067, 0.27259352803230286, 0.29093268513679504, 0.30927184224128723, 0.3276110291481018, 0.345950186252594, 0.3642893433570862, 0.38262850046157837, 0.40096765756607056, 0.41930681467056274, 0.43764597177505493, 0.4559851586818695, 0.4743243157863617, 0.4926634728908539, 0.5110026597976685, 0.5293418169021606, 0.5476809740066528, 0.566020131111145, 0.5843592882156372, 0.6026984453201294, 0.6210376024246216, 0.6393767595291138, 0.657715916633606, 0.6760550737380981, 0.6943942308425903, 0.7127333879470825, 0.7310725450515747, 0.7494117021560669, 0.7677508592605591, 0.7860900163650513, 0.8044291734695435, 0.8227683305740356, 0.8411074876785278, 0.85944664478302, 0.8777858018875122, 0.8961249589920044, 0.9144641160964966, 0.9328033328056335]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 5.0, 3.0, 13.0, 13.0, 7.0, 9.0, 17.0, 20.0, 16.0, 32.0, 23.0, 29.0, 30.0, 34.0, 46.0, 54.0, 37.0, 41.0, 44.0, 55.0, 49.0, 48.0, 47.0, 35.0, 31.0, 37.0, 35.0, 30.0, 30.0, 24.0, 18.0, 27.0, 13.0, 17.0, 11.0, 7.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.32587873935699463, -0.31643909215927124, -0.30699944496154785, -0.29755979776382446, -0.2881201207637787, -0.2786804735660553, -0.2692408263683319, -0.2598011791706085, -0.25036153197288513, -0.24092188477516174, -0.23148222267627716, -0.22204257547855377, -0.21260292828083038, -0.2031632661819458, -0.1937236189842224, -0.18428397178649902, -0.17484430968761444, -0.16540466248989105, -0.15596500039100647, -0.14652535319328308, -0.1370857059955597, -0.1276460587978363, -0.11820639669895172, -0.10876674950122833, -0.09932709485292435, -0.08988744020462036, -0.08044779300689697, -0.07100813835859299, -0.0615684874355793, -0.05212883651256561, -0.04268918186426163, -0.03324953466653824, -0.023809880018234253, -0.014370228163897991, -0.004930576309561729, 0.004509076476097107, 0.013948727399110794, 0.02338837832212448, 0.03282803297042847, 0.042267680168151855, 0.05170733481645584, 0.06114698573946953, 0.07058663666248322, 0.0800262913107872, 0.08946594595909119, 0.09890559315681458, 0.10834524780511856, 0.11778489500284195, 0.12722454965114594, 0.13666419684886932, 0.1461038589477539, 0.1555435061454773, 0.16498315334320068, 0.17442280054092407, 0.18386246263980865, 0.19330210983753204, 0.20274177193641663, 0.21218141913414001, 0.2216210812330246, 0.23106072843074799, 0.24050037562847137, 0.24994003772735596, 0.25937968492507935, 0.26881933212280273, 0.2782589793205261]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 8.0, 8.0, 21.0, 22.0, 29.0, 76.0, 130.0, 182.0, 308.0, 682.0, 2758.0, 50026.0, 3667938.0, 461935.0, 8143.0, 1122.0, 357.0, 207.0, 119.0, 72.0, 51.0, 33.0, 19.0, 9.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.194580078125, -0.1894207000732422, -0.18426132202148438, -0.17910194396972656, -0.17394256591796875, -0.16878318786621094, -0.16362380981445312, -0.1584644317626953, -0.1533050537109375, -0.1481456756591797, -0.14298629760742188, -0.13782691955566406, -0.13266754150390625, -0.12750816345214844, -0.12234878540039062, -0.11718940734863281, -0.112030029296875, -0.10687065124511719, -0.10171127319335938, -0.09655189514160156, -0.09139251708984375, -0.08623313903808594, -0.08107376098632812, -0.07591438293457031, -0.0707550048828125, -0.06559562683105469, -0.060436248779296875, -0.05527687072753906, -0.05011749267578125, -0.04495811462402344, -0.039798736572265625, -0.03463935852050781, -0.02947998046875, -0.024320602416992188, -0.019161224365234375, -0.014001846313476562, -0.00884246826171875, -0.0036830902099609375, 0.001476287841796875, 0.0066356658935546875, 0.0117950439453125, 0.016954421997070312, 0.022113800048828125, 0.027273178100585938, 0.03243255615234375, 0.03759193420410156, 0.042751312255859375, 0.04791069030761719, 0.053070068359375, 0.05822944641113281, 0.06338882446289062, 0.06854820251464844, 0.07370758056640625, 0.07886695861816406, 0.08402633666992188, 0.08918571472167969, 0.0943450927734375, 0.09950447082519531, 0.10466384887695312, 0.10982322692871094, 0.11498260498046875, 0.12014198303222656, 0.12530136108398438, 0.1304607391357422, 0.1356201171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 5.0, 11.0, 19.0, 27.0, 57.0, 52.0, 63.0, 79.0, 88.0, 101.0, 97.0, 88.0, 75.0, 68.0, 51.0, 44.0, 31.0, 14.0, 13.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0804443359375, -0.07806777954101562, -0.07569122314453125, -0.07331466674804688, -0.0709381103515625, -0.06856155395507812, -0.06618499755859375, -0.06380844116210938, -0.061431884765625, -0.059055328369140625, -0.05667877197265625, -0.054302215576171875, -0.0519256591796875, -0.049549102783203125, -0.04717254638671875, -0.044795989990234375, -0.04241943359375, -0.040042877197265625, -0.03766632080078125, -0.035289764404296875, -0.0329132080078125, -0.030536651611328125, -0.02816009521484375, -0.025783538818359375, -0.023406982421875, -0.021030426025390625, -0.01865386962890625, -0.016277313232421875, -0.0139007568359375, -0.011524200439453125, -0.00914764404296875, -0.006771087646484375, -0.00439453125, -0.002017974853515625, 0.00035858154296875, 0.002735137939453125, 0.0051116943359375, 0.007488250732421875, 0.00986480712890625, 0.012241363525390625, 0.014617919921875, 0.016994476318359375, 0.01937103271484375, 0.021747589111328125, 0.0241241455078125, 0.026500701904296875, 0.02887725830078125, 0.031253814697265625, 0.03363037109375, 0.036006927490234375, 0.03838348388671875, 0.040760040283203125, 0.0431365966796875, 0.045513153076171875, 0.04788970947265625, 0.050266265869140625, 0.052642822265625, 0.055019378662109375, 0.05739593505859375, 0.059772491455078125, 0.0621490478515625, 0.06452560424804688, 0.06690216064453125, 0.06927871704101562, 0.0716552734375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 11.0, 19.0, 23.0, 42.0, 69.0, 108.0, 170.0, 253.0, 414.0, 836.0, 2271.0, 11201.0, 126907.0, 1882932.0, 2012540.0, 140312.0, 11901.0, 2323.0, 805.0, 428.0, 260.0, 155.0, 101.0, 65.0, 34.0, 36.0, 24.0, 13.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09521484375, -0.09204292297363281, -0.08887100219726562, -0.08569908142089844, -0.08252716064453125, -0.07935523986816406, -0.07618331909179688, -0.07301139831542969, -0.0698394775390625, -0.06666755676269531, -0.06349563598632812, -0.06032371520996094, -0.05715179443359375, -0.05397987365722656, -0.050807952880859375, -0.04763603210449219, -0.044464111328125, -0.04129219055175781, -0.038120269775390625, -0.03494834899902344, -0.03177642822265625, -0.028604507446289062, -0.025432586669921875, -0.022260665893554688, -0.0190887451171875, -0.015916824340820312, -0.012744903564453125, -0.009572982788085938, -0.00640106201171875, -0.0032291412353515625, -5.7220458984375e-05, 0.0031147003173828125, 0.00628662109375, 0.009458541870117188, 0.012630462646484375, 0.015802383422851562, 0.01897430419921875, 0.022146224975585938, 0.025318145751953125, 0.028490066528320312, 0.0316619873046875, 0.03483390808105469, 0.038005828857421875, 0.04117774963378906, 0.04434967041015625, 0.04752159118652344, 0.050693511962890625, 0.05386543273925781, 0.057037353515625, 0.06020927429199219, 0.06338119506835938, 0.06655311584472656, 0.06972503662109375, 0.07289695739746094, 0.07606887817382812, 0.07924079895019531, 0.0824127197265625, 0.08558464050292969, 0.08875656127929688, 0.09192848205566406, 0.09510040283203125, 0.09827232360839844, 0.10144424438476562, 0.10461616516113281, 0.1077880859375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 10.0, 7.0, 16.0, 13.0, 29.0, 37.0, 60.0, 79.0, 126.0, 143.0, 182.0, 257.0, 315.0, 346.0, 381.0, 393.0, 385.0, 326.0, 256.0, 173.0, 167.0, 98.0, 88.0, 67.0, 40.0, 21.0, 19.0, 13.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049407958984375, -0.04756879806518555, -0.045729637145996094, -0.04389047622680664, -0.04205131530761719, -0.040212154388427734, -0.03837299346923828, -0.03653383255004883, -0.034694671630859375, -0.03285551071166992, -0.03101634979248047, -0.029177188873291016, -0.027338027954101562, -0.02549886703491211, -0.023659706115722656, -0.021820545196533203, -0.01998138427734375, -0.018142223358154297, -0.016303062438964844, -0.01446390151977539, -0.012624740600585938, -0.010785579681396484, -0.008946418762207031, -0.007107257843017578, -0.005268096923828125, -0.003428936004638672, -0.0015897750854492188, 0.0002493858337402344, 0.0020885467529296875, 0.003927707672119141, 0.005766868591308594, 0.007606029510498047, 0.0094451904296875, 0.011284351348876953, 0.013123512268066406, 0.01496267318725586, 0.016801834106445312, 0.018640995025634766, 0.02048015594482422, 0.022319316864013672, 0.024158477783203125, 0.025997638702392578, 0.02783679962158203, 0.029675960540771484, 0.03151512145996094, 0.03335428237915039, 0.035193443298339844, 0.0370326042175293, 0.03887176513671875, 0.0407109260559082, 0.042550086975097656, 0.04438924789428711, 0.04622840881347656, 0.048067569732666016, 0.04990673065185547, 0.05174589157104492, 0.053585052490234375, 0.05542421340942383, 0.05726337432861328, 0.059102535247802734, 0.06094169616699219, 0.06278085708618164, 0.0646200180053711, 0.06645917892456055, 0.06829833984375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 29.0, 37.0, 92.0, 174.0, 222.0, 183.0, 144.0, 78.0, 21.0, 13.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6508854627609253, -0.6363779306411743, -0.6218704581260681, -0.6073629856109619, -0.5928554534912109, -0.57834792137146, -0.5638404488563538, -0.5493329763412476, -0.5348254442214966, -0.5203179121017456, -0.5058104395866394, -0.4913029372692108, -0.4767954349517822, -0.46228793263435364, -0.44778043031692505, -0.43327292799949646, -0.41876542568206787, -0.4042579233646393, -0.3897504210472107, -0.3752429187297821, -0.3607354164123535, -0.3462279140949249, -0.33172041177749634, -0.31721290946006775, -0.30270540714263916, -0.28819790482521057, -0.273690402507782, -0.2591829001903534, -0.2446753978729248, -0.23016789555549622, -0.21566039323806763, -0.20115289092063904, -0.18664538860321045, -0.17213788628578186, -0.15763038396835327, -0.14312288165092468, -0.1286153793334961, -0.1141078770160675, -0.09960037469863892, -0.08509287238121033, -0.07058537006378174, -0.05607786774635315, -0.04157036542892456, -0.02706286311149597, -0.012555360794067383, 0.001952141523361206, 0.016459643840789795, 0.030967146158218384, 0.04547464847564697, 0.05998215079307556, 0.07448965311050415, 0.08899715542793274, 0.10350465774536133, 0.11801216006278992, 0.1325196623802185, 0.1470271646976471, 0.16153466701507568, 0.17604216933250427, 0.19054967164993286, 0.20505717396736145, 0.21956467628479004, 0.23407217860221863, 0.24857968091964722, 0.2630871832370758, 0.2775946855545044]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 14.0, 13.0, 20.0, 17.0, 19.0, 28.0, 20.0, 31.0, 34.0, 42.0, 42.0, 33.0, 38.0, 31.0, 48.0, 43.0, 50.0, 52.0, 45.0, 56.0, 29.0, 34.0, 38.0, 39.0, 31.0, 18.0, 29.0, 18.0, 15.0, 12.0, 10.0, 6.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186978280544281, -0.18026453256607056, -0.1735507845878601, -0.16683705151081085, -0.1601233035326004, -0.15340955555438995, -0.1466958224773407, -0.13998207449913025, -0.1332683265209198, -0.12655457854270935, -0.1198408380150795, -0.11312709748744965, -0.1064133495092392, -0.09969960153102875, -0.0929858610033989, -0.08627212047576904, -0.0795583724975586, -0.07284462451934814, -0.06613088399171829, -0.05941713973879814, -0.05270339548587799, -0.04598965123295784, -0.03927590698003769, -0.03256216272711754, -0.025848418474197388, -0.019134674221277237, -0.012420929968357086, -0.005707185715436935, 0.0010065585374832153, 0.007720302790403366, 0.014434047043323517, 0.021147791296243668, 0.02786153554916382, 0.03457527980208397, 0.04128902405500412, 0.04800276830792427, 0.05471651256084442, 0.06143025681376457, 0.06814400106668472, 0.07485774159431458, 0.08157148957252502, 0.08828523755073547, 0.09499897807836533, 0.10171271860599518, 0.10842646658420563, 0.11514021456241608, 0.12185395509004593, 0.12856769561767578, 0.13528144359588623, 0.14199519157409668, 0.14870893955230713, 0.15542267262935638, 0.16213642060756683, 0.16885016858577728, 0.17556390166282654, 0.182277649641037, 0.18899139761924744, 0.19570514559745789, 0.20241889357566833, 0.2091326266527176, 0.21584637463092804, 0.2225601226091385, 0.22927385568618774, 0.2359876036643982, 0.24270135164260864]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 2.0, 8.0, 10.0, 4.0, 12.0, 16.0, 22.0, 27.0, 54.0, 78.0, 119.0, 255.0, 401.0, 848.0, 1841.0, 4445.0, 11020.0, 30298.0, 100072.0, 324296.0, 380223.0, 132605.0, 38404.0, 13663.0, 5420.0, 2284.0, 1008.0, 465.0, 226.0, 152.0, 94.0, 57.0, 37.0, 29.0, 16.0, 11.0, 7.0, 6.0, 7.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10015869140625, -0.09671783447265625, -0.0932769775390625, -0.08983612060546875, -0.086395263671875, -0.08295440673828125, -0.0795135498046875, -0.07607269287109375, -0.0726318359375, -0.06919097900390625, -0.0657501220703125, -0.06230926513671875, -0.058868408203125, -0.05542755126953125, -0.0519866943359375, -0.04854583740234375, -0.04510498046875, -0.04166412353515625, -0.0382232666015625, -0.03478240966796875, -0.031341552734375, -0.02790069580078125, -0.0244598388671875, -0.02101898193359375, -0.017578125, -0.01413726806640625, -0.0106964111328125, -0.00725555419921875, -0.003814697265625, -0.00037384033203125, 0.0030670166015625, 0.00650787353515625, 0.00994873046875, 0.01338958740234375, 0.0168304443359375, 0.02027130126953125, 0.023712158203125, 0.02715301513671875, 0.0305938720703125, 0.03403472900390625, 0.0374755859375, 0.04091644287109375, 0.0443572998046875, 0.04779815673828125, 0.051239013671875, 0.05467987060546875, 0.0581207275390625, 0.06156158447265625, 0.06500244140625, 0.06844329833984375, 0.0718841552734375, 0.07532501220703125, 0.078765869140625, 0.08220672607421875, 0.0856475830078125, 0.08908843994140625, 0.092529296875, 0.09597015380859375, 0.0994110107421875, 0.10285186767578125, 0.106292724609375, 0.10973358154296875, 0.1131744384765625, 0.11661529541015625, 0.12005615234375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 10.0, 11.0, 22.0, 54.0, 54.0, 68.0, 73.0, 91.0, 97.0, 106.0, 94.0, 94.0, 62.0, 44.0, 42.0, 33.0, 14.0, 11.0, 9.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0810546875, -0.07867050170898438, -0.07628631591796875, -0.07390213012695312, -0.0715179443359375, -0.06913375854492188, -0.06674957275390625, -0.06436538696289062, -0.061981201171875, -0.059597015380859375, -0.05721282958984375, -0.054828643798828125, -0.0524444580078125, -0.050060272216796875, -0.04767608642578125, -0.045291900634765625, -0.04290771484375, -0.040523529052734375, -0.03813934326171875, -0.035755157470703125, -0.0333709716796875, -0.030986785888671875, -0.02860260009765625, -0.026218414306640625, -0.023834228515625, -0.021450042724609375, -0.01906585693359375, -0.016681671142578125, -0.0142974853515625, -0.011913299560546875, -0.00952911376953125, -0.007144927978515625, -0.0047607421875, -0.002376556396484375, 7.62939453125e-06, 0.002391815185546875, 0.0047760009765625, 0.007160186767578125, 0.00954437255859375, 0.011928558349609375, 0.014312744140625, 0.016696929931640625, 0.01908111572265625, 0.021465301513671875, 0.0238494873046875, 0.026233673095703125, 0.02861785888671875, 0.031002044677734375, 0.03338623046875, 0.035770416259765625, 0.03815460205078125, 0.040538787841796875, 0.0429229736328125, 0.045307159423828125, 0.04769134521484375, 0.050075531005859375, 0.052459716796875, 0.054843902587890625, 0.05722808837890625, 0.059612274169921875, 0.0619964599609375, 0.06438064575195312, 0.06676483154296875, 0.06914901733398438, 0.071533203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 5.0, 9.0, 6.0, 10.0, 16.0, 22.0, 23.0, 30.0, 45.0, 74.0, 105.0, 123.0, 232.0, 408.0, 892.0, 2207.0, 7614.0, 29222.0, 118819.0, 376145.0, 362746.0, 111376.0, 27379.0, 7015.0, 2119.0, 825.0, 402.0, 233.0, 139.0, 82.0, 49.0, 38.0, 31.0, 24.0, 14.0, 18.0, 14.0, 10.0, 10.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12493896484375, -0.1212615966796875, -0.117584228515625, -0.1139068603515625, -0.1102294921875, -0.1065521240234375, -0.102874755859375, -0.0991973876953125, -0.09552001953125, -0.0918426513671875, -0.088165283203125, -0.0844879150390625, -0.080810546875, -0.0771331787109375, -0.073455810546875, -0.0697784423828125, -0.06610107421875, -0.0624237060546875, -0.058746337890625, -0.0550689697265625, -0.0513916015625, -0.0477142333984375, -0.044036865234375, -0.0403594970703125, -0.03668212890625, -0.0330047607421875, -0.029327392578125, -0.0256500244140625, -0.02197265625, -0.0182952880859375, -0.014617919921875, -0.0109405517578125, -0.00726318359375, -0.0035858154296875, 9.1552734375e-05, 0.0037689208984375, 0.0074462890625, 0.0111236572265625, 0.014801025390625, 0.0184783935546875, 0.02215576171875, 0.0258331298828125, 0.029510498046875, 0.0331878662109375, 0.036865234375, 0.0405426025390625, 0.044219970703125, 0.0478973388671875, 0.05157470703125, 0.0552520751953125, 0.058929443359375, 0.0626068115234375, 0.0662841796875, 0.0699615478515625, 0.073638916015625, 0.0773162841796875, 0.08099365234375, 0.0846710205078125, 0.088348388671875, 0.0920257568359375, 0.095703125, 0.0993804931640625, 0.103057861328125, 0.1067352294921875, 0.11041259765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 10.0, 4.0, 8.0, 8.0, 11.0, 18.0, 15.0, 12.0, 12.0, 18.0, 22.0, 18.0, 27.0, 22.0, 29.0, 43.0, 33.0, 43.0, 43.0, 37.0, 32.0, 29.0, 36.0, 29.0, 35.0, 41.0, 36.0, 31.0, 30.0, 32.0, 42.0, 27.0, 22.0, 24.0, 20.0, 16.0, 12.0, 16.0, 9.0, 8.0, 9.0, 2.0, 8.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.08502197265625, -0.08223438262939453, -0.07944679260253906, -0.0766592025756836, -0.07387161254882812, -0.07108402252197266, -0.06829643249511719, -0.06550884246826172, -0.06272125244140625, -0.05993366241455078, -0.05714607238769531, -0.054358482360839844, -0.051570892333984375, -0.048783302307128906, -0.04599571228027344, -0.04320812225341797, -0.0404205322265625, -0.03763294219970703, -0.03484535217285156, -0.032057762145996094, -0.029270172119140625, -0.026482582092285156, -0.023694992065429688, -0.02090740203857422, -0.01811981201171875, -0.015332221984863281, -0.012544631958007812, -0.009757041931152344, -0.006969451904296875, -0.004181861877441406, -0.0013942718505859375, 0.0013933181762695312, 0.004180908203125, 0.006968498229980469, 0.009756088256835938, 0.012543678283691406, 0.015331268310546875, 0.018118858337402344, 0.020906448364257812, 0.02369403839111328, 0.02648162841796875, 0.02926921844482422, 0.03205680847167969, 0.034844398498535156, 0.037631988525390625, 0.040419578552246094, 0.04320716857910156, 0.04599475860595703, 0.0487823486328125, 0.05156993865966797, 0.05435752868652344, 0.057145118713378906, 0.059932708740234375, 0.06272029876708984, 0.06550788879394531, 0.06829547882080078, 0.07108306884765625, 0.07387065887451172, 0.07665824890136719, 0.07944583892822266, 0.08223342895507812, 0.0850210189819336, 0.08780860900878906, 0.09059619903564453, 0.0933837890625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 3.0, 13.0, 18.0, 21.0, 36.0, 48.0, 72.0, 147.0, 256.0, 521.0, 1051.0, 2141.0, 4210.0, 8675.0, 18622.0, 41917.0, 97393.0, 210256.0, 288970.0, 205290.0, 94027.0, 40163.0, 17854.0, 8422.0, 4258.0, 2018.0, 1039.0, 502.0, 252.0, 123.0, 73.0, 55.0, 38.0, 14.0, 15.0, 8.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.025909423828125, -0.024999618530273438, -0.024089813232421875, -0.023180007934570312, -0.02227020263671875, -0.021360397338867188, -0.020450592041015625, -0.019540786743164062, -0.0186309814453125, -0.017721176147460938, -0.016811370849609375, -0.015901565551757812, -0.01499176025390625, -0.014081954956054688, -0.013172149658203125, -0.012262344360351562, -0.0113525390625, -0.010442733764648438, -0.009532928466796875, -0.008623123168945312, -0.00771331787109375, -0.0068035125732421875, -0.005893707275390625, -0.0049839019775390625, -0.0040740966796875, -0.0031642913818359375, -0.002254486083984375, -0.0013446807861328125, -0.00043487548828125, 0.0004749298095703125, 0.001384735107421875, 0.0022945404052734375, 0.003204345703125, 0.0041141510009765625, 0.005023956298828125, 0.0059337615966796875, 0.00684356689453125, 0.0077533721923828125, 0.008663177490234375, 0.009572982788085938, 0.0104827880859375, 0.011392593383789062, 0.012302398681640625, 0.013212203979492188, 0.01412200927734375, 0.015031814575195312, 0.015941619873046875, 0.016851425170898438, 0.01776123046875, 0.018671035766601562, 0.019580841064453125, 0.020490646362304688, 0.02140045166015625, 0.022310256958007812, 0.023220062255859375, 0.024129867553710938, 0.0250396728515625, 0.025949478149414062, 0.026859283447265625, 0.027769088745117188, 0.02867889404296875, 0.029588699340820312, 0.030498504638671875, 0.03140830993652344, 0.032318115234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 11.0, 7.0, 9.0, 14.0, 10.0, 23.0, 28.0, 29.0, 27.0, 33.0, 50.0, 47.0, 67.0, 50.0, 65.0, 51.0, 51.0, 76.0, 42.0, 62.0, 43.0, 29.0, 30.0, 25.0, 24.0, 16.0, 15.0, 13.0, 12.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.106231689453125e-06, -7.841736078262329e-06, -7.577240467071533e-06, -7.312744855880737e-06, -7.048249244689941e-06, -6.7837536334991455e-06, -6.51925802230835e-06, -6.254762411117554e-06, -5.990266799926758e-06, -5.725771188735962e-06, -5.461275577545166e-06, -5.19677996635437e-06, -4.932284355163574e-06, -4.667788743972778e-06, -4.403293132781982e-06, -4.1387975215911865e-06, -3.874301910400391e-06, -3.6098062992095947e-06, -3.345310688018799e-06, -3.080815076828003e-06, -2.816319465637207e-06, -2.551823854446411e-06, -2.2873282432556152e-06, -2.0228326320648193e-06, -1.7583370208740234e-06, -1.4938414096832275e-06, -1.2293457984924316e-06, -9.648501873016357e-07, -7.003545761108398e-07, -4.3585896492004395e-07, -1.7136335372924805e-07, 9.313225746154785e-08, 3.5762786865234375e-07, 6.221234798431396e-07, 8.866190910339355e-07, 1.1511147022247314e-06, 1.4156103134155273e-06, 1.6801059246063232e-06, 1.944601535797119e-06, 2.209097146987915e-06, 2.473592758178711e-06, 2.738088369369507e-06, 3.0025839805603027e-06, 3.2670795917510986e-06, 3.5315752029418945e-06, 3.7960708141326904e-06, 4.060566425323486e-06, 4.325062036514282e-06, 4.589557647705078e-06, 4.854053258895874e-06, 5.11854887008667e-06, 5.383044481277466e-06, 5.647540092468262e-06, 5.912035703659058e-06, 6.1765313148498535e-06, 6.441026926040649e-06, 6.705522537231445e-06, 6.970018148422241e-06, 7.234513759613037e-06, 7.499009370803833e-06, 7.763504981994629e-06, 8.028000593185425e-06, 8.29249620437622e-06, 8.556991815567017e-06, 8.821487426757812e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 17.0, 15.0, 22.0, 35.0, 29.0, 51.0, 76.0, 108.0, 134.0, 246.0, 436.0, 795.0, 1521.0, 3479.0, 7593.0, 18834.0, 50258.0, 136749.0, 287026.0, 298989.0, 150764.0, 54926.0, 20797.0, 8291.0, 3542.0, 1739.0, 858.0, 433.0, 269.0, 145.0, 96.0, 66.0, 58.0, 37.0, 34.0, 28.0, 12.0, 12.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0296173095703125, -0.02866339683532715, -0.027709484100341797, -0.026755571365356445, -0.025801658630371094, -0.024847745895385742, -0.02389383316040039, -0.02293992042541504, -0.021986007690429688, -0.021032094955444336, -0.020078182220458984, -0.019124269485473633, -0.01817035675048828, -0.01721644401550293, -0.016262531280517578, -0.015308618545532227, -0.014354705810546875, -0.013400793075561523, -0.012446880340576172, -0.01149296760559082, -0.010539054870605469, -0.009585142135620117, -0.008631229400634766, -0.007677316665649414, -0.0067234039306640625, -0.005769491195678711, -0.004815578460693359, -0.003861665725708008, -0.0029077529907226562, -0.0019538402557373047, -0.0009999275207519531, -4.601478576660156e-05, 0.00090789794921875, 0.0018618106842041016, 0.002815723419189453, 0.0037696361541748047, 0.004723548889160156, 0.005677461624145508, 0.006631374359130859, 0.007585287094116211, 0.008539199829101562, 0.009493112564086914, 0.010447025299072266, 0.011400938034057617, 0.012354850769042969, 0.01330876350402832, 0.014262676239013672, 0.015216588973999023, 0.016170501708984375, 0.017124414443969727, 0.018078327178955078, 0.01903223991394043, 0.01998615264892578, 0.020940065383911133, 0.021893978118896484, 0.022847890853881836, 0.023801803588867188, 0.02475571632385254, 0.02570962905883789, 0.026663541793823242, 0.027617454528808594, 0.028571367263793945, 0.029525279998779297, 0.03047919273376465, 0.03143310546875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 5.0, 11.0, 12.0, 10.0, 15.0, 15.0, 17.0, 21.0, 29.0, 21.0, 31.0, 36.0, 46.0, 37.0, 52.0, 52.0, 57.0, 63.0, 48.0, 44.0, 69.0, 56.0, 40.0, 28.0, 31.0, 32.0, 24.0, 24.0, 5.0, 13.0, 11.0, 7.0, 12.0, 6.0, 7.0, 5.0, 1.0, 6.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0216827392578125, -0.020970821380615234, -0.02025890350341797, -0.019546985626220703, -0.018835067749023438, -0.018123149871826172, -0.017411231994628906, -0.01669931411743164, -0.015987396240234375, -0.01527547836303711, -0.014563560485839844, -0.013851642608642578, -0.013139724731445312, -0.012427806854248047, -0.011715888977050781, -0.011003971099853516, -0.01029205322265625, -0.009580135345458984, -0.008868217468261719, -0.008156299591064453, -0.0074443817138671875, -0.006732463836669922, -0.006020545959472656, -0.005308628082275391, -0.004596710205078125, -0.0038847923278808594, -0.0031728744506835938, -0.002460956573486328, -0.0017490386962890625, -0.0010371208190917969, -0.00032520294189453125, 0.0003867149353027344, 0.0010986328125, 0.0018105506896972656, 0.0025224685668945312, 0.003234386444091797, 0.0039463043212890625, 0.004658222198486328, 0.005370140075683594, 0.006082057952880859, 0.006793975830078125, 0.007505893707275391, 0.008217811584472656, 0.008929729461669922, 0.009641647338867188, 0.010353565216064453, 0.011065483093261719, 0.011777400970458984, 0.01248931884765625, 0.013201236724853516, 0.013913154602050781, 0.014625072479248047, 0.015336990356445312, 0.016048908233642578, 0.016760826110839844, 0.01747274398803711, 0.018184661865234375, 0.01889657974243164, 0.019608497619628906, 0.020320415496826172, 0.021032333374023438, 0.021744251251220703, 0.02245616912841797, 0.023168087005615234, 0.0238800048828125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 32.0, 155.0, 341.0, 311.0, 136.0, 23.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.8679152727127075, -1.8333016633987427, -1.7986879348754883, -1.7640743255615234, -1.729460597038269, -1.6948469877243042, -1.6602332592010498, -1.625619649887085, -1.5910060405731201, -1.5563924312591553, -1.5217787027359009, -1.487165093421936, -1.4525513648986816, -1.4179377555847168, -1.3833240270614624, -1.3487104177474976, -1.3140966892242432, -1.2794830799102783, -1.244869351387024, -1.210255742073059, -1.1756420135498047, -1.1410284042358398, -1.1064146757125854, -1.0718010663986206, -1.0371873378753662, -1.0025737285614014, -0.967960000038147, -0.9333463311195374, -0.8987326622009277, -0.8641190528869629, -0.8295053839683533, -0.7948917150497437, -0.7602779865264893, -0.7256643176078796, -0.69105064868927, -0.6564369797706604, -0.6218233108520508, -0.5872097015380859, -0.5525960326194763, -0.5179823637008667, -0.4833686947822571, -0.44875502586364746, -0.41414135694503784, -0.3795277178287506, -0.344914048910141, -0.31030037999153137, -0.27568674087524414, -0.24107307195663452, -0.2064594030380249, -0.17184573411941528, -0.13723208010196686, -0.10261841863393784, -0.06800475716590881, -0.033391088247299194, 0.001222565770149231, 0.035836219787597656, 0.07044988870620728, 0.1050635501742363, 0.13967721164226532, 0.17429086565971375, 0.20890453457832336, 0.24351820349693298, 0.2781318426132202, 0.31274551153182983, 0.34735918045043945]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 2.0, 4.0, 6.0, 8.0, 8.0, 14.0, 16.0, 18.0, 17.0, 22.0, 18.0, 20.0, 45.0, 35.0, 26.0, 41.0, 35.0, 41.0, 46.0, 38.0, 43.0, 46.0, 43.0, 45.0, 36.0, 33.0, 25.0, 36.0, 36.0, 28.0, 26.0, 18.0, 26.0, 26.0, 12.0, 15.0, 15.0, 11.0, 7.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.33069419860839844, -0.3213156759738922, -0.311937153339386, -0.30255863070487976, -0.29318010807037354, -0.2838015854358673, -0.2744230628013611, -0.26504454016685486, -0.25566601753234863, -0.2462874948978424, -0.23690897226333618, -0.22753044962882996, -0.21815192699432373, -0.2087734043598175, -0.19939488172531128, -0.19001635909080505, -0.18063785135746002, -0.1712593287229538, -0.16188080608844757, -0.15250228345394135, -0.14312376081943512, -0.1337452381849289, -0.12436672300100327, -0.11498820036649704, -0.10560967773199081, -0.09623115509748459, -0.08685263246297836, -0.07747411727905273, -0.06809559464454651, -0.058717068284749985, -0.04933854937553406, -0.03996002674102783, -0.030581504106521606, -0.02120298147201538, -0.011824460700154305, -0.002445939928293228, 0.0069325827062129974, 0.016311105340719223, 0.02568962424993515, 0.035068146884441376, 0.0444466695189476, 0.05382519215345383, 0.06320371478796005, 0.07258222997188568, 0.0819607526063919, 0.09133927524089813, 0.10071779787540436, 0.11009632050991058, 0.11947484314441681, 0.12885336577892303, 0.13823188841342926, 0.14761041104793549, 0.1569889336824417, 0.16636745631694794, 0.17574596405029297, 0.1851244866847992, 0.19450300931930542, 0.20388153195381165, 0.21326005458831787, 0.2226385772228241, 0.23201709985733032, 0.24139562249183655, 0.2507741451263428, 0.260152667760849, 0.2695311903953552]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 2.0, 7.0, 9.0, 19.0, 27.0, 36.0, 68.0, 105.0, 183.0, 312.0, 613.0, 1610.0, 5369.0, 32016.0, 436860.0, 3147273.0, 524141.0, 36395.0, 6443.0, 1658.0, 599.0, 262.0, 108.0, 65.0, 37.0, 27.0, 13.0, 9.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1026611328125, -0.09977149963378906, -0.09688186645507812, -0.09399223327636719, -0.09110260009765625, -0.08821296691894531, -0.08532333374023438, -0.08243370056152344, -0.0795440673828125, -0.07665443420410156, -0.07376480102539062, -0.07087516784667969, -0.06798553466796875, -0.06509590148925781, -0.062206268310546875, -0.05931663513183594, -0.056427001953125, -0.05353736877441406, -0.050647735595703125, -0.04775810241699219, -0.04486846923828125, -0.04197883605957031, -0.039089202880859375, -0.03619956970214844, -0.0333099365234375, -0.030420303344726562, -0.027530670166015625, -0.024641036987304688, -0.02175140380859375, -0.018861770629882812, -0.015972137451171875, -0.013082504272460938, -0.01019287109375, -0.0073032379150390625, -0.004413604736328125, -0.0015239715576171875, 0.00136566162109375, 0.0042552947998046875, 0.007144927978515625, 0.010034561157226562, 0.0129241943359375, 0.015813827514648438, 0.018703460693359375, 0.021593093872070312, 0.02448272705078125, 0.027372360229492188, 0.030261993408203125, 0.03315162658691406, 0.036041259765625, 0.03893089294433594, 0.041820526123046875, 0.04471015930175781, 0.04759979248046875, 0.05048942565917969, 0.053379058837890625, 0.05626869201660156, 0.0591583251953125, 0.06204795837402344, 0.06493759155273438, 0.06782722473144531, 0.07071685791015625, 0.07360649108886719, 0.07649612426757812, 0.07938575744628906, 0.082275390625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 5.0, 2.0, 16.0, 22.0, 36.0, 40.0, 48.0, 56.0, 71.0, 81.0, 82.0, 82.0, 68.0, 66.0, 86.0, 58.0, 45.0, 39.0, 32.0, 18.0, 17.0, 9.0, 6.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06744384765625, -0.06548452377319336, -0.06352519989013672, -0.06156587600708008, -0.05960655212402344, -0.0576472282409668, -0.055687904357910156, -0.053728580474853516, -0.051769256591796875, -0.049809932708740234, -0.047850608825683594, -0.04589128494262695, -0.04393196105957031, -0.04197263717651367, -0.04001331329345703, -0.03805398941040039, -0.03609466552734375, -0.03413534164428711, -0.03217601776123047, -0.030216693878173828, -0.028257369995117188, -0.026298046112060547, -0.024338722229003906, -0.022379398345947266, -0.020420074462890625, -0.018460750579833984, -0.016501426696777344, -0.014542102813720703, -0.012582778930664062, -0.010623455047607422, -0.008664131164550781, -0.006704807281494141, -0.0047454833984375, -0.0027861595153808594, -0.0008268356323242188, 0.0011324882507324219, 0.0030918121337890625, 0.005051136016845703, 0.007010459899902344, 0.008969783782958984, 0.010929107666015625, 0.012888431549072266, 0.014847755432128906, 0.016807079315185547, 0.018766403198242188, 0.020725727081298828, 0.02268505096435547, 0.02464437484741211, 0.02660369873046875, 0.02856302261352539, 0.03052234649658203, 0.03248167037963867, 0.03444099426269531, 0.03640031814575195, 0.038359642028808594, 0.040318965911865234, 0.042278289794921875, 0.044237613677978516, 0.046196937561035156, 0.0481562614440918, 0.05011558532714844, 0.05207490921020508, 0.05403423309326172, 0.05599355697631836, 0.057952880859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 9.0, 4.0, 5.0, 16.0, 16.0, 24.0, 31.0, 39.0, 61.0, 84.0, 106.0, 165.0, 260.0, 457.0, 887.0, 2982.0, 16348.0, 148826.0, 1686839.0, 2104958.0, 204843.0, 21304.0, 3672.0, 1017.0, 461.0, 255.0, 180.0, 124.0, 85.0, 64.0, 44.0, 25.0, 26.0, 18.0, 20.0, 9.0, 3.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0758056640625, -0.07300472259521484, -0.07020378112792969, -0.06740283966064453, -0.06460189819335938, -0.06180095672607422, -0.05900001525878906, -0.056199073791503906, -0.05339813232421875, -0.050597190856933594, -0.04779624938964844, -0.04499530792236328, -0.042194366455078125, -0.03939342498779297, -0.03659248352050781, -0.033791542053222656, -0.0309906005859375, -0.028189659118652344, -0.025388717651367188, -0.02258777618408203, -0.019786834716796875, -0.01698589324951172, -0.014184951782226562, -0.011384010314941406, -0.00858306884765625, -0.005782127380371094, -0.0029811859130859375, -0.00018024444580078125, 0.002620697021484375, 0.005421638488769531, 0.008222579956054688, 0.011023521423339844, 0.013824462890625, 0.016625404357910156, 0.019426345825195312, 0.02222728729248047, 0.025028228759765625, 0.02782917022705078, 0.030630111694335938, 0.033431053161621094, 0.03623199462890625, 0.039032936096191406, 0.04183387756347656, 0.04463481903076172, 0.047435760498046875, 0.05023670196533203, 0.05303764343261719, 0.055838584899902344, 0.0586395263671875, 0.061440467834472656, 0.06424140930175781, 0.06704235076904297, 0.06984329223632812, 0.07264423370361328, 0.07544517517089844, 0.0782461166381836, 0.08104705810546875, 0.0838479995727539, 0.08664894104003906, 0.08944988250732422, 0.09225082397460938, 0.09505176544189453, 0.09785270690917969, 0.10065364837646484, 0.10345458984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 2.0, 8.0, 15.0, 19.0, 41.0, 42.0, 63.0, 66.0, 97.0, 119.0, 174.0, 166.0, 255.0, 258.0, 307.0, 367.0, 377.0, 315.0, 287.0, 245.0, 220.0, 139.0, 117.0, 89.0, 78.0, 53.0, 33.0, 28.0, 19.0, 14.0, 19.0, 6.0, 9.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0513916015625, -0.04992198944091797, -0.04845237731933594, -0.046982765197753906, -0.045513153076171875, -0.044043540954589844, -0.04257392883300781, -0.04110431671142578, -0.03963470458984375, -0.03816509246826172, -0.03669548034667969, -0.035225868225097656, -0.033756256103515625, -0.032286643981933594, -0.030817031860351562, -0.02934741973876953, -0.0278778076171875, -0.02640819549560547, -0.024938583374023438, -0.023468971252441406, -0.021999359130859375, -0.020529747009277344, -0.019060134887695312, -0.01759052276611328, -0.01612091064453125, -0.014651298522949219, -0.013181686401367188, -0.011712074279785156, -0.010242462158203125, -0.008772850036621094, -0.0073032379150390625, -0.005833625793457031, -0.004364013671875, -0.0028944015502929688, -0.0014247894287109375, 4.482269287109375e-05, 0.001514434814453125, 0.0029840469360351562, 0.0044536590576171875, 0.005923271179199219, 0.00739288330078125, 0.008862495422363281, 0.010332107543945312, 0.011801719665527344, 0.013271331787109375, 0.014740943908691406, 0.016210556030273438, 0.01768016815185547, 0.0191497802734375, 0.02061939239501953, 0.022089004516601562, 0.023558616638183594, 0.025028228759765625, 0.026497840881347656, 0.027967453002929688, 0.02943706512451172, 0.03090667724609375, 0.03237628936767578, 0.03384590148925781, 0.035315513610839844, 0.036785125732421875, 0.038254737854003906, 0.03972434997558594, 0.04119396209716797, 0.04266357421875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 13.0, 17.0, 58.0, 130.0, 239.0, 242.0, 174.0, 83.0, 35.0, 12.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7170203924179077, -0.6996951699256897, -0.6823700070381165, -0.6650447845458984, -0.6477196216583252, -0.6303943991661072, -0.6130692362785339, -0.5957440137863159, -0.5784188508987427, -0.5610936284065247, -0.5437684655189514, -0.5264432430267334, -0.5091180801391602, -0.4917928874492645, -0.4744676947593689, -0.4571424722671509, -0.43981727957725525, -0.4224920868873596, -0.405166894197464, -0.38784170150756836, -0.37051650881767273, -0.3531913161277771, -0.3358660936355591, -0.31854093074798584, -0.3012157082557678, -0.2838905155658722, -0.26656532287597656, -0.24924013018608093, -0.2319149374961853, -0.21458974480628967, -0.19726453721523285, -0.17993934452533722, -0.16261416673660278, -0.14528897404670715, -0.12796378135681152, -0.1106385812163353, -0.09331338852643967, -0.07598819583654404, -0.05866299569606781, -0.04133780300617218, -0.02401261031627655, -0.006687415763735771, 0.010637778788805008, 0.027962975203990936, 0.045288167893886566, 0.0626133605837822, 0.07993856072425842, 0.09726375341415405, 0.11458894610404968, 0.1319141387939453, 0.14923933148384094, 0.16656452417373657, 0.1838897168636322, 0.20121490955352783, 0.21854011714458466, 0.23586530983448029, 0.2531905174255371, 0.27051571011543274, 0.28784090280532837, 0.305166095495224, 0.32249128818511963, 0.33981648087501526, 0.3571416735649109, 0.3744668960571289, 0.39179205894470215]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 7.0, 9.0, 9.0, 5.0, 7.0, 9.0, 8.0, 20.0, 20.0, 13.0, 21.0, 24.0, 28.0, 30.0, 19.0, 43.0, 32.0, 35.0, 30.0, 47.0, 33.0, 43.0, 34.0, 40.0, 41.0, 41.0, 28.0, 33.0, 28.0, 40.0, 28.0, 32.0, 23.0, 20.0, 21.0, 18.0, 16.0, 9.0, 10.0, 11.0, 6.0, 11.0, 4.0, 5.0, 4.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.15804046392440796, -0.1530129611492157, -0.14798545837402344, -0.14295795559883118, -0.13793045282363892, -0.13290293514728546, -0.1278754323720932, -0.12284792959690094, -0.11782042682170868, -0.11279292404651642, -0.10776542127132416, -0.1027379110455513, -0.09771040827035904, -0.09268290549516678, -0.08765539526939392, -0.08262789249420166, -0.0776003897190094, -0.07257288694381714, -0.06754538416862488, -0.06251787394285202, -0.05749037116765976, -0.0524628683924675, -0.04743536189198494, -0.04240785539150238, -0.03738035261631012, -0.03235284984111786, -0.0273253433406353, -0.02229783870279789, -0.01727033406496048, -0.01224282942712307, -0.00721532478928566, -0.0021878182888031006, 0.00283968448638916, 0.00786718912422657, 0.01289469376206398, 0.01792219839990139, 0.0229497030377388, 0.02797720767557621, 0.03300471231341362, 0.03803221881389618, 0.04305972158908844, 0.0480872243642807, 0.05311473086476326, 0.05814223736524582, 0.06316974014043808, 0.06819724291563034, 0.0732247531414032, 0.07825225591659546, 0.08327975869178772, 0.08830726146697998, 0.09333476424217224, 0.0983622744679451, 0.10338977724313736, 0.10841728001832962, 0.11344479024410248, 0.11847229301929474, 0.123499795794487, 0.12852729856967926, 0.13355480134487152, 0.13858230412006378, 0.14360982179641724, 0.1486373245716095, 0.15366482734680176, 0.15869233012199402, 0.16371983289718628]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 11.0, 8.0, 18.0, 26.0, 42.0, 52.0, 69.0, 119.0, 170.0, 318.0, 546.0, 1042.0, 2241.0, 5196.0, 12501.0, 33094.0, 90612.0, 245215.0, 367393.0, 182735.0, 65489.0, 24491.0, 9579.0, 3935.0, 1699.0, 796.0, 434.0, 261.0, 154.0, 85.0, 69.0, 47.0, 24.0, 25.0, 12.0, 10.0, 13.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083251953125, -0.0804147720336914, -0.07757759094238281, -0.07474040985107422, -0.07190322875976562, -0.06906604766845703, -0.06622886657714844, -0.06339168548583984, -0.06055450439453125, -0.057717323303222656, -0.05488014221191406, -0.05204296112060547, -0.049205780029296875, -0.04636859893798828, -0.04353141784667969, -0.040694236755371094, -0.0378570556640625, -0.035019874572753906, -0.03218269348144531, -0.02934551239013672, -0.026508331298828125, -0.02367115020751953, -0.020833969116210938, -0.017996788024902344, -0.01515960693359375, -0.012322425842285156, -0.009485244750976562, -0.006648063659667969, -0.003810882568359375, -0.0009737014770507812, 0.0018634796142578125, 0.004700660705566406, 0.007537841796875, 0.010375022888183594, 0.013212203979492188, 0.01604938507080078, 0.018886566162109375, 0.02172374725341797, 0.024560928344726562, 0.027398109436035156, 0.03023529052734375, 0.033072471618652344, 0.03590965270996094, 0.03874683380126953, 0.041584014892578125, 0.04442119598388672, 0.04725837707519531, 0.050095558166503906, 0.0529327392578125, 0.055769920349121094, 0.05860710144042969, 0.06144428253173828, 0.06428146362304688, 0.06711864471435547, 0.06995582580566406, 0.07279300689697266, 0.07563018798828125, 0.07846736907958984, 0.08130455017089844, 0.08414173126220703, 0.08697891235351562, 0.08981609344482422, 0.09265327453613281, 0.0954904556274414, 0.09832763671875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 4.0, 10.0, 23.0, 19.0, 34.0, 39.0, 54.0, 86.0, 68.0, 75.0, 83.0, 87.0, 72.0, 77.0, 66.0, 64.0, 32.0, 39.0, 21.0, 12.0, 17.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0625, -0.06054210662841797, -0.05858421325683594, -0.056626319885253906, -0.054668426513671875, -0.052710533142089844, -0.05075263977050781, -0.04879474639892578, -0.04683685302734375, -0.04487895965576172, -0.04292106628417969, -0.040963172912597656, -0.039005279541015625, -0.037047386169433594, -0.03508949279785156, -0.03313159942626953, -0.0311737060546875, -0.02921581268310547, -0.027257919311523438, -0.025300025939941406, -0.023342132568359375, -0.021384239196777344, -0.019426345825195312, -0.01746845245361328, -0.01551055908203125, -0.013552665710449219, -0.011594772338867188, -0.009636878967285156, -0.007678985595703125, -0.005721092224121094, -0.0037631988525390625, -0.0018053054809570312, 0.000152587890625, 0.0021104812622070312, 0.0040683746337890625, 0.006026268005371094, 0.007984161376953125, 0.009942054748535156, 0.011899948120117188, 0.013857841491699219, 0.01581573486328125, 0.01777362823486328, 0.019731521606445312, 0.021689414978027344, 0.023647308349609375, 0.025605201721191406, 0.027563095092773438, 0.02952098846435547, 0.0314788818359375, 0.03343677520751953, 0.03539466857910156, 0.037352561950683594, 0.039310455322265625, 0.041268348693847656, 0.04322624206542969, 0.04518413543701172, 0.04714202880859375, 0.04909992218017578, 0.05105781555175781, 0.053015708923339844, 0.054973602294921875, 0.056931495666503906, 0.05888938903808594, 0.06084728240966797, 0.06280517578125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 10.0, 8.0, 9.0, 11.0, 11.0, 14.0, 23.0, 26.0, 52.0, 65.0, 81.0, 129.0, 310.0, 977.0, 3559.0, 13655.0, 49508.0, 164507.0, 390513.0, 290560.0, 96347.0, 27618.0, 7446.0, 1934.0, 571.0, 196.0, 90.0, 70.0, 55.0, 45.0, 29.0, 26.0, 30.0, 19.0, 9.0, 11.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.10394287109375, -0.10056495666503906, -0.09718704223632812, -0.09380912780761719, -0.09043121337890625, -0.08705329895019531, -0.08367538452148438, -0.08029747009277344, -0.0769195556640625, -0.07354164123535156, -0.07016372680664062, -0.06678581237792969, -0.06340789794921875, -0.06002998352050781, -0.056652069091796875, -0.05327415466308594, -0.049896240234375, -0.04651832580566406, -0.043140411376953125, -0.03976249694824219, -0.03638458251953125, -0.03300666809082031, -0.029628753662109375, -0.026250839233398438, -0.0228729248046875, -0.019495010375976562, -0.016117095947265625, -0.012739181518554688, -0.00936126708984375, -0.0059833526611328125, -0.002605438232421875, 0.0007724761962890625, 0.004150390625, 0.0075283050537109375, 0.010906219482421875, 0.014284133911132812, 0.01766204833984375, 0.021039962768554688, 0.024417877197265625, 0.027795791625976562, 0.0311737060546875, 0.03455162048339844, 0.037929534912109375, 0.04130744934082031, 0.04468536376953125, 0.04806327819824219, 0.051441192626953125, 0.05481910705566406, 0.058197021484375, 0.06157493591308594, 0.06495285034179688, 0.06833076477050781, 0.07170867919921875, 0.07508659362792969, 0.07846450805664062, 0.08184242248535156, 0.0852203369140625, 0.08859825134277344, 0.09197616577148438, 0.09535408020019531, 0.09873199462890625, 0.10210990905761719, 0.10548782348632812, 0.10886573791503906, 0.11224365234375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 0.0, 3.0, 9.0, 10.0, 12.0, 15.0, 10.0, 23.0, 28.0, 25.0, 22.0, 35.0, 33.0, 34.0, 34.0, 34.0, 34.0, 40.0, 37.0, 42.0, 41.0, 38.0, 45.0, 35.0, 45.0, 43.0, 30.0, 37.0, 27.0, 24.0, 25.0, 19.0, 27.0, 13.0, 11.0, 11.0, 7.0, 8.0, 7.0, 4.0, 4.0, 6.0, 4.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.089111328125, -0.08628463745117188, -0.08345794677734375, -0.08063125610351562, -0.0778045654296875, -0.07497787475585938, -0.07215118408203125, -0.06932449340820312, -0.066497802734375, -0.06367111206054688, -0.06084442138671875, -0.058017730712890625, -0.0551910400390625, -0.052364349365234375, -0.04953765869140625, -0.046710968017578125, -0.04388427734375, -0.041057586669921875, -0.03823089599609375, -0.035404205322265625, -0.0325775146484375, -0.029750823974609375, -0.02692413330078125, -0.024097442626953125, -0.021270751953125, -0.018444061279296875, -0.01561737060546875, -0.012790679931640625, -0.0099639892578125, -0.007137298583984375, -0.00431060791015625, -0.001483917236328125, 0.0013427734375, 0.004169464111328125, 0.00699615478515625, 0.009822845458984375, 0.0126495361328125, 0.015476226806640625, 0.01830291748046875, 0.021129608154296875, 0.023956298828125, 0.026782989501953125, 0.02960968017578125, 0.032436370849609375, 0.0352630615234375, 0.038089752197265625, 0.04091644287109375, 0.043743133544921875, 0.04656982421875, 0.049396514892578125, 0.05222320556640625, 0.055049896240234375, 0.0578765869140625, 0.060703277587890625, 0.06352996826171875, 0.06635665893554688, 0.069183349609375, 0.07201004028320312, 0.07483673095703125, 0.07766342163085938, 0.0804901123046875, 0.08331680297851562, 0.08614349365234375, 0.08897018432617188, 0.091796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 11.0, 14.0, 21.0, 23.0, 24.0, 54.0, 57.0, 104.0, 178.0, 272.0, 415.0, 682.0, 1218.0, 1955.0, 3602.0, 6524.0, 11977.0, 23410.0, 47146.0, 93448.0, 166246.0, 224305.0, 202176.0, 127437.0, 67242.0, 33169.0, 16783.0, 8720.0, 4685.0, 2680.0, 1525.0, 885.0, 572.0, 324.0, 212.0, 156.0, 91.0, 63.0, 41.0, 26.0, 17.0, 13.0, 14.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0232086181640625, -0.02247762680053711, -0.02174663543701172, -0.021015644073486328, -0.020284652709960938, -0.019553661346435547, -0.018822669982910156, -0.018091678619384766, -0.017360687255859375, -0.016629695892333984, -0.015898704528808594, -0.015167713165283203, -0.014436721801757812, -0.013705730438232422, -0.012974739074707031, -0.01224374771118164, -0.01151275634765625, -0.01078176498413086, -0.010050773620605469, -0.009319782257080078, -0.008588790893554688, -0.007857799530029297, -0.007126808166503906, -0.006395816802978516, -0.005664825439453125, -0.004933834075927734, -0.004202842712402344, -0.003471851348876953, -0.0027408599853515625, -0.002009868621826172, -0.0012788772583007812, -0.0005478858947753906, 0.00018310546875, 0.0009140968322753906, 0.0016450881958007812, 0.002376079559326172, 0.0031070709228515625, 0.003838062286376953, 0.004569053649902344, 0.005300045013427734, 0.006031036376953125, 0.006762027740478516, 0.007493019104003906, 0.008224010467529297, 0.008955001831054688, 0.009685993194580078, 0.010416984558105469, 0.01114797592163086, 0.01187896728515625, 0.01260995864868164, 0.013340950012207031, 0.014071941375732422, 0.014802932739257812, 0.015533924102783203, 0.016264915466308594, 0.016995906829833984, 0.017726898193359375, 0.018457889556884766, 0.019188880920410156, 0.019919872283935547, 0.020650863647460938, 0.021381855010986328, 0.02211284637451172, 0.02284383773803711, 0.0235748291015625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 6.0, 6.0, 6.0, 11.0, 10.0, 23.0, 21.0, 20.0, 34.0, 39.0, 58.0, 75.0, 89.0, 93.0, 93.0, 89.0, 71.0, 65.0, 46.0, 30.0, 32.0, 16.0, 13.0, 12.0, 12.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4662742614746094e-05, -1.4230608940124512e-05, -1.379847526550293e-05, -1.3366341590881348e-05, -1.2934207916259766e-05, -1.2502074241638184e-05, -1.2069940567016602e-05, -1.163780689239502e-05, -1.1205673217773438e-05, -1.0773539543151855e-05, -1.0341405868530273e-05, -9.909272193908691e-06, -9.47713851928711e-06, -9.045004844665527e-06, -8.612871170043945e-06, -8.180737495422363e-06, -7.748603820800781e-06, -7.316470146179199e-06, -6.884336471557617e-06, -6.452202796936035e-06, -6.020069122314453e-06, -5.587935447692871e-06, -5.155801773071289e-06, -4.723668098449707e-06, -4.291534423828125e-06, -3.859400749206543e-06, -3.427267074584961e-06, -2.995133399963379e-06, -2.562999725341797e-06, -2.130866050720215e-06, -1.6987323760986328e-06, -1.2665987014770508e-06, -8.344650268554688e-07, -4.023313522338867e-07, 2.9802322387695312e-08, 4.6193599700927734e-07, 8.940696716308594e-07, 1.3262033462524414e-06, 1.7583370208740234e-06, 2.1904706954956055e-06, 2.6226043701171875e-06, 3.0547380447387695e-06, 3.4868717193603516e-06, 3.919005393981934e-06, 4.351139068603516e-06, 4.783272743225098e-06, 5.21540641784668e-06, 5.647540092468262e-06, 6.079673767089844e-06, 6.511807441711426e-06, 6.943941116333008e-06, 7.37607479095459e-06, 7.808208465576172e-06, 8.240342140197754e-06, 8.672475814819336e-06, 9.104609489440918e-06, 9.5367431640625e-06, 9.968876838684082e-06, 1.0401010513305664e-05, 1.0833144187927246e-05, 1.1265277862548828e-05, 1.169741153717041e-05, 1.2129545211791992e-05, 1.2561678886413574e-05, 1.2993812561035156e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 1.0, 4.0, 12.0, 15.0, 30.0, 42.0, 55.0, 127.0, 219.0, 450.0, 1042.0, 2298.0, 5709.0, 15960.0, 47471.0, 145940.0, 321879.0, 307571.0, 133167.0, 42662.0, 14341.0, 5464.0, 2188.0, 953.0, 447.0, 213.0, 123.0, 58.0, 31.0, 27.0, 13.0, 13.0, 11.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0380859375, -0.03702664375305176, -0.035967350006103516, -0.03490805625915527, -0.03384876251220703, -0.03278946876525879, -0.03173017501831055, -0.030670881271362305, -0.029611587524414062, -0.02855229377746582, -0.027493000030517578, -0.026433706283569336, -0.025374412536621094, -0.02431511878967285, -0.02325582504272461, -0.022196531295776367, -0.021137237548828125, -0.020077943801879883, -0.01901865005493164, -0.0179593563079834, -0.016900062561035156, -0.015840768814086914, -0.014781475067138672, -0.01372218132019043, -0.012662887573242188, -0.011603593826293945, -0.010544300079345703, -0.009485006332397461, -0.008425712585449219, -0.0073664188385009766, -0.006307125091552734, -0.005247831344604492, -0.00418853759765625, -0.003129243850708008, -0.0020699501037597656, -0.0010106563568115234, 4.863739013671875e-05, 0.001107931137084961, 0.002167224884033203, 0.0032265186309814453, 0.0042858123779296875, 0.00534510612487793, 0.006404399871826172, 0.007463693618774414, 0.008522987365722656, 0.009582281112670898, 0.01064157485961914, 0.011700868606567383, 0.012760162353515625, 0.013819456100463867, 0.01487874984741211, 0.01593804359436035, 0.016997337341308594, 0.018056631088256836, 0.019115924835205078, 0.02017521858215332, 0.021234512329101562, 0.022293806076049805, 0.023353099822998047, 0.02441239356994629, 0.02547168731689453, 0.026530981063842773, 0.027590274810791016, 0.028649568557739258, 0.0297088623046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 4.0, 6.0, 11.0, 12.0, 13.0, 15.0, 15.0, 19.0, 25.0, 36.0, 31.0, 36.0, 35.0, 54.0, 40.0, 51.0, 70.0, 60.0, 60.0, 63.0, 60.0, 44.0, 33.0, 42.0, 39.0, 25.0, 18.0, 16.0, 12.0, 13.0, 4.0, 12.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0240631103515625, -0.02329850196838379, -0.022533893585205078, -0.021769285202026367, -0.021004676818847656, -0.020240068435668945, -0.019475460052490234, -0.018710851669311523, -0.017946243286132812, -0.0171816349029541, -0.01641702651977539, -0.01565241813659668, -0.014887809753417969, -0.014123201370239258, -0.013358592987060547, -0.012593984603881836, -0.011829376220703125, -0.011064767837524414, -0.010300159454345703, -0.009535551071166992, -0.008770942687988281, -0.00800633430480957, -0.007241725921630859, -0.0064771175384521484, -0.0057125091552734375, -0.0049479007720947266, -0.004183292388916016, -0.0034186840057373047, -0.0026540756225585938, -0.0018894672393798828, -0.0011248588562011719, -0.00036025047302246094, 0.00040435791015625, 0.001168966293334961, 0.0019335746765136719, 0.002698183059692383, 0.0034627914428710938, 0.004227399826049805, 0.004992008209228516, 0.0057566165924072266, 0.0065212249755859375, 0.0072858333587646484, 0.00805044174194336, 0.00881505012512207, 0.009579658508300781, 0.010344266891479492, 0.011108875274658203, 0.011873483657836914, 0.012638092041015625, 0.013402700424194336, 0.014167308807373047, 0.014931917190551758, 0.01569652557373047, 0.01646113395690918, 0.01722574234008789, 0.0179903507232666, 0.018754959106445312, 0.019519567489624023, 0.020284175872802734, 0.021048784255981445, 0.021813392639160156, 0.022578001022338867, 0.023342609405517578, 0.02410721778869629, 0.024871826171875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 15.0, 45.0, 70.0, 134.0, 192.0, 202.0, 153.0, 97.0, 57.0, 20.0, 16.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7102943062782288, -0.6911340355873108, -0.6719738245010376, -0.6528135538101196, -0.6336533427238464, -0.6144930720329285, -0.5953328609466553, -0.5761725902557373, -0.5570123195648193, -0.5378520488739014, -0.5186918377876282, -0.4995315670967102, -0.4803713262081146, -0.46121108531951904, -0.44205084443092346, -0.4228906035423279, -0.4037303626537323, -0.3845701217651367, -0.36540988087654114, -0.34624963998794556, -0.3270893692970276, -0.307929128408432, -0.2887688875198364, -0.26960861682891846, -0.25044840574264526, -0.23128816485404968, -0.2121279090642929, -0.19296766817569733, -0.17380741238594055, -0.15464717149734497, -0.1354869306087494, -0.11632667481899261, -0.09716641902923584, -0.07800617069005966, -0.05884592607617378, -0.0396856814622879, -0.020525433123111725, -0.0013651847839355469, 0.017795056104660034, 0.03695531189441681, 0.05611555278301239, 0.07527580112218857, 0.09443604946136475, 0.11359629034996033, 0.1327565312385559, 0.15191678702831268, 0.17107702791690826, 0.19023728370666504, 0.20939752459526062, 0.2285577654838562, 0.24771802127361298, 0.26687824726104736, 0.28603851795196533, 0.3051987588405609, 0.3243589997291565, 0.34351927042007446, 0.36267948150634766, 0.38183972239494324, 0.4009999632835388, 0.4201602339744568, 0.43932047486305237, 0.45848071575164795, 0.47764095664024353, 0.4968011975288391, 0.5159614682197571]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 6.0, 5.0, 13.0, 1.0, 6.0, 9.0, 15.0, 8.0, 21.0, 31.0, 27.0, 29.0, 23.0, 35.0, 53.0, 33.0, 50.0, 45.0, 38.0, 43.0, 44.0, 38.0, 37.0, 38.0, 40.0, 37.0, 33.0, 32.0, 28.0, 30.0, 33.0, 21.0, 18.0, 17.0, 12.0, 11.0, 11.0, 7.0, 7.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3220139145851135, -0.311942994594574, -0.3018721044063568, -0.29180118441581726, -0.2817302942276001, -0.27165937423706055, -0.261588454246521, -0.25151753425598145, -0.24144664406776428, -0.23137573897838593, -0.22130483388900757, -0.21123391389846802, -0.20116300880908966, -0.1910921037197113, -0.18102118372917175, -0.1709502786397934, -0.16087937355041504, -0.15080846846103668, -0.14073756337165833, -0.13066664338111877, -0.12059573829174042, -0.11052483320236206, -0.1004539206624031, -0.09038300812244415, -0.0803121030330658, -0.07024119794368744, -0.060170285403728485, -0.05009937658905983, -0.040028467774391174, -0.02995755895972252, -0.019886650145053864, -0.00981573760509491, 0.00025516748428344727, 0.010326076298952103, 0.020396985113620758, 0.030467893928289413, 0.04053880274295807, 0.050609711557626724, 0.06068062037229538, 0.07075153291225433, 0.08082243800163269, 0.09089334309101105, 0.10096425563097, 0.11103516817092896, 0.12110607326030731, 0.13117697834968567, 0.14124789834022522, 0.15131880342960358, 0.16138970851898193, 0.1714606136083603, 0.18153151869773865, 0.1916024386882782, 0.20167334377765656, 0.2117442488670349, 0.22181516885757446, 0.23188607394695282, 0.24195697903633118, 0.2520278990268707, 0.2620987892150879, 0.27216970920562744, 0.282240629196167, 0.29231151938438416, 0.3023824393749237, 0.31245332956314087, 0.3225242495536804]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 8.0, 13.0, 15.0, 17.0, 42.0, 67.0, 135.0, 283.0, 652.0, 2081.0, 10253.0, 142392.0, 3363695.0, 645299.0, 24587.0, 3417.0, 769.0, 294.0, 133.0, 46.0, 42.0, 24.0, 9.0, 7.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.155029296875, -0.15091609954833984, -0.1468029022216797, -0.14268970489501953, -0.13857650756835938, -0.13446331024169922, -0.13035011291503906, -0.1262369155883789, -0.12212371826171875, -0.1180105209350586, -0.11389732360839844, -0.10978412628173828, -0.10567092895507812, -0.10155773162841797, -0.09744453430175781, -0.09333133697509766, -0.0892181396484375, -0.08510494232177734, -0.08099174499511719, -0.07687854766845703, -0.07276535034179688, -0.06865215301513672, -0.06453895568847656, -0.060425758361816406, -0.05631256103515625, -0.052199363708496094, -0.04808616638183594, -0.04397296905517578, -0.039859771728515625, -0.03574657440185547, -0.03163337707519531, -0.027520179748535156, -0.023406982421875, -0.019293785095214844, -0.015180587768554688, -0.011067390441894531, -0.006954193115234375, -0.0028409957885742188, 0.0012722015380859375, 0.005385398864746094, 0.00949859619140625, 0.013611793518066406, 0.017724990844726562, 0.02183818817138672, 0.025951385498046875, 0.03006458282470703, 0.03417778015136719, 0.038290977478027344, 0.0424041748046875, 0.046517372131347656, 0.05063056945800781, 0.05474376678466797, 0.058856964111328125, 0.06297016143798828, 0.06708335876464844, 0.0711965560913086, 0.07530975341796875, 0.0794229507446289, 0.08353614807128906, 0.08764934539794922, 0.09176254272460938, 0.09587574005126953, 0.09998893737792969, 0.10410213470458984, 0.10821533203125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 9.0, 10.0, 13.0, 18.0, 34.0, 39.0, 54.0, 70.0, 73.0, 79.0, 84.0, 76.0, 80.0, 80.0, 56.0, 52.0, 51.0, 40.0, 31.0, 15.0, 15.0, 11.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06927490234375, -0.0671854019165039, -0.06509590148925781, -0.06300640106201172, -0.060916900634765625, -0.05882740020751953, -0.05673789978027344, -0.054648399353027344, -0.05255889892578125, -0.050469398498535156, -0.04837989807128906, -0.04629039764404297, -0.044200897216796875, -0.04211139678955078, -0.04002189636230469, -0.037932395935058594, -0.0358428955078125, -0.033753395080566406, -0.03166389465332031, -0.02957439422607422, -0.027484893798828125, -0.02539539337158203, -0.023305892944335938, -0.021216392517089844, -0.01912689208984375, -0.017037391662597656, -0.014947891235351562, -0.012858390808105469, -0.010768890380859375, -0.008679389953613281, -0.0065898895263671875, -0.004500389099121094, -0.002410888671875, -0.00032138824462890625, 0.0017681121826171875, 0.0038576126098632812, 0.005947113037109375, 0.008036613464355469, 0.010126113891601562, 0.012215614318847656, 0.01430511474609375, 0.016394615173339844, 0.018484115600585938, 0.02057361602783203, 0.022663116455078125, 0.02475261688232422, 0.026842117309570312, 0.028931617736816406, 0.0310211181640625, 0.033110618591308594, 0.03520011901855469, 0.03728961944580078, 0.039379119873046875, 0.04146862030029297, 0.04355812072753906, 0.045647621154785156, 0.04773712158203125, 0.049826622009277344, 0.05191612243652344, 0.05400562286376953, 0.056095123291015625, 0.05818462371826172, 0.06027412414550781, 0.062363624572753906, 0.064453125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 7.0, 19.0, 20.0, 34.0, 57.0, 103.0, 189.0, 360.0, 983.0, 5660.0, 95206.0, 2839508.0, 1213994.0, 33835.0, 2958.0, 679.0, 290.0, 143.0, 79.0, 50.0, 44.0, 22.0, 11.0, 6.0, 7.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11798095703125, -0.1135854721069336, -0.10918998718261719, -0.10479450225830078, -0.10039901733398438, -0.09600353240966797, -0.09160804748535156, -0.08721256256103516, -0.08281707763671875, -0.07842159271240234, -0.07402610778808594, -0.06963062286376953, -0.06523513793945312, -0.06083965301513672, -0.05644416809082031, -0.052048683166503906, -0.0476531982421875, -0.043257713317871094, -0.03886222839355469, -0.03446674346923828, -0.030071258544921875, -0.02567577362060547, -0.021280288696289062, -0.016884803771972656, -0.01248931884765625, -0.008093833923339844, -0.0036983489990234375, 0.0006971359252929688, 0.005092620849609375, 0.009488105773925781, 0.013883590698242188, 0.018279075622558594, 0.022674560546875, 0.027070045471191406, 0.03146553039550781, 0.03586101531982422, 0.040256500244140625, 0.04465198516845703, 0.04904747009277344, 0.053442955017089844, 0.05783843994140625, 0.062233924865722656, 0.06662940979003906, 0.07102489471435547, 0.07542037963867188, 0.07981586456298828, 0.08421134948730469, 0.0886068344116211, 0.0930023193359375, 0.0973978042602539, 0.10179328918457031, 0.10618877410888672, 0.11058425903320312, 0.11497974395751953, 0.11937522888183594, 0.12377071380615234, 0.12816619873046875, 0.13256168365478516, 0.13695716857910156, 0.14135265350341797, 0.14574813842773438, 0.15014362335205078, 0.1545391082763672, 0.1589345932006836, 0.163330078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 8.0, 9.0, 13.0, 18.0, 31.0, 51.0, 72.0, 91.0, 111.0, 188.0, 230.0, 351.0, 426.0, 497.0, 483.0, 389.0, 327.0, 240.0, 153.0, 123.0, 81.0, 54.0, 34.0, 26.0, 15.0, 15.0, 10.0, 6.0, 10.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.071533203125, -0.0696406364440918, -0.0677480697631836, -0.06585550308227539, -0.06396293640136719, -0.062070369720458984, -0.06017780303955078, -0.05828523635864258, -0.056392669677734375, -0.05450010299682617, -0.05260753631591797, -0.050714969635009766, -0.04882240295410156, -0.04692983627319336, -0.045037269592285156, -0.04314470291137695, -0.04125213623046875, -0.03935956954956055, -0.037467002868652344, -0.03557443618774414, -0.03368186950683594, -0.031789302825927734, -0.02989673614501953, -0.028004169464111328, -0.026111602783203125, -0.024219036102294922, -0.02232646942138672, -0.020433902740478516, -0.018541336059570312, -0.01664876937866211, -0.014756202697753906, -0.012863636016845703, -0.0109710693359375, -0.009078502655029297, -0.007185935974121094, -0.005293369293212891, -0.0034008026123046875, -0.0015082359313964844, 0.00038433074951171875, 0.002276897430419922, 0.004169464111328125, 0.006062030792236328, 0.007954597473144531, 0.009847164154052734, 0.011739730834960938, 0.01363229751586914, 0.015524864196777344, 0.017417430877685547, 0.01930999755859375, 0.021202564239501953, 0.023095130920410156, 0.02498769760131836, 0.026880264282226562, 0.028772830963134766, 0.03066539764404297, 0.03255796432495117, 0.034450531005859375, 0.03634309768676758, 0.03823566436767578, 0.040128231048583984, 0.04202079772949219, 0.04391336441040039, 0.045805931091308594, 0.0476984977722168, 0.049591064453125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 10.0, 6.0, 23.0, 26.0, 38.0, 60.0, 94.0, 105.0, 93.0, 99.0, 116.0, 91.0, 88.0, 56.0, 41.0, 28.0, 8.0, 8.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.4136260449886322, -0.4049478769302368, -0.39626970887184143, -0.38759151101112366, -0.37891334295272827, -0.3702351748943329, -0.3615570068359375, -0.3528788387775421, -0.34420067071914673, -0.33552250266075134, -0.32684433460235596, -0.3181661367416382, -0.3094879686832428, -0.3008098006248474, -0.292131632566452, -0.28345346450805664, -0.27477526664733887, -0.2660970985889435, -0.2574189305305481, -0.24874074757099152, -0.24006256461143494, -0.23138439655303955, -0.22270622849464417, -0.21402806043624878, -0.2053498774766922, -0.19667170941829681, -0.18799352645874023, -0.17931535840034485, -0.17063719034194946, -0.16195900738239288, -0.1532808393239975, -0.14460265636444092, -0.13592448830604553, -0.12724632024765015, -0.11856813728809357, -0.10988996922969818, -0.1012117937207222, -0.09253361821174622, -0.08385545015335083, -0.07517727464437485, -0.06649909913539886, -0.05782092362642288, -0.0491427518427372, -0.040464580059051514, -0.03178640455007553, -0.02310822904109955, -0.014430057257413864, -0.00575188547372818, 0.0029262900352478027, 0.011604463681578636, 0.02028263732790947, 0.028960810974240303, 0.037638984620571136, 0.04631716012954712, 0.0549953319132328, 0.06367350369691849, 0.07235167920589447, 0.08102985471487045, 0.08970803022384644, 0.09838619828224182, 0.1070643737912178, 0.11574254930019379, 0.12442071735858917, 0.13309890031814575, 0.14177706837654114]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 14.0, 13.0, 7.0, 19.0, 16.0, 22.0, 25.0, 26.0, 43.0, 33.0, 39.0, 40.0, 45.0, 38.0, 43.0, 50.0, 46.0, 53.0, 42.0, 52.0, 34.0, 36.0, 17.0, 30.0, 35.0, 24.0, 24.0, 15.0, 23.0, 16.0, 13.0, 9.0, 6.0, 5.0, 8.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18157178163528442, -0.17576788365840912, -0.169964000582695, -0.1641601026058197, -0.1583562195301056, -0.15255232155323029, -0.14674842357635498, -0.14094454050064087, -0.13514064252376556, -0.12933674454689026, -0.12353286147117615, -0.11772896349430084, -0.11192507296800613, -0.10612118244171143, -0.10031728446483612, -0.09451339393854141, -0.0887095034122467, -0.082905612885952, -0.07710172235965729, -0.07129782438278198, -0.06549393385648727, -0.059690043330192566, -0.05388614907860756, -0.04808225482702255, -0.042278364300727844, -0.036474473774433136, -0.03067057952284813, -0.024866687133908272, -0.019062794744968414, -0.013258902356028557, -0.007455009967088699, -0.0016511157155036926, 0.004152774810791016, 0.009956667199730873, 0.01576055958867073, 0.021564451977610588, 0.027368344366550446, 0.033172234892845154, 0.03897612914443016, 0.04478002339601517, 0.050583913922309875, 0.056387804448604584, 0.06219169870018959, 0.0679955929517746, 0.0737994834780693, 0.07960337400436401, 0.08540727198123932, 0.09121116250753403, 0.09701505303382874, 0.10281894356012344, 0.10862283408641815, 0.11442673206329346, 0.12023062258958817, 0.12603451311588287, 0.13183841109275818, 0.1376422941684723, 0.1434461921453476, 0.1492500901222229, 0.155053973197937, 0.16085787117481232, 0.16666176915168762, 0.17246565222740173, 0.17826955020427704, 0.18407344818115234, 0.18987733125686646]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 4.0, 10.0, 5.0, 10.0, 14.0, 16.0, 29.0, 40.0, 74.0, 120.0, 151.0, 261.0, 451.0, 980.0, 2036.0, 4700.0, 12039.0, 32688.0, 96371.0, 271473.0, 368854.0, 169050.0, 55845.0, 19713.0, 7467.0, 3197.0, 1408.0, 632.0, 343.0, 175.0, 130.0, 81.0, 49.0, 44.0, 23.0, 22.0, 10.0, 8.0, 10.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1734619140625, -0.1683979034423828, -0.16333389282226562, -0.15826988220214844, -0.15320587158203125, -0.14814186096191406, -0.14307785034179688, -0.1380138397216797, -0.1329498291015625, -0.1278858184814453, -0.12282180786132812, -0.11775779724121094, -0.11269378662109375, -0.10762977600097656, -0.10256576538085938, -0.09750175476074219, -0.092437744140625, -0.08737373352050781, -0.08230972290039062, -0.07724571228027344, -0.07218170166015625, -0.06711769104003906, -0.062053680419921875, -0.05698966979980469, -0.0519256591796875, -0.04686164855957031, -0.041797637939453125, -0.03673362731933594, -0.03166961669921875, -0.026605606079101562, -0.021541595458984375, -0.016477584838867188, -0.01141357421875, -0.0063495635986328125, -0.001285552978515625, 0.0037784576416015625, 0.00884246826171875, 0.013906478881835938, 0.018970489501953125, 0.024034500122070312, 0.0290985107421875, 0.03416252136230469, 0.039226531982421875, 0.04429054260253906, 0.04935455322265625, 0.05441856384277344, 0.059482574462890625, 0.06454658508300781, 0.069610595703125, 0.07467460632324219, 0.07973861694335938, 0.08480262756347656, 0.08986663818359375, 0.09493064880371094, 0.09999465942382812, 0.10505867004394531, 0.1101226806640625, 0.11518669128417969, 0.12025070190429688, 0.12531471252441406, 0.13037872314453125, 0.13544273376464844, 0.14050674438476562, 0.1455707550048828, 0.150634765625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 5.0, 11.0, 16.0, 19.0, 21.0, 48.0, 55.0, 77.0, 65.0, 84.0, 70.0, 81.0, 75.0, 68.0, 80.0, 47.0, 58.0, 32.0, 28.0, 19.0, 18.0, 5.0, 8.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06817626953125, -0.06618261337280273, -0.06418895721435547, -0.0621953010559082, -0.06020164489746094, -0.05820798873901367, -0.056214332580566406, -0.05422067642211914, -0.052227020263671875, -0.05023336410522461, -0.048239707946777344, -0.04624605178833008, -0.04425239562988281, -0.04225873947143555, -0.04026508331298828, -0.038271427154541016, -0.03627777099609375, -0.034284114837646484, -0.03229045867919922, -0.030296802520751953, -0.028303146362304688, -0.026309490203857422, -0.024315834045410156, -0.02232217788696289, -0.020328521728515625, -0.01833486557006836, -0.016341209411621094, -0.014347553253173828, -0.012353897094726562, -0.010360240936279297, -0.008366584777832031, -0.006372928619384766, -0.0043792724609375, -0.0023856163024902344, -0.00039196014404296875, 0.0016016960144042969, 0.0035953521728515625, 0.005589008331298828, 0.007582664489746094, 0.00957632064819336, 0.011569976806640625, 0.01356363296508789, 0.015557289123535156, 0.017550945281982422, 0.019544601440429688, 0.021538257598876953, 0.02353191375732422, 0.025525569915771484, 0.02751922607421875, 0.029512882232666016, 0.03150653839111328, 0.03350019454956055, 0.03549385070800781, 0.03748750686645508, 0.039481163024902344, 0.04147481918334961, 0.043468475341796875, 0.04546213150024414, 0.047455787658691406, 0.04944944381713867, 0.05144309997558594, 0.0534367561340332, 0.05543041229248047, 0.057424068450927734, 0.059417724609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 2.0, 8.0, 8.0, 7.0, 12.0, 15.0, 21.0, 33.0, 36.0, 50.0, 75.0, 138.0, 211.0, 365.0, 674.0, 1431.0, 3136.0, 7207.0, 17585.0, 43995.0, 106648.0, 218486.0, 286768.0, 200959.0, 94412.0, 38595.0, 15699.0, 6369.0, 2719.0, 1268.0, 651.0, 323.0, 219.0, 135.0, 97.0, 52.0, 40.0, 33.0, 21.0, 16.0, 10.0, 6.0, 10.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10589599609375, -0.10252666473388672, -0.09915733337402344, -0.09578800201416016, -0.09241867065429688, -0.0890493392944336, -0.08568000793457031, -0.08231067657470703, -0.07894134521484375, -0.07557201385498047, -0.07220268249511719, -0.0688333511352539, -0.06546401977539062, -0.062094688415527344, -0.05872535705566406, -0.05535602569580078, -0.0519866943359375, -0.04861736297607422, -0.04524803161621094, -0.041878700256347656, -0.038509368896484375, -0.035140037536621094, -0.03177070617675781, -0.02840137481689453, -0.02503204345703125, -0.02166271209716797, -0.018293380737304688, -0.014924049377441406, -0.011554718017578125, -0.008185386657714844, -0.0048160552978515625, -0.0014467239379882812, 0.001922607421875, 0.005291938781738281, 0.008661270141601562, 0.012030601501464844, 0.015399932861328125, 0.018769264221191406, 0.022138595581054688, 0.02550792694091797, 0.02887725830078125, 0.03224658966064453, 0.03561592102050781, 0.038985252380371094, 0.042354583740234375, 0.045723915100097656, 0.04909324645996094, 0.05246257781982422, 0.0558319091796875, 0.05920124053955078, 0.06257057189941406, 0.06593990325927734, 0.06930923461914062, 0.0726785659790039, 0.07604789733886719, 0.07941722869873047, 0.08278656005859375, 0.08615589141845703, 0.08952522277832031, 0.0928945541381836, 0.09626388549804688, 0.09963321685791016, 0.10300254821777344, 0.10637187957763672, 0.1097412109375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 11.0, 11.0, 9.0, 11.0, 18.0, 16.0, 20.0, 19.0, 23.0, 24.0, 23.0, 36.0, 35.0, 41.0, 39.0, 34.0, 49.0, 45.0, 48.0, 51.0, 49.0, 51.0, 29.0, 32.0, 42.0, 34.0, 33.0, 20.0, 20.0, 23.0, 26.0, 20.0, 15.0, 11.0, 10.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11669921875, -0.11301040649414062, -0.10932159423828125, -0.10563278198242188, -0.1019439697265625, -0.09825515747070312, -0.09456634521484375, -0.09087753295898438, -0.087188720703125, -0.08349990844726562, -0.07981109619140625, -0.07612228393554688, -0.0724334716796875, -0.06874465942382812, -0.06505584716796875, -0.061367034912109375, -0.05767822265625, -0.053989410400390625, -0.05030059814453125, -0.046611785888671875, -0.0429229736328125, -0.039234161376953125, -0.03554534912109375, -0.031856536865234375, -0.028167724609375, -0.024478912353515625, -0.02079010009765625, -0.017101287841796875, -0.0134124755859375, -0.009723663330078125, -0.00603485107421875, -0.002346038818359375, 0.0013427734375, 0.005031585693359375, 0.00872039794921875, 0.012409210205078125, 0.0160980224609375, 0.019786834716796875, 0.02347564697265625, 0.027164459228515625, 0.030853271484375, 0.034542083740234375, 0.03823089599609375, 0.041919708251953125, 0.0456085205078125, 0.049297332763671875, 0.05298614501953125, 0.056674957275390625, 0.06036376953125, 0.06405258178710938, 0.06774139404296875, 0.07143020629882812, 0.0751190185546875, 0.07880783081054688, 0.08249664306640625, 0.08618545532226562, 0.089874267578125, 0.09356307983398438, 0.09725189208984375, 0.10094070434570312, 0.1046295166015625, 0.10831832885742188, 0.11200714111328125, 0.11569595336914062, 0.119384765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 7.0, 8.0, 11.0, 14.0, 16.0, 22.0, 52.0, 82.0, 112.0, 193.0, 326.0, 544.0, 832.0, 1433.0, 2369.0, 3981.0, 6760.0, 12092.0, 22303.0, 42249.0, 83749.0, 161253.0, 245691.0, 213596.0, 119838.0, 60519.0, 31291.0, 16735.0, 9218.0, 5384.0, 3142.0, 1863.0, 1072.0, 688.0, 418.0, 238.0, 160.0, 108.0, 72.0, 34.0, 22.0, 24.0, 13.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.044769287109375, -0.0435175895690918, -0.042265892028808594, -0.04101419448852539, -0.03976249694824219, -0.038510799407958984, -0.03725910186767578, -0.03600740432739258, -0.034755706787109375, -0.03350400924682617, -0.03225231170654297, -0.031000614166259766, -0.029748916625976562, -0.02849721908569336, -0.027245521545410156, -0.025993824005126953, -0.02474212646484375, -0.023490428924560547, -0.022238731384277344, -0.02098703384399414, -0.019735336303710938, -0.018483638763427734, -0.01723194122314453, -0.015980243682861328, -0.014728546142578125, -0.013476848602294922, -0.012225151062011719, -0.010973453521728516, -0.009721755981445312, -0.00847005844116211, -0.007218360900878906, -0.005966663360595703, -0.0047149658203125, -0.003463268280029297, -0.0022115707397460938, -0.0009598731994628906, 0.0002918243408203125, 0.0015435218811035156, 0.0027952194213867188, 0.004046916961669922, 0.005298614501953125, 0.006550312042236328, 0.007802009582519531, 0.009053707122802734, 0.010305404663085938, 0.01155710220336914, 0.012808799743652344, 0.014060497283935547, 0.01531219482421875, 0.016563892364501953, 0.017815589904785156, 0.01906728744506836, 0.020318984985351562, 0.021570682525634766, 0.02282238006591797, 0.024074077606201172, 0.025325775146484375, 0.026577472686767578, 0.02782917022705078, 0.029080867767333984, 0.030332565307617188, 0.03158426284790039, 0.032835960388183594, 0.0340876579284668, 0.03533935546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 3.0, 3.0, 13.0, 11.0, 13.0, 12.0, 25.0, 28.0, 28.0, 34.0, 39.0, 50.0, 54.0, 67.0, 53.0, 73.0, 69.0, 56.0, 50.0, 57.0, 48.0, 46.0, 32.0, 19.0, 21.0, 21.0, 15.0, 13.0, 7.0, 10.0, 6.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.7762184143066406e-05, -1.728162169456482e-05, -1.6801059246063232e-05, -1.6320496797561646e-05, -1.583993434906006e-05, -1.535937190055847e-05, -1.4878809452056885e-05, -1.4398247003555298e-05, -1.3917684555053711e-05, -1.3437122106552124e-05, -1.2956559658050537e-05, -1.247599720954895e-05, -1.1995434761047363e-05, -1.1514872312545776e-05, -1.103430986404419e-05, -1.0553747415542603e-05, -1.0073184967041016e-05, -9.592622518539429e-06, -9.112060070037842e-06, -8.631497621536255e-06, -8.150935173034668e-06, -7.670372724533081e-06, -7.189810276031494e-06, -6.709247827529907e-06, -6.22868537902832e-06, -5.748122930526733e-06, -5.2675604820251465e-06, -4.7869980335235596e-06, -4.306435585021973e-06, -3.825873136520386e-06, -3.345310688018799e-06, -2.864748239517212e-06, -2.384185791015625e-06, -1.903623342514038e-06, -1.4230608940124512e-06, -9.424984455108643e-07, -4.6193599700927734e-07, 1.862645149230957e-08, 4.991888999938965e-07, 9.797513484954834e-07, 1.4603137969970703e-06, 1.9408762454986572e-06, 2.421438694000244e-06, 2.902001142501831e-06, 3.382563591003418e-06, 3.863126039505005e-06, 4.343688488006592e-06, 4.824250936508179e-06, 5.304813385009766e-06, 5.7853758335113525e-06, 6.2659382820129395e-06, 6.746500730514526e-06, 7.227063179016113e-06, 7.7076256275177e-06, 8.188188076019287e-06, 8.668750524520874e-06, 9.149312973022461e-06, 9.629875421524048e-06, 1.0110437870025635e-05, 1.0591000318527222e-05, 1.1071562767028809e-05, 1.1552125215530396e-05, 1.2032687664031982e-05, 1.251325011253357e-05, 1.2993812561035156e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 9.0, 14.0, 12.0, 19.0, 25.0, 36.0, 59.0, 101.0, 192.0, 290.0, 519.0, 868.0, 1675.0, 3208.0, 6139.0, 12241.0, 27118.0, 69268.0, 187731.0, 348850.0, 235576.0, 90078.0, 33788.0, 14943.0, 7324.0, 3832.0, 2066.0, 1105.0, 596.0, 365.0, 195.0, 120.0, 66.0, 40.0, 20.0, 15.0, 10.0, 12.0, 12.0, 6.0, 4.0, 3.0, 1.0, 3.0], "bins": [-0.06317138671875, -0.06157732009887695, -0.059983253479003906, -0.05838918685913086, -0.05679512023925781, -0.055201053619384766, -0.05360698699951172, -0.05201292037963867, -0.050418853759765625, -0.04882478713989258, -0.04723072052001953, -0.045636653900146484, -0.04404258728027344, -0.04244852066040039, -0.040854454040527344, -0.0392603874206543, -0.03766632080078125, -0.0360722541809082, -0.034478187561035156, -0.03288412094116211, -0.03129005432128906, -0.029695987701416016, -0.02810192108154297, -0.026507854461669922, -0.024913787841796875, -0.023319721221923828, -0.02172565460205078, -0.020131587982177734, -0.018537521362304688, -0.01694345474243164, -0.015349388122558594, -0.013755321502685547, -0.0121612548828125, -0.010567188262939453, -0.008973121643066406, -0.007379055023193359, -0.0057849884033203125, -0.004190921783447266, -0.0025968551635742188, -0.0010027885437011719, 0.000591278076171875, 0.002185344696044922, 0.0037794113159179688, 0.005373477935791016, 0.0069675445556640625, 0.00856161117553711, 0.010155677795410156, 0.011749744415283203, 0.01334381103515625, 0.014937877655029297, 0.016531944274902344, 0.01812601089477539, 0.019720077514648438, 0.021314144134521484, 0.02290821075439453, 0.024502277374267578, 0.026096343994140625, 0.027690410614013672, 0.02928447723388672, 0.030878543853759766, 0.03247261047363281, 0.03406667709350586, 0.035660743713378906, 0.03725481033325195, 0.038848876953125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 6.0, 8.0, 2.0, 6.0, 8.0, 7.0, 12.0, 15.0, 14.0, 17.0, 29.0, 26.0, 31.0, 45.0, 45.0, 53.0, 56.0, 69.0, 57.0, 70.0, 59.0, 56.0, 52.0, 49.0, 35.0, 34.0, 17.0, 29.0, 17.0, 17.0, 11.0, 7.0, 13.0, 5.0, 7.0, 3.0, 3.0, 3.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03887939453125, -0.03773069381713867, -0.036581993103027344, -0.035433292388916016, -0.03428459167480469, -0.03313589096069336, -0.03198719024658203, -0.030838489532470703, -0.029689788818359375, -0.028541088104248047, -0.02739238739013672, -0.02624368667602539, -0.025094985961914062, -0.023946285247802734, -0.022797584533691406, -0.021648883819580078, -0.02050018310546875, -0.019351482391357422, -0.018202781677246094, -0.017054080963134766, -0.015905380249023438, -0.01475667953491211, -0.013607978820800781, -0.012459278106689453, -0.011310577392578125, -0.010161876678466797, -0.009013175964355469, -0.00786447525024414, -0.0067157745361328125, -0.005567073822021484, -0.004418373107910156, -0.003269672393798828, -0.0021209716796875, -0.0009722709655761719, 0.00017642974853515625, 0.0013251304626464844, 0.0024738311767578125, 0.0036225318908691406, 0.004771232604980469, 0.005919933319091797, 0.007068634033203125, 0.008217334747314453, 0.009366035461425781, 0.01051473617553711, 0.011663436889648438, 0.012812137603759766, 0.013960838317871094, 0.015109539031982422, 0.01625823974609375, 0.017406940460205078, 0.018555641174316406, 0.019704341888427734, 0.020853042602539062, 0.02200174331665039, 0.02315044403076172, 0.024299144744873047, 0.025447845458984375, 0.026596546173095703, 0.02774524688720703, 0.02889394760131836, 0.030042648315429688, 0.031191349029541016, 0.032340049743652344, 0.03348875045776367, 0.034637451171875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 16.0, 30.0, 45.0, 79.0, 125.0, 145.0, 182.0, 135.0, 102.0, 69.0, 42.0, 26.0, 7.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7855516076087952, -0.7596481442451477, -0.7337446212768555, -0.707841157913208, -0.6819376349449158, -0.6560341715812683, -0.6301306486129761, -0.6042271852493286, -0.5783237218856812, -0.5524202585220337, -0.5265167355537415, -0.500613272190094, -0.47470974922180176, -0.4488062858581543, -0.42290279269218445, -0.3969992995262146, -0.37109577655792236, -0.3451922833919525, -0.31928879022598267, -0.2933853268623352, -0.26748180389404297, -0.24157832562923431, -0.21567484736442566, -0.1897713541984558, -0.16386786103248596, -0.1379643678665161, -0.11206088215112686, -0.08615739643573761, -0.06025390326976776, -0.03435041010379791, -0.008446931838989258, 0.01745656132698059, 0.043359994888305664, 0.06926348805427551, 0.09516697376966476, 0.12107045948505402, 0.14697395265102386, 0.1728774458169937, 0.19878092408180237, 0.22468441724777222, 0.25058791041374207, 0.2764914035797119, 0.30239489674568176, 0.3282983899116516, 0.3542018532752991, 0.3801053762435913, 0.40600883960723877, 0.4319123327732086, 0.45781582593917847, 0.4837193191051483, 0.5096228122711182, 0.5355262756347656, 0.5614297986030579, 0.5873332619667053, 0.6132367849349976, 0.639140248298645, 0.6650437116622925, 0.6909471750259399, 0.7168506979942322, 0.7427541613578796, 0.7686576843261719, 0.7945611476898193, 0.8204646110534668, 0.846368134021759, 0.8722716569900513]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 8.0, 3.0, 3.0, 4.0, 9.0, 9.0, 12.0, 9.0, 13.0, 25.0, 19.0, 15.0, 29.0, 21.0, 36.0, 37.0, 40.0, 33.0, 48.0, 44.0, 47.0, 46.0, 45.0, 46.0, 50.0, 36.0, 41.0, 48.0, 37.0, 29.0, 33.0, 18.0, 16.0, 21.0, 16.0, 12.0, 9.0, 6.0, 10.0, 8.0, 6.0, 3.0, 4.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5056268572807312, -0.4914681017398834, -0.47730934619903564, -0.46315059065818787, -0.4489918351173401, -0.4348330497741699, -0.42067432403564453, -0.40651553869247437, -0.3923567831516266, -0.3781980276107788, -0.36403927206993103, -0.34988051652908325, -0.3357217609882355, -0.3215630054473877, -0.30740422010421753, -0.29324546456336975, -0.279086709022522, -0.2649279534816742, -0.2507691979408264, -0.23661044239997864, -0.22245167195796967, -0.2082929164171219, -0.1941341608762741, -0.17997539043426514, -0.16581666469573975, -0.15165790915489197, -0.1374991536140442, -0.12334039062261581, -0.10918162763118744, -0.09502287209033966, -0.08086411654949188, -0.06670535355806351, -0.05254659056663513, -0.038387831300497055, -0.024229073897004128, -0.0100703164935112, 0.004088442772626877, 0.018247202038764954, 0.03240595757961273, 0.04656472057104111, 0.060723476111888885, 0.07488223165273666, 0.08904099464416504, 0.10319975018501282, 0.1173585057258606, 0.13151726126670837, 0.14567601680755615, 0.15983478724956512, 0.1739935427904129, 0.18815229833126068, 0.20231105387210846, 0.21646982431411743, 0.2306285798549652, 0.244787335395813, 0.25894609093666077, 0.27310484647750854, 0.2872636020183563, 0.3014223575592041, 0.3155811131000519, 0.32973986864089966, 0.34389862418174744, 0.3580573797225952, 0.3722161650657654, 0.38637492060661316, 0.40053367614746094]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 11.0, 2.0, 9.0, 10.0, 17.0, 15.0, 17.0, 39.0, 54.0, 75.0, 113.0, 161.0, 265.0, 438.0, 751.0, 1366.0, 2558.0, 5541.0, 13979.0, 41672.0, 164183.0, 863012.0, 2043359.0, 827009.0, 163187.0, 41502.0, 14089.0, 5511.0, 2515.0, 1238.0, 654.0, 336.0, 229.0, 152.0, 84.0, 40.0, 35.0, 14.0, 11.0, 12.0, 7.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0743408203125, -0.07245826721191406, -0.07057571411132812, -0.06869316101074219, -0.06681060791015625, -0.06492805480957031, -0.06304550170898438, -0.06116294860839844, -0.0592803955078125, -0.05739784240722656, -0.055515289306640625, -0.05363273620605469, -0.05175018310546875, -0.04986763000488281, -0.047985076904296875, -0.04610252380371094, -0.044219970703125, -0.04233741760253906, -0.040454864501953125, -0.03857231140136719, -0.03668975830078125, -0.03480720520019531, -0.032924652099609375, -0.031042098999023438, -0.0291595458984375, -0.027276992797851562, -0.025394439697265625, -0.023511886596679688, -0.02162933349609375, -0.019746780395507812, -0.017864227294921875, -0.015981674194335938, -0.01409912109375, -0.012216567993164062, -0.010334014892578125, -0.008451461791992188, -0.00656890869140625, -0.0046863555908203125, -0.002803802490234375, -0.0009212493896484375, 0.0009613037109375, 0.0028438568115234375, 0.004726409912109375, 0.0066089630126953125, 0.00849151611328125, 0.010374069213867188, 0.012256622314453125, 0.014139175415039062, 0.016021728515625, 0.017904281616210938, 0.019786834716796875, 0.021669387817382812, 0.02355194091796875, 0.025434494018554688, 0.027317047119140625, 0.029199600219726562, 0.0310821533203125, 0.03296470642089844, 0.034847259521484375, 0.03672981262207031, 0.03861236572265625, 0.04049491882324219, 0.042377471923828125, 0.04426002502441406, 0.046142578125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 7.0, 10.0, 6.0, 15.0, 21.0, 22.0, 40.0, 50.0, 53.0, 53.0, 67.0, 54.0, 72.0, 72.0, 75.0, 55.0, 71.0, 57.0, 36.0, 39.0, 38.0, 23.0, 14.0, 18.0, 14.0, 5.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.072998046875, -0.07086467742919922, -0.06873130798339844, -0.06659793853759766, -0.06446456909179688, -0.062331199645996094, -0.06019783020019531, -0.05806446075439453, -0.05593109130859375, -0.05379772186279297, -0.05166435241699219, -0.049530982971191406, -0.047397613525390625, -0.045264244079589844, -0.04313087463378906, -0.04099750518798828, -0.0388641357421875, -0.03673076629638672, -0.03459739685058594, -0.032464027404785156, -0.030330657958984375, -0.028197288513183594, -0.026063919067382812, -0.02393054962158203, -0.02179718017578125, -0.01966381072998047, -0.017530441284179688, -0.015397071838378906, -0.013263702392578125, -0.011130332946777344, -0.008996963500976562, -0.006863594055175781, -0.004730224609375, -0.0025968551635742188, -0.0004634857177734375, 0.0016698837280273438, 0.003803253173828125, 0.005936622619628906, 0.008069992065429688, 0.010203361511230469, 0.01233673095703125, 0.014470100402832031, 0.016603469848632812, 0.018736839294433594, 0.020870208740234375, 0.023003578186035156, 0.025136947631835938, 0.02727031707763672, 0.0294036865234375, 0.03153705596923828, 0.03367042541503906, 0.035803794860839844, 0.037937164306640625, 0.040070533752441406, 0.04220390319824219, 0.04433727264404297, 0.04647064208984375, 0.04860401153564453, 0.05073738098144531, 0.052870750427246094, 0.055004119873046875, 0.057137489318847656, 0.05927085876464844, 0.06140422821044922, 0.06353759765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 16.0, 18.0, 36.0, 42.0, 64.0, 99.0, 169.0, 269.0, 450.0, 844.0, 1939.0, 4359.0, 12355.0, 41783.0, 194015.0, 1126460.0, 2183330.0, 500154.0, 91514.0, 23145.0, 7420.0, 2940.0, 1301.0, 639.0, 370.0, 194.0, 132.0, 87.0, 35.0, 37.0, 21.0, 18.0, 6.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0723876953125, -0.06982707977294922, -0.06726646423339844, -0.06470584869384766, -0.062145233154296875, -0.059584617614746094, -0.05702400207519531, -0.05446338653564453, -0.05190277099609375, -0.04934215545654297, -0.04678153991699219, -0.044220924377441406, -0.041660308837890625, -0.039099693298339844, -0.03653907775878906, -0.03397846221923828, -0.0314178466796875, -0.02885723114013672, -0.026296615600585938, -0.023736000061035156, -0.021175384521484375, -0.018614768981933594, -0.016054153442382812, -0.013493537902832031, -0.01093292236328125, -0.008372306823730469, -0.0058116912841796875, -0.0032510757446289062, -0.000690460205078125, 0.0018701553344726562, 0.0044307708740234375, 0.006991386413574219, 0.009552001953125, 0.012112617492675781, 0.014673233032226562, 0.017233848571777344, 0.019794464111328125, 0.022355079650878906, 0.024915695190429688, 0.02747631072998047, 0.03003692626953125, 0.03259754180908203, 0.03515815734863281, 0.037718772888183594, 0.040279388427734375, 0.042840003967285156, 0.04540061950683594, 0.04796123504638672, 0.0505218505859375, 0.05308246612548828, 0.05564308166503906, 0.058203697204589844, 0.060764312744140625, 0.0633249282836914, 0.06588554382324219, 0.06844615936279297, 0.07100677490234375, 0.07356739044189453, 0.07612800598144531, 0.0786886215209961, 0.08124923706054688, 0.08380985260009766, 0.08637046813964844, 0.08893108367919922, 0.09149169921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 1.0, 10.0, 8.0, 9.0, 18.0, 34.0, 46.0, 50.0, 67.0, 103.0, 116.0, 209.0, 302.0, 415.0, 505.0, 565.0, 446.0, 370.0, 241.0, 173.0, 107.0, 70.0, 55.0, 44.0, 29.0, 20.0, 12.0, 9.0, 11.0, 5.0, 8.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07757568359375, -0.07516765594482422, -0.07275962829589844, -0.07035160064697266, -0.06794357299804688, -0.0655355453491211, -0.06312751770019531, -0.06071949005126953, -0.05831146240234375, -0.05590343475341797, -0.05349540710449219, -0.051087379455566406, -0.048679351806640625, -0.046271324157714844, -0.04386329650878906, -0.04145526885986328, -0.0390472412109375, -0.03663921356201172, -0.03423118591308594, -0.031823158264160156, -0.029415130615234375, -0.027007102966308594, -0.024599075317382812, -0.02219104766845703, -0.01978302001953125, -0.01737499237060547, -0.014966964721679688, -0.012558937072753906, -0.010150909423828125, -0.007742881774902344, -0.0053348541259765625, -0.0029268264770507812, -0.000518798828125, 0.0018892288208007812, 0.0042972564697265625, 0.006705284118652344, 0.009113311767578125, 0.011521339416503906, 0.013929367065429688, 0.01633739471435547, 0.01874542236328125, 0.02115345001220703, 0.023561477661132812, 0.025969505310058594, 0.028377532958984375, 0.030785560607910156, 0.03319358825683594, 0.03560161590576172, 0.0380096435546875, 0.04041767120361328, 0.04282569885253906, 0.045233726501464844, 0.047641754150390625, 0.050049781799316406, 0.05245780944824219, 0.05486583709716797, 0.05727386474609375, 0.05968189239501953, 0.06208992004394531, 0.0644979476928711, 0.06690597534179688, 0.06931400299072266, 0.07172203063964844, 0.07413005828857422, 0.0765380859375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 11.0, 10.0, 14.0, 21.0, 32.0, 41.0, 63.0, 68.0, 87.0, 83.0, 100.0, 99.0, 81.0, 73.0, 54.0, 56.0, 30.0, 27.0, 21.0, 4.0, 10.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.4895792007446289, -0.47923341393470764, -0.4688876271247864, -0.4585418105125427, -0.44819602370262146, -0.4378502368927002, -0.42750445008277893, -0.41715866327285767, -0.406812846660614, -0.39646705985069275, -0.3861212730407715, -0.37577545642852783, -0.36542966961860657, -0.3550838828086853, -0.34473809599876404, -0.3343923091888428, -0.3240464925765991, -0.31370070576667786, -0.3033549189567566, -0.29300910234451294, -0.2826633155345917, -0.2723175287246704, -0.26197174191474915, -0.2516259551048279, -0.24128016829490662, -0.23093438148498535, -0.2205885797739029, -0.21024279296398163, -0.19989699125289917, -0.1895512044429779, -0.17920541763305664, -0.16885961592197418, -0.15851381421089172, -0.14816802740097046, -0.137822225689888, -0.12747643887996674, -0.11713063716888428, -0.10678485035896301, -0.09643905609846115, -0.08609326183795929, -0.07574746757745743, -0.06540167331695557, -0.055055879056453705, -0.04471008852124214, -0.03436429426074028, -0.02401850000023842, -0.013672709465026855, -0.003326915204524994, 0.007018879055976868, 0.01736467331647873, 0.02771046571433544, 0.038056258112192154, 0.048402052372694016, 0.05874784663319588, 0.06909363716840744, 0.0794394314289093, 0.08978522568941116, 0.10013101994991302, 0.11047681421041489, 0.12082260847091675, 0.131168395280838, 0.14151419699192047, 0.15185998380184174, 0.1622057855129242, 0.17255157232284546]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 9.0, 5.0, 8.0, 10.0, 22.0, 12.0, 14.0, 20.0, 21.0, 32.0, 29.0, 21.0, 40.0, 43.0, 49.0, 54.0, 49.0, 42.0, 48.0, 40.0, 52.0, 37.0, 36.0, 40.0, 35.0, 33.0, 28.0, 29.0, 30.0, 23.0, 19.0, 10.0, 17.0, 18.0, 2.0, 5.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23431766033172607, -0.22556370496749878, -0.21680974960327148, -0.20805580914020538, -0.1993018537759781, -0.1905478984117508, -0.1817939579486847, -0.1730400025844574, -0.1642860472202301, -0.1555320918560028, -0.1467781364917755, -0.1380241960287094, -0.12927024066448212, -0.12051628530025482, -0.11176233738660812, -0.10300838947296143, -0.09425443410873413, -0.08550047874450684, -0.07674653083086014, -0.06799258291721344, -0.059238627552986145, -0.05048467591404915, -0.04173072427511215, -0.032976772636175156, -0.02422282099723816, -0.015468869358301163, -0.006714917719364166, 0.00203903391957283, 0.010792985558509827, 0.019546937197446823, 0.02830088883638382, 0.037054840475320816, 0.04580879211425781, 0.05456274375319481, 0.0633166953921318, 0.0720706433057785, 0.0808245986700058, 0.0895785540342331, 0.09833250194787979, 0.10708644986152649, 0.11584040522575378, 0.12459436058998108, 0.13334831595420837, 0.14210225641727448, 0.15085621178150177, 0.15961016714572906, 0.16836410760879517, 0.17711806297302246, 0.18587201833724976, 0.19462597370147705, 0.20337992906570435, 0.21213386952877045, 0.22088782489299774, 0.22964178025722504, 0.23839572072029114, 0.24714967608451843, 0.2559036314487457, 0.264657586812973, 0.2734115421772003, 0.2821654975414276, 0.2909194231033325, 0.2996733784675598, 0.3084273338317871, 0.3171812891960144, 0.3259352445602417]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 5.0, 6.0, 12.0, 16.0, 23.0, 22.0, 36.0, 49.0, 86.0, 150.0, 211.0, 361.0, 700.0, 1203.0, 2324.0, 4487.0, 9174.0, 18896.0, 39471.0, 89892.0, 218605.0, 330226.0, 187975.0, 76542.0, 34687.0, 16410.0, 8223.0, 4013.0, 2193.0, 1052.0, 592.0, 321.0, 191.0, 117.0, 79.0, 51.0, 34.0, 34.0, 19.0, 13.0, 15.0, 10.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.1142578125, -0.11083793640136719, -0.10741806030273438, -0.10399818420410156, -0.10057830810546875, -0.09715843200683594, -0.09373855590820312, -0.09031867980957031, -0.0868988037109375, -0.08347892761230469, -0.08005905151367188, -0.07663917541503906, -0.07321929931640625, -0.06979942321777344, -0.06637954711914062, -0.06295967102050781, -0.059539794921875, -0.05611991882324219, -0.052700042724609375, -0.04928016662597656, -0.04586029052734375, -0.04244041442871094, -0.039020538330078125, -0.03560066223144531, -0.0321807861328125, -0.028760910034179688, -0.025341033935546875, -0.021921157836914062, -0.01850128173828125, -0.015081405639648438, -0.011661529541015625, -0.008241653442382812, -0.00482177734375, -0.0014019012451171875, 0.002017974853515625, 0.0054378509521484375, 0.00885772705078125, 0.012277603149414062, 0.015697479248046875, 0.019117355346679688, 0.0225372314453125, 0.025957107543945312, 0.029376983642578125, 0.03279685974121094, 0.03621673583984375, 0.03963661193847656, 0.043056488037109375, 0.04647636413574219, 0.049896240234375, 0.05331611633300781, 0.056735992431640625, 0.06015586853027344, 0.06357574462890625, 0.06699562072753906, 0.07041549682617188, 0.07383537292480469, 0.0772552490234375, 0.08067512512207031, 0.08409500122070312, 0.08751487731933594, 0.09093475341796875, 0.09435462951660156, 0.09777450561523438, 0.10119438171386719, 0.1046142578125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 6.0, 11.0, 9.0, 9.0, 15.0, 25.0, 32.0, 42.0, 41.0, 49.0, 55.0, 53.0, 67.0, 59.0, 63.0, 63.0, 56.0, 59.0, 46.0, 56.0, 32.0, 36.0, 33.0, 13.0, 19.0, 14.0, 15.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0665283203125, -0.06462907791137695, -0.0627298355102539, -0.06083059310913086, -0.05893135070800781, -0.057032108306884766, -0.05513286590576172, -0.05323362350463867, -0.051334381103515625, -0.04943513870239258, -0.04753589630126953, -0.045636653900146484, -0.04373741149902344, -0.04183816909790039, -0.039938926696777344, -0.0380396842956543, -0.03614044189453125, -0.0342411994934082, -0.032341957092285156, -0.03044271469116211, -0.028543472290039062, -0.026644229888916016, -0.02474498748779297, -0.022845745086669922, -0.020946502685546875, -0.019047260284423828, -0.01714801788330078, -0.015248775482177734, -0.013349533081054688, -0.01145029067993164, -0.009551048278808594, -0.007651805877685547, -0.0057525634765625, -0.003853321075439453, -0.0019540786743164062, -5.4836273193359375e-05, 0.0018444061279296875, 0.0037436485290527344, 0.005642890930175781, 0.007542133331298828, 0.009441375732421875, 0.011340618133544922, 0.013239860534667969, 0.015139102935791016, 0.017038345336914062, 0.01893758773803711, 0.020836830139160156, 0.022736072540283203, 0.02463531494140625, 0.026534557342529297, 0.028433799743652344, 0.03033304214477539, 0.03223228454589844, 0.034131526947021484, 0.03603076934814453, 0.03793001174926758, 0.039829254150390625, 0.04172849655151367, 0.04362773895263672, 0.045526981353759766, 0.04742622375488281, 0.04932546615600586, 0.051224708557128906, 0.05312395095825195, 0.055023193359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 5.0, 6.0, 5.0, 10.0, 11.0, 23.0, 23.0, 35.0, 36.0, 51.0, 99.0, 160.0, 295.0, 709.0, 1898.0, 5733.0, 19693.0, 69254.0, 263739.0, 457556.0, 165244.0, 44745.0, 12893.0, 3833.0, 1279.0, 512.0, 254.0, 140.0, 80.0, 59.0, 38.0, 29.0, 26.0, 21.0, 9.0, 8.0, 5.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.1658935546875, -0.16106033325195312, -0.15622711181640625, -0.15139389038085938, -0.1465606689453125, -0.14172744750976562, -0.13689422607421875, -0.13206100463867188, -0.127227783203125, -0.12239456176757812, -0.11756134033203125, -0.11272811889648438, -0.1078948974609375, -0.10306167602539062, -0.09822845458984375, -0.09339523315429688, -0.08856201171875, -0.08372879028320312, -0.07889556884765625, -0.07406234741210938, -0.0692291259765625, -0.06439590454101562, -0.05956268310546875, -0.054729461669921875, -0.049896240234375, -0.045063018798828125, -0.04022979736328125, -0.035396575927734375, -0.0305633544921875, -0.025730133056640625, -0.02089691162109375, -0.016063690185546875, -0.01123046875, -0.006397247314453125, -0.00156402587890625, 0.003269195556640625, 0.0081024169921875, 0.012935638427734375, 0.01776885986328125, 0.022602081298828125, 0.027435302734375, 0.032268524169921875, 0.03710174560546875, 0.041934967041015625, 0.0467681884765625, 0.051601409912109375, 0.05643463134765625, 0.061267852783203125, 0.06610107421875, 0.07093429565429688, 0.07576751708984375, 0.08060073852539062, 0.0854339599609375, 0.09026718139648438, 0.09510040283203125, 0.09993362426757812, 0.104766845703125, 0.10960006713867188, 0.11443328857421875, 0.11926651000976562, 0.1240997314453125, 0.12893295288085938, 0.13376617431640625, 0.13859939575195312, 0.1434326171875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 12.0, 6.0, 12.0, 11.0, 11.0, 11.0, 14.0, 16.0, 19.0, 32.0, 21.0, 25.0, 34.0, 41.0, 31.0, 35.0, 51.0, 56.0, 37.0, 44.0, 45.0, 30.0, 37.0, 36.0, 43.0, 30.0, 31.0, 34.0, 18.0, 27.0, 22.0, 18.0, 19.0, 13.0, 11.0, 10.0, 8.0, 9.0, 4.0, 6.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.126708984375, -0.12275505065917969, -0.11880111694335938, -0.11484718322753906, -0.11089324951171875, -0.10693931579589844, -0.10298538208007812, -0.09903144836425781, -0.0950775146484375, -0.09112358093261719, -0.08716964721679688, -0.08321571350097656, -0.07926177978515625, -0.07530784606933594, -0.07135391235351562, -0.06739997863769531, -0.063446044921875, -0.05949211120605469, -0.055538177490234375, -0.05158424377441406, -0.04763031005859375, -0.04367637634277344, -0.039722442626953125, -0.03576850891113281, -0.0318145751953125, -0.027860641479492188, -0.023906707763671875, -0.019952774047851562, -0.01599884033203125, -0.012044906616210938, -0.008090972900390625, -0.0041370391845703125, -0.00018310546875, 0.0037708282470703125, 0.007724761962890625, 0.011678695678710938, 0.01563262939453125, 0.019586563110351562, 0.023540496826171875, 0.027494430541992188, 0.0314483642578125, 0.03540229797363281, 0.039356231689453125, 0.04331016540527344, 0.04726409912109375, 0.05121803283691406, 0.055171966552734375, 0.05912590026855469, 0.063079833984375, 0.06703376770019531, 0.07098770141601562, 0.07494163513183594, 0.07889556884765625, 0.08284950256347656, 0.08680343627929688, 0.09075736999511719, 0.0947113037109375, 0.09866523742675781, 0.10261917114257812, 0.10657310485839844, 0.11052703857421875, 0.11448097229003906, 0.11843490600585938, 0.12238883972167969, 0.1263427734375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 10.0, 14.0, 30.0, 40.0, 54.0, 103.0, 163.0, 278.0, 465.0, 745.0, 1305.0, 2195.0, 3703.0, 6354.0, 10766.0, 17662.0, 29093.0, 50384.0, 91626.0, 167443.0, 229673.0, 188989.0, 106723.0, 58312.0, 32988.0, 19623.0, 12077.0, 7022.0, 4272.0, 2551.0, 1593.0, 909.0, 574.0, 319.0, 190.0, 108.0, 72.0, 51.0, 25.0, 15.0, 12.0, 6.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0347900390625, -0.0336155891418457, -0.032441139221191406, -0.03126668930053711, -0.030092239379882812, -0.028917789459228516, -0.02774333953857422, -0.026568889617919922, -0.025394439697265625, -0.024219989776611328, -0.02304553985595703, -0.021871089935302734, -0.020696640014648438, -0.01952219009399414, -0.018347740173339844, -0.017173290252685547, -0.01599884033203125, -0.014824390411376953, -0.013649940490722656, -0.01247549057006836, -0.011301040649414062, -0.010126590728759766, -0.008952140808105469, -0.007777690887451172, -0.006603240966796875, -0.005428791046142578, -0.004254341125488281, -0.0030798912048339844, -0.0019054412841796875, -0.0007309913635253906, 0.00044345855712890625, 0.0016179084777832031, 0.0027923583984375, 0.003966808319091797, 0.005141258239746094, 0.006315708160400391, 0.0074901580810546875, 0.008664608001708984, 0.009839057922363281, 0.011013507843017578, 0.012187957763671875, 0.013362407684326172, 0.014536857604980469, 0.015711307525634766, 0.016885757446289062, 0.01806020736694336, 0.019234657287597656, 0.020409107208251953, 0.02158355712890625, 0.022758007049560547, 0.023932456970214844, 0.02510690689086914, 0.026281356811523438, 0.027455806732177734, 0.02863025665283203, 0.029804706573486328, 0.030979156494140625, 0.03215360641479492, 0.03332805633544922, 0.034502506256103516, 0.03567695617675781, 0.03685140609741211, 0.038025856018066406, 0.0392003059387207, 0.040374755859375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 9.0, 13.0, 13.0, 14.0, 18.0, 21.0, 24.0, 33.0, 33.0, 50.0, 50.0, 60.0, 82.0, 83.0, 77.0, 80.0, 62.0, 63.0, 52.0, 37.0, 22.0, 20.0, 18.0, 12.0, 7.0, 11.0, 5.0, 3.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7762184143066406e-05, -1.7231330275535583e-05, -1.670047640800476e-05, -1.6169622540473938e-05, -1.5638768672943115e-05, -1.5107914805412292e-05, -1.457706093788147e-05, -1.4046207070350647e-05, -1.3515353202819824e-05, -1.2984499335289001e-05, -1.2453645467758179e-05, -1.1922791600227356e-05, -1.1391937732696533e-05, -1.086108386516571e-05, -1.0330229997634888e-05, -9.799376130104065e-06, -9.268522262573242e-06, -8.73766839504242e-06, -8.206814527511597e-06, -7.675960659980774e-06, -7.145106792449951e-06, -6.614252924919128e-06, -6.083399057388306e-06, -5.552545189857483e-06, -5.02169132232666e-06, -4.490837454795837e-06, -3.959983587265015e-06, -3.429129719734192e-06, -2.898275852203369e-06, -2.3674219846725464e-06, -1.8365681171417236e-06, -1.3057142496109009e-06, -7.748603820800781e-07, -2.4400651454925537e-07, 2.868473529815674e-07, 8.177012205123901e-07, 1.3485550880432129e-06, 1.8794089555740356e-06, 2.4102628231048584e-06, 2.941116690635681e-06, 3.471970558166504e-06, 4.002824425697327e-06, 4.533678293228149e-06, 5.064532160758972e-06, 5.595386028289795e-06, 6.126239895820618e-06, 6.6570937633514404e-06, 7.187947630882263e-06, 7.718801498413086e-06, 8.249655365943909e-06, 8.780509233474731e-06, 9.311363101005554e-06, 9.842216968536377e-06, 1.03730708360672e-05, 1.0903924703598022e-05, 1.1434778571128845e-05, 1.1965632438659668e-05, 1.249648630619049e-05, 1.3027340173721313e-05, 1.3558194041252136e-05, 1.4089047908782959e-05, 1.4619901776313782e-05, 1.5150755643844604e-05, 1.5681609511375427e-05, 1.621246337890625e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 6.0, 12.0, 15.0, 18.0, 42.0, 34.0, 63.0, 116.0, 156.0, 304.0, 540.0, 1122.0, 2270.0, 4840.0, 10345.0, 21413.0, 43857.0, 98756.0, 253715.0, 331563.0, 157604.0, 63400.0, 30040.0, 14675.0, 7002.0, 3375.0, 1536.0, 743.0, 422.0, 209.0, 129.0, 83.0, 45.0, 39.0, 24.0, 14.0, 12.0, 5.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04925537109375, -0.04772758483886719, -0.046199798583984375, -0.04467201232910156, -0.04314422607421875, -0.04161643981933594, -0.040088653564453125, -0.03856086730957031, -0.0370330810546875, -0.03550529479980469, -0.033977508544921875, -0.03244972229003906, -0.03092193603515625, -0.029394149780273438, -0.027866363525390625, -0.026338577270507812, -0.024810791015625, -0.023283004760742188, -0.021755218505859375, -0.020227432250976562, -0.01869964599609375, -0.017171859741210938, -0.015644073486328125, -0.014116287231445312, -0.0125885009765625, -0.011060714721679688, -0.009532928466796875, -0.008005142211914062, -0.00647735595703125, -0.0049495697021484375, -0.003421783447265625, -0.0018939971923828125, -0.0003662109375, 0.0011615753173828125, 0.002689361572265625, 0.0042171478271484375, 0.00574493408203125, 0.0072727203369140625, 0.008800506591796875, 0.010328292846679688, 0.0118560791015625, 0.013383865356445312, 0.014911651611328125, 0.016439437866210938, 0.01796722412109375, 0.019495010375976562, 0.021022796630859375, 0.022550582885742188, 0.024078369140625, 0.025606155395507812, 0.027133941650390625, 0.028661727905273438, 0.03018951416015625, 0.03171730041503906, 0.033245086669921875, 0.03477287292480469, 0.0363006591796875, 0.03782844543457031, 0.039356231689453125, 0.04088401794433594, 0.04241180419921875, 0.04393959045410156, 0.045467376708984375, 0.04699516296386719, 0.04852294921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 8.0, 10.0, 13.0, 17.0, 24.0, 23.0, 26.0, 44.0, 48.0, 54.0, 76.0, 73.0, 73.0, 76.0, 65.0, 60.0, 48.0, 58.0, 33.0, 40.0, 32.0, 21.0, 17.0, 16.0, 9.0, 13.0, 5.0, 4.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052703857421875, -0.05108022689819336, -0.04945659637451172, -0.04783296585083008, -0.04620933532714844, -0.0445857048034668, -0.042962074279785156, -0.041338443756103516, -0.039714813232421875, -0.038091182708740234, -0.036467552185058594, -0.03484392166137695, -0.03322029113769531, -0.03159666061401367, -0.02997303009033203, -0.02834939956665039, -0.02672576904296875, -0.02510213851928711, -0.02347850799560547, -0.021854877471923828, -0.020231246948242188, -0.018607616424560547, -0.016983985900878906, -0.015360355377197266, -0.013736724853515625, -0.012113094329833984, -0.010489463806152344, -0.008865833282470703, -0.0072422027587890625, -0.005618572235107422, -0.003994941711425781, -0.0023713111877441406, -0.0007476806640625, 0.0008759498596191406, 0.0024995803833007812, 0.004123210906982422, 0.0057468414306640625, 0.007370471954345703, 0.008994102478027344, 0.010617733001708984, 0.012241363525390625, 0.013864994049072266, 0.015488624572753906, 0.017112255096435547, 0.018735885620117188, 0.020359516143798828, 0.02198314666748047, 0.02360677719116211, 0.02523040771484375, 0.02685403823852539, 0.02847766876220703, 0.030101299285888672, 0.03172492980957031, 0.03334856033325195, 0.034972190856933594, 0.036595821380615234, 0.038219451904296875, 0.039843082427978516, 0.041466712951660156, 0.0430903434753418, 0.04471397399902344, 0.04633760452270508, 0.04796123504638672, 0.04958486557006836, 0.05120849609375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 11.0, 17.0, 26.0, 66.0, 115.0, 159.0, 172.0, 160.0, 121.0, 86.0, 34.0, 28.0, 13.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0831377506256104, -1.0556749105453491, -1.0282119512557983, -1.000749111175537, -0.9732862114906311, -0.9458233714103699, -0.9183604717254639, -0.8908976316452026, -0.8634347319602966, -0.8359718322753906, -0.8085089921951294, -0.7810460925102234, -0.7535831928253174, -0.7261203527450562, -0.6986574530601501, -0.6711945533752441, -0.6437317132949829, -0.6162688136100769, -0.5888059735298157, -0.5613430738449097, -0.5338801741600037, -0.5064173340797424, -0.4789544343948364, -0.4514915645122528, -0.4240286350250244, -0.3965657651424408, -0.3691028654575348, -0.34163999557495117, -0.31417712569236755, -0.28671425580978394, -0.25925135612487793, -0.2317884862422943, -0.2043256163597107, -0.17686273157596588, -0.14939986169338226, -0.12193697690963745, -0.09447409957647324, -0.06701122224330902, -0.03954833745956421, -0.01208546757698059, 0.015377417206764221, 0.042840294539928436, 0.07030317187309265, 0.09776605665683746, 0.12522894144058228, 0.1526918113231659, 0.1801546961069107, 0.20761756598949432, 0.23508045077323914, 0.26254332065582275, 0.29000622034072876, 0.3174690902233124, 0.344931960105896, 0.372394859790802, 0.3998577296733856, 0.42732059955596924, 0.45478349924087524, 0.48224636912345886, 0.5097092390060425, 0.5371721386909485, 0.5646350383758545, 0.5920978784561157, 0.6195607781410217, 0.6470236778259277, 0.674486517906189]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 3.0, 5.0, 8.0, 9.0, 19.0, 7.0, 18.0, 17.0, 18.0, 22.0, 32.0, 30.0, 28.0, 39.0, 35.0, 30.0, 51.0, 43.0, 40.0, 30.0, 44.0, 36.0, 30.0, 49.0, 41.0, 29.0, 23.0, 27.0, 33.0, 27.0, 26.0, 20.0, 18.0, 17.0, 18.0, 5.0, 9.0, 14.0, 4.0, 11.0, 3.0, 2.0, 3.0, 4.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.38126516342163086, -0.3689071238040924, -0.35654905438423157, -0.3441910147666931, -0.33183297514915466, -0.3194749355316162, -0.30711686611175537, -0.2947588264942169, -0.28240078687667847, -0.27004274725914, -0.2576846778392792, -0.24532663822174072, -0.23296859860420227, -0.22061054408550262, -0.20825248956680298, -0.19589444994926453, -0.18353639543056488, -0.17117834091186523, -0.15882030129432678, -0.14646224677562714, -0.13410420715808868, -0.12174615263938904, -0.10938810557126999, -0.09703005850315094, -0.08467201143503189, -0.07231396436691284, -0.05995591729879379, -0.047597866505384445, -0.035239819437265396, -0.022881772369146347, -0.010523721575737, 0.0018343254923820496, 0.014192372560501099, 0.026550419628620148, 0.0389084666967392, 0.051266517490148544, 0.0636245608329773, 0.07598261535167694, 0.08834066241979599, 0.10069870948791504, 0.11305675655603409, 0.12541480362415314, 0.13777285814285278, 0.15013089776039124, 0.16248895227909088, 0.17484699189662933, 0.18720504641532898, 0.19956308603286743, 0.21192114055156708, 0.22427919507026672, 0.23663723468780518, 0.24899528920650482, 0.26135334372520447, 0.2737113833427429, 0.28606942296028137, 0.2984274625778198, 0.31078553199768066, 0.3231435716152191, 0.33550164103507996, 0.3478596806526184, 0.36021772027015686, 0.3725757598876953, 0.38493382930755615, 0.3972918689250946, 0.40964990854263306]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 3.0, 7.0, 12.0, 18.0, 24.0, 56.0, 58.0, 81.0, 113.0, 182.0, 267.0, 452.0, 773.0, 1531.0, 2961.0, 6736.0, 17229.0, 53810.0, 235288.0, 1203810.0, 1952502.0, 557337.0, 110782.0, 30540.0, 10770.0, 4436.0, 2049.0, 983.0, 576.0, 359.0, 218.0, 108.0, 71.0, 39.0, 41.0, 18.0, 17.0, 5.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08343505859375, -0.0812540054321289, -0.07907295227050781, -0.07689189910888672, -0.07471084594726562, -0.07252979278564453, -0.07034873962402344, -0.06816768646240234, -0.06598663330078125, -0.06380558013916016, -0.06162452697753906, -0.05944347381591797, -0.057262420654296875, -0.05508136749267578, -0.05290031433105469, -0.050719261169433594, -0.0485382080078125, -0.046357154846191406, -0.04417610168457031, -0.04199504852294922, -0.039813995361328125, -0.03763294219970703, -0.03545188903808594, -0.033270835876464844, -0.03108978271484375, -0.028908729553222656, -0.026727676391601562, -0.02454662322998047, -0.022365570068359375, -0.02018451690673828, -0.018003463745117188, -0.015822410583496094, -0.013641357421875, -0.011460304260253906, -0.009279251098632812, -0.007098197937011719, -0.004917144775390625, -0.0027360916137695312, -0.0005550384521484375, 0.0016260147094726562, 0.00380706787109375, 0.005988121032714844, 0.008169174194335938, 0.010350227355957031, 0.012531280517578125, 0.014712333679199219, 0.016893386840820312, 0.019074440002441406, 0.0212554931640625, 0.023436546325683594, 0.025617599487304688, 0.02779865264892578, 0.029979705810546875, 0.03216075897216797, 0.03434181213378906, 0.036522865295410156, 0.03870391845703125, 0.040884971618652344, 0.04306602478027344, 0.04524707794189453, 0.047428131103515625, 0.04960918426513672, 0.05179023742675781, 0.053971290588378906, 0.05615234375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 5.0, 5.0, 6.0, 12.0, 7.0, 16.0, 18.0, 17.0, 25.0, 35.0, 41.0, 54.0, 41.0, 50.0, 52.0, 57.0, 48.0, 63.0, 64.0, 68.0, 51.0, 37.0, 40.0, 37.0, 27.0, 33.0, 12.0, 28.0, 16.0, 6.0, 10.0, 6.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0721435546875, -0.07018136978149414, -0.06821918487548828, -0.06625699996948242, -0.06429481506347656, -0.0623326301574707, -0.060370445251464844, -0.058408260345458984, -0.056446075439453125, -0.054483890533447266, -0.052521705627441406, -0.05055952072143555, -0.04859733581542969, -0.04663515090942383, -0.04467296600341797, -0.04271078109741211, -0.04074859619140625, -0.03878641128540039, -0.03682422637939453, -0.03486204147338867, -0.03289985656738281, -0.030937671661376953, -0.028975486755371094, -0.027013301849365234, -0.025051116943359375, -0.023088932037353516, -0.021126747131347656, -0.019164562225341797, -0.017202377319335938, -0.015240192413330078, -0.013278007507324219, -0.01131582260131836, -0.0093536376953125, -0.007391452789306641, -0.005429267883300781, -0.003467082977294922, -0.0015048980712890625, 0.0004572868347167969, 0.0024194717407226562, 0.004381656646728516, 0.006343841552734375, 0.008306026458740234, 0.010268211364746094, 0.012230396270751953, 0.014192581176757812, 0.016154766082763672, 0.01811695098876953, 0.02007913589477539, 0.02204132080078125, 0.02400350570678711, 0.02596569061279297, 0.027927875518798828, 0.029890060424804688, 0.03185224533081055, 0.033814430236816406, 0.035776615142822266, 0.037738800048828125, 0.039700984954833984, 0.041663169860839844, 0.0436253547668457, 0.04558753967285156, 0.04754972457885742, 0.04951190948486328, 0.05147409439086914, 0.053436279296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 7.0, 15.0, 24.0, 40.0, 54.0, 95.0, 175.0, 274.0, 592.0, 1410.0, 3838.0, 12662.0, 53568.0, 327165.0, 2144763.0, 1412599.0, 188643.0, 34404.0, 9016.0, 2794.0, 1062.0, 462.0, 236.0, 144.0, 91.0, 40.0, 32.0, 19.0, 14.0, 8.0, 7.0, 5.0, 6.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11309814453125, -0.10943317413330078, -0.10576820373535156, -0.10210323333740234, -0.09843826293945312, -0.0947732925415039, -0.09110832214355469, -0.08744335174560547, -0.08377838134765625, -0.08011341094970703, -0.07644844055175781, -0.0727834701538086, -0.06911849975585938, -0.06545352935791016, -0.06178855895996094, -0.05812358856201172, -0.0544586181640625, -0.05079364776611328, -0.04712867736816406, -0.043463706970214844, -0.039798736572265625, -0.036133766174316406, -0.03246879577636719, -0.02880382537841797, -0.02513885498046875, -0.02147388458251953, -0.017808914184570312, -0.014143943786621094, -0.010478973388671875, -0.006814002990722656, -0.0031490325927734375, 0.0005159378051757812, 0.004180908203125, 0.007845878601074219, 0.011510848999023438, 0.015175819396972656, 0.018840789794921875, 0.022505760192871094, 0.026170730590820312, 0.02983570098876953, 0.03350067138671875, 0.03716564178466797, 0.04083061218261719, 0.044495582580566406, 0.048160552978515625, 0.051825523376464844, 0.05549049377441406, 0.05915546417236328, 0.0628204345703125, 0.06648540496826172, 0.07015037536621094, 0.07381534576416016, 0.07748031616210938, 0.0811452865600586, 0.08481025695800781, 0.08847522735595703, 0.09214019775390625, 0.09580516815185547, 0.09947013854980469, 0.1031351089477539, 0.10680007934570312, 0.11046504974365234, 0.11413002014160156, 0.11779499053955078, 0.1214599609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 10.0, 16.0, 28.0, 35.0, 70.0, 97.0, 197.0, 351.0, 552.0, 786.0, 720.0, 506.0, 294.0, 155.0, 107.0, 62.0, 37.0, 13.0, 14.0, 9.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0843505859375, -0.08009147644042969, -0.07583236694335938, -0.07157325744628906, -0.06731414794921875, -0.06305503845214844, -0.058795928955078125, -0.05453681945800781, -0.0502777099609375, -0.04601860046386719, -0.041759490966796875, -0.03750038146972656, -0.03324127197265625, -0.028982162475585938, -0.024723052978515625, -0.020463943481445312, -0.016204833984375, -0.011945724487304688, -0.007686614990234375, -0.0034275054931640625, 0.00083160400390625, 0.0050907135009765625, 0.009349822998046875, 0.013608932495117188, 0.0178680419921875, 0.022127151489257812, 0.026386260986328125, 0.030645370483398438, 0.03490447998046875, 0.03916358947753906, 0.043422698974609375, 0.04768180847167969, 0.05194091796875, 0.05620002746582031, 0.060459136962890625, 0.06471824645996094, 0.06897735595703125, 0.07323646545410156, 0.07749557495117188, 0.08175468444824219, 0.0860137939453125, 0.09027290344238281, 0.09453201293945312, 0.09879112243652344, 0.10305023193359375, 0.10730934143066406, 0.11156845092773438, 0.11582756042480469, 0.120086669921875, 0.12434577941894531, 0.12860488891601562, 0.13286399841308594, 0.13712310791015625, 0.14138221740722656, 0.14564132690429688, 0.1499004364013672, 0.1541595458984375, 0.1584186553955078, 0.16267776489257812, 0.16693687438964844, 0.17119598388671875, 0.17545509338378906, 0.17971420288085938, 0.1839733123779297, 0.188232421875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 18.0, 48.0, 87.0, 145.0, 189.0, 206.0, 131.0, 92.0, 41.0, 30.0, 8.0, 7.0, 6.0, 3.0], "bins": [-1.4769352674484253, -1.450332760810852, -1.4237301349639893, -1.397127628326416, -1.3705251216888428, -1.34392249584198, -1.3173199892044067, -1.290717363357544, -1.2641148567199707, -1.2375123500823975, -1.2109097242355347, -1.1843072175979614, -1.1577047109603882, -1.1311020851135254, -1.1044995784759521, -1.077897071838379, -1.0512944459915161, -1.0246919393539429, -0.9980893731117249, -0.9714868068695068, -0.9448842406272888, -0.9182816743850708, -0.8916791677474976, -0.8650766015052795, -0.8384740948677063, -0.8118715286254883, -0.785269021987915, -0.758666455745697, -0.732063889503479, -0.7054613828659058, -0.6788588166236877, -0.6522562503814697, -0.6256537437438965, -0.5990511775016785, -0.5724486708641052, -0.5458461046218872, -0.5192435383796692, -0.49264100193977356, -0.46603846549987793, -0.4394358992576599, -0.4128333330154419, -0.38623079657554626, -0.35962823033332825, -0.3330256938934326, -0.3064231276512146, -0.27982059121131897, -0.25321805477142334, -0.22661548852920532, -0.2000129222869873, -0.17341037094593048, -0.14680781960487366, -0.12020527571439743, -0.0936027243733406, -0.06700018048286438, -0.040397629141807556, -0.013795077800750732, 0.012807473540306091, 0.039410024881362915, 0.06601257622241974, 0.09261512011289597, 0.11921767145395279, 0.14582021534442902, 0.17242276668548584, 0.19902531802654266, 0.2256278693675995]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 2.0, 10.0, 11.0, 12.0, 16.0, 17.0, 13.0, 12.0, 6.0, 15.0, 18.0, 30.0, 22.0, 29.0, 29.0, 35.0, 36.0, 28.0, 38.0, 43.0, 35.0, 33.0, 29.0, 42.0, 41.0, 32.0, 51.0, 37.0, 36.0, 34.0, 28.0, 19.0, 22.0, 25.0, 12.0, 16.0, 19.0, 14.0, 12.0, 5.0, 7.0, 5.0, 7.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.28897976875305176, -0.2802063524723053, -0.2714329659938812, -0.26265954971313477, -0.2538861632347107, -0.24511274695396423, -0.23633934557437897, -0.2275659441947937, -0.21879254281520844, -0.21001914143562317, -0.2012457400560379, -0.19247233867645264, -0.18369892239570618, -0.1749255359172821, -0.16615211963653564, -0.15737871825695038, -0.1486053168773651, -0.13983191549777985, -0.13105851411819458, -0.12228510528802872, -0.11351170390844345, -0.10473830252885818, -0.09596489369869232, -0.08719149231910706, -0.07841809093952179, -0.06964468955993652, -0.06087128445506096, -0.052097879350185394, -0.04332447797060013, -0.03455107659101486, -0.025777671486139297, -0.017004266381263733, -0.008230865001678467, 0.0005425382405519485, 0.009315941482782364, 0.01808934472501278, 0.026862747967243195, 0.03563614934682846, 0.044409554451704025, 0.05318295955657959, 0.061956360936164856, 0.07072976231575012, 0.07950316369533539, 0.08827657252550125, 0.09704997390508652, 0.10582337528467178, 0.11459678411483765, 0.12337018549442291, 0.13214358687400818, 0.14091698825359344, 0.1496903896331787, 0.15846379101276398, 0.16723719239234924, 0.1760106086730957, 0.18478401005268097, 0.19355741143226624, 0.2023308128118515, 0.21110421419143677, 0.21987761557102203, 0.2286510169506073, 0.23742443323135376, 0.24619781970977783, 0.2549712359905243, 0.26374465227127075, 0.2725180387496948]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 6.0, 4.0, 3.0, 11.0, 8.0, 10.0, 17.0, 32.0, 39.0, 52.0, 60.0, 116.0, 226.0, 321.0, 619.0, 1259.0, 2504.0, 4861.0, 9778.0, 20522.0, 42504.0, 92419.0, 196110.0, 287711.0, 205048.0, 97290.0, 44710.0, 21394.0, 10439.0, 5080.0, 2526.0, 1281.0, 627.0, 366.0, 187.0, 143.0, 76.0, 58.0, 39.0, 21.0, 29.0, 9.0, 19.0, 5.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.11175537109375, -0.10832023620605469, -0.10488510131835938, -0.10144996643066406, -0.09801483154296875, -0.09457969665527344, -0.09114456176757812, -0.08770942687988281, -0.0842742919921875, -0.08083915710449219, -0.07740402221679688, -0.07396888732910156, -0.07053375244140625, -0.06709861755371094, -0.06366348266601562, -0.06022834777832031, -0.056793212890625, -0.05335807800292969, -0.049922943115234375, -0.04648780822753906, -0.04305267333984375, -0.03961753845214844, -0.036182403564453125, -0.03274726867675781, -0.0293121337890625, -0.025876998901367188, -0.022441864013671875, -0.019006729125976562, -0.01557159423828125, -0.012136459350585938, -0.008701324462890625, -0.0052661895751953125, -0.0018310546875, 0.0016040802001953125, 0.005039215087890625, 0.008474349975585938, 0.01190948486328125, 0.015344619750976562, 0.018779754638671875, 0.022214889526367188, 0.0256500244140625, 0.029085159301757812, 0.032520294189453125, 0.03595542907714844, 0.03939056396484375, 0.04282569885253906, 0.046260833740234375, 0.04969596862792969, 0.053131103515625, 0.05656623840332031, 0.060001373291015625, 0.06343650817871094, 0.06687164306640625, 0.07030677795410156, 0.07374191284179688, 0.07717704772949219, 0.0806121826171875, 0.08404731750488281, 0.08748245239257812, 0.09091758728027344, 0.09435272216796875, 0.09778785705566406, 0.10122299194335938, 0.10465812683105469, 0.10809326171875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 5.0, 3.0, 8.0, 13.0, 17.0, 23.0, 23.0, 28.0, 26.0, 25.0, 25.0, 46.0, 49.0, 39.0, 52.0, 54.0, 50.0, 55.0, 71.0, 44.0, 52.0, 40.0, 37.0, 33.0, 33.0, 20.0, 27.0, 26.0, 18.0, 13.0, 12.0, 8.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.065185546875, -0.06336307525634766, -0.06154060363769531, -0.05971813201904297, -0.057895660400390625, -0.05607318878173828, -0.05425071716308594, -0.052428245544433594, -0.05060577392578125, -0.048783302307128906, -0.04696083068847656, -0.04513835906982422, -0.043315887451171875, -0.04149341583251953, -0.03967094421386719, -0.037848472595214844, -0.0360260009765625, -0.034203529357910156, -0.03238105773925781, -0.03055858612060547, -0.028736114501953125, -0.02691364288330078, -0.025091171264648438, -0.023268699645996094, -0.02144622802734375, -0.019623756408691406, -0.017801284790039062, -0.01597881317138672, -0.014156341552734375, -0.012333869934082031, -0.010511398315429688, -0.008688926696777344, -0.006866455078125, -0.005043983459472656, -0.0032215118408203125, -0.0013990402221679688, 0.000423431396484375, 0.0022459030151367188, 0.0040683746337890625, 0.005890846252441406, 0.00771331787109375, 0.009535789489746094, 0.011358261108398438, 0.013180732727050781, 0.015003204345703125, 0.01682567596435547, 0.018648147583007812, 0.020470619201660156, 0.0222930908203125, 0.024115562438964844, 0.025938034057617188, 0.02776050567626953, 0.029582977294921875, 0.03140544891357422, 0.03322792053222656, 0.035050392150878906, 0.03687286376953125, 0.038695335388183594, 0.04051780700683594, 0.04234027862548828, 0.044162750244140625, 0.04598522186279297, 0.04780769348144531, 0.049630165100097656, 0.05145263671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 6.0, 2.0, 3.0, 11.0, 11.0, 7.0, 22.0, 21.0, 33.0, 51.0, 92.0, 157.0, 442.0, 1284.0, 4265.0, 14479.0, 52397.0, 208444.0, 485893.0, 208197.0, 51850.0, 14498.0, 4179.0, 1268.0, 442.0, 214.0, 87.0, 64.0, 36.0, 24.0, 24.0, 13.0, 8.0, 2.0, 9.0, 2.0, 10.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.228271484375, -0.2220172882080078, -0.21576309204101562, -0.20950889587402344, -0.20325469970703125, -0.19700050354003906, -0.19074630737304688, -0.1844921112060547, -0.1782379150390625, -0.1719837188720703, -0.16572952270507812, -0.15947532653808594, -0.15322113037109375, -0.14696693420410156, -0.14071273803710938, -0.1344585418701172, -0.128204345703125, -0.12195014953613281, -0.11569595336914062, -0.10944175720214844, -0.10318756103515625, -0.09693336486816406, -0.09067916870117188, -0.08442497253417969, -0.0781707763671875, -0.07191658020019531, -0.06566238403320312, -0.05940818786621094, -0.05315399169921875, -0.04689979553222656, -0.040645599365234375, -0.03439140319824219, -0.02813720703125, -0.021883010864257812, -0.015628814697265625, -0.009374618530273438, -0.00312042236328125, 0.0031337738037109375, 0.009387969970703125, 0.015642166137695312, 0.0218963623046875, 0.028150558471679688, 0.034404754638671875, 0.04065895080566406, 0.04691314697265625, 0.05316734313964844, 0.059421539306640625, 0.06567573547363281, 0.071929931640625, 0.07818412780761719, 0.08443832397460938, 0.09069252014160156, 0.09694671630859375, 0.10320091247558594, 0.10945510864257812, 0.11570930480957031, 0.1219635009765625, 0.1282176971435547, 0.13447189331054688, 0.14072608947753906, 0.14698028564453125, 0.15323448181152344, 0.15948867797851562, 0.1657428741455078, 0.1719970703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 10.0, 4.0, 18.0, 17.0, 20.0, 24.0, 43.0, 35.0, 44.0, 36.0, 65.0, 55.0, 51.0, 57.0, 56.0, 65.0, 60.0, 47.0, 46.0, 40.0, 41.0, 36.0, 24.0, 20.0, 17.0, 7.0, 17.0, 12.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.207763671875, -0.20069503784179688, -0.19362640380859375, -0.18655776977539062, -0.1794891357421875, -0.17242050170898438, -0.16535186767578125, -0.15828323364257812, -0.151214599609375, -0.14414596557617188, -0.13707733154296875, -0.13000869750976562, -0.1229400634765625, -0.11587142944335938, -0.10880279541015625, -0.10173416137695312, -0.09466552734375, -0.08759689331054688, -0.08052825927734375, -0.07345962524414062, -0.0663909912109375, -0.059322357177734375, -0.05225372314453125, -0.045185089111328125, -0.038116455078125, -0.031047821044921875, -0.02397918701171875, -0.016910552978515625, -0.0098419189453125, -0.002773284912109375, 0.00429534912109375, 0.011363983154296875, 0.0184326171875, 0.025501251220703125, 0.03256988525390625, 0.039638519287109375, 0.0467071533203125, 0.053775787353515625, 0.06084442138671875, 0.06791305541992188, 0.074981689453125, 0.08205032348632812, 0.08911895751953125, 0.09618759155273438, 0.1032562255859375, 0.11032485961914062, 0.11739349365234375, 0.12446212768554688, 0.13153076171875, 0.13859939575195312, 0.14566802978515625, 0.15273666381835938, 0.1598052978515625, 0.16687393188476562, 0.17394256591796875, 0.18101119995117188, 0.188079833984375, 0.19514846801757812, 0.20221710205078125, 0.20928573608398438, 0.2163543701171875, 0.22342300415039062, 0.23049163818359375, 0.23756027221679688, 0.24462890625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 7.0, 7.0, 13.0, 16.0, 16.0, 27.0, 46.0, 77.0, 133.0, 221.0, 393.0, 653.0, 1143.0, 2189.0, 4050.0, 7598.0, 14385.0, 26961.0, 50326.0, 99880.0, 194192.0, 261506.0, 186382.0, 94805.0, 47899.0, 25636.0, 13818.0, 7412.0, 4014.0, 2078.0, 1138.0, 636.0, 348.0, 188.0, 150.0, 73.0, 45.0, 28.0, 17.0, 16.0, 7.0, 6.0, 5.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.050262451171875, -0.04861259460449219, -0.046962738037109375, -0.04531288146972656, -0.04366302490234375, -0.04201316833496094, -0.040363311767578125, -0.03871345520019531, -0.0370635986328125, -0.03541374206542969, -0.033763885498046875, -0.03211402893066406, -0.03046417236328125, -0.028814315795898438, -0.027164459228515625, -0.025514602661132812, -0.02386474609375, -0.022214889526367188, -0.020565032958984375, -0.018915176391601562, -0.01726531982421875, -0.015615463256835938, -0.013965606689453125, -0.012315750122070312, -0.0106658935546875, -0.009016036987304688, -0.007366180419921875, -0.0057163238525390625, -0.00406646728515625, -0.0024166107177734375, -0.000766754150390625, 0.0008831024169921875, 0.002532958984375, 0.0041828155517578125, 0.005832672119140625, 0.0074825286865234375, 0.00913238525390625, 0.010782241821289062, 0.012432098388671875, 0.014081954956054688, 0.0157318115234375, 0.017381668090820312, 0.019031524658203125, 0.020681381225585938, 0.02233123779296875, 0.023981094360351562, 0.025630950927734375, 0.027280807495117188, 0.0289306640625, 0.030580520629882812, 0.032230377197265625, 0.03388023376464844, 0.03553009033203125, 0.03717994689941406, 0.038829803466796875, 0.04047966003417969, 0.0421295166015625, 0.04377937316894531, 0.045429229736328125, 0.04707908630371094, 0.04872894287109375, 0.05037879943847656, 0.052028656005859375, 0.05367851257324219, 0.055328369140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 7.0, 9.0, 9.0, 6.0, 10.0, 10.0, 20.0, 29.0, 16.0, 38.0, 41.0, 50.0, 69.0, 75.0, 76.0, 68.0, 77.0, 71.0, 64.0, 50.0, 32.0, 36.0, 29.0, 23.0, 15.0, 11.0, 11.0, 11.0, 8.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7523765563964844e-05, -1.6928650438785553e-05, -1.6333535313606262e-05, -1.573842018842697e-05, -1.514330506324768e-05, -1.454818993806839e-05, -1.3953074812889099e-05, -1.3357959687709808e-05, -1.2762844562530518e-05, -1.2167729437351227e-05, -1.1572614312171936e-05, -1.0977499186992645e-05, -1.0382384061813354e-05, -9.787268936634064e-06, -9.192153811454773e-06, -8.597038686275482e-06, -8.001923561096191e-06, -7.406808435916901e-06, -6.81169331073761e-06, -6.216578185558319e-06, -5.621463060379028e-06, -5.0263479351997375e-06, -4.431232810020447e-06, -3.836117684841156e-06, -3.2410025596618652e-06, -2.6458874344825745e-06, -2.0507723093032837e-06, -1.455657184123993e-06, -8.605420589447021e-07, -2.654269337654114e-07, 3.296881914138794e-07, 9.248033165931702e-07, 1.519918441772461e-06, 2.1150335669517517e-06, 2.7101486921310425e-06, 3.3052638173103333e-06, 3.900378942489624e-06, 4.495494067668915e-06, 5.0906091928482056e-06, 5.685724318027496e-06, 6.280839443206787e-06, 6.875954568386078e-06, 7.471069693565369e-06, 8.06618481874466e-06, 8.66129994392395e-06, 9.256415069103241e-06, 9.851530194282532e-06, 1.0446645319461823e-05, 1.1041760444641113e-05, 1.1636875569820404e-05, 1.2231990694999695e-05, 1.2827105820178986e-05, 1.3422220945358276e-05, 1.4017336070537567e-05, 1.4612451195716858e-05, 1.5207566320896149e-05, 1.580268144607544e-05, 1.639779657125473e-05, 1.699291169643402e-05, 1.7588026821613312e-05, 1.8183141946792603e-05, 1.8778257071971893e-05, 1.9373372197151184e-05, 1.9968487322330475e-05, 2.0563602447509766e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 12.0, 20.0, 27.0, 34.0, 63.0, 128.0, 202.0, 494.0, 958.0, 2355.0, 5877.0, 14462.0, 36646.0, 92887.0, 245356.0, 359999.0, 177110.0, 66867.0, 26792.0, 10678.0, 4253.0, 1798.0, 737.0, 352.0, 162.0, 109.0, 66.0, 32.0, 24.0, 18.0, 9.0, 3.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0750732421875, -0.07282066345214844, -0.07056808471679688, -0.06831550598144531, -0.06606292724609375, -0.06381034851074219, -0.061557769775390625, -0.05930519104003906, -0.0570526123046875, -0.05480003356933594, -0.052547454833984375, -0.05029487609863281, -0.04804229736328125, -0.04578971862792969, -0.043537139892578125, -0.04128456115722656, -0.039031982421875, -0.03677940368652344, -0.034526824951171875, -0.03227424621582031, -0.03002166748046875, -0.027769088745117188, -0.025516510009765625, -0.023263931274414062, -0.0210113525390625, -0.018758773803710938, -0.016506195068359375, -0.014253616333007812, -0.01200103759765625, -0.009748458862304688, -0.007495880126953125, -0.0052433013916015625, -0.00299072265625, -0.0007381439208984375, 0.001514434814453125, 0.0037670135498046875, 0.00601959228515625, 0.008272171020507812, 0.010524749755859375, 0.012777328491210938, 0.0150299072265625, 0.017282485961914062, 0.019535064697265625, 0.021787643432617188, 0.02404022216796875, 0.026292800903320312, 0.028545379638671875, 0.030797958374023438, 0.033050537109375, 0.03530311584472656, 0.037555694580078125, 0.03980827331542969, 0.04206085205078125, 0.04431343078613281, 0.046566009521484375, 0.04881858825683594, 0.0510711669921875, 0.05332374572753906, 0.055576324462890625, 0.05782890319824219, 0.06008148193359375, 0.06233406066894531, 0.06458663940429688, 0.06683921813964844, 0.069091796875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 5.0, 8.0, 10.0, 12.0, 14.0, 15.0, 21.0, 19.0, 21.0, 33.0, 50.0, 50.0, 66.0, 84.0, 82.0, 87.0, 78.0, 96.0, 62.0, 38.0, 36.0, 28.0, 23.0, 15.0, 12.0, 9.0, 5.0, 8.0, 4.0, 3.0, 5.0, 4.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.09393310546875, -0.09164285659790039, -0.08935260772705078, -0.08706235885620117, -0.08477210998535156, -0.08248186111450195, -0.08019161224365234, -0.07790136337280273, -0.07561111450195312, -0.07332086563110352, -0.0710306167602539, -0.0687403678894043, -0.06645011901855469, -0.06415987014770508, -0.06186962127685547, -0.05957937240600586, -0.05728912353515625, -0.05499887466430664, -0.05270862579345703, -0.05041837692260742, -0.04812812805175781, -0.0458378791809082, -0.043547630310058594, -0.041257381439208984, -0.038967132568359375, -0.036676883697509766, -0.034386634826660156, -0.03209638595581055, -0.029806137084960938, -0.027515888214111328, -0.02522563934326172, -0.02293539047241211, -0.0206451416015625, -0.01835489273071289, -0.01606464385986328, -0.013774394989013672, -0.011484146118164062, -0.009193897247314453, -0.006903648376464844, -0.004613399505615234, -0.002323150634765625, -3.2901763916015625e-05, 0.0022573471069335938, 0.004547595977783203, 0.0068378448486328125, 0.009128093719482422, 0.011418342590332031, 0.01370859146118164, 0.01599884033203125, 0.01828908920288086, 0.02057933807373047, 0.022869586944580078, 0.025159835815429688, 0.027450084686279297, 0.029740333557128906, 0.032030582427978516, 0.034320831298828125, 0.036611080169677734, 0.038901329040527344, 0.04119157791137695, 0.04348182678222656, 0.04577207565307617, 0.04806232452392578, 0.05035257339477539, 0.052642822265625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 24.0, 70.0, 164.0, 236.0, 257.0, 140.0, 78.0, 24.0, 14.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.212993860244751, -2.1625967025756836, -2.112199544906616, -2.061802387237549, -2.0114054679870605, -1.9610081911087036, -1.9106111526489258, -1.8602139949798584, -1.809816837310791, -1.7594196796417236, -1.7090225219726562, -1.6586254835128784, -1.608228325843811, -1.5578311681747437, -1.5074341297149658, -1.4570369720458984, -1.406639814376831, -1.3562426567077637, -1.3058454990386963, -1.2554484605789185, -1.205051302909851, -1.1546541452407837, -1.1042571067810059, -1.0538599491119385, -1.003462791442871, -0.9530656337738037, -0.9026685357093811, -0.8522714376449585, -0.8018742799758911, -0.7514771223068237, -0.7010800242424011, -0.6506829261779785, -0.6002857685089111, -0.5498886108398438, -0.49949151277542114, -0.44909438490867615, -0.39869725704193115, -0.34830012917518616, -0.29790300130844116, -0.24750587344169617, -0.19710874557495117, -0.14671161770820618, -0.09631448984146118, -0.045917361974716187, 0.004479765892028809, 0.054876893758773804, 0.1052740216255188, 0.1556711494922638, 0.2060682773590088, 0.2564654052257538, 0.3068625330924988, 0.3572596609592438, 0.40765678882598877, 0.45805391669273376, 0.5084510445594788, 0.5588481426239014, 0.6092453002929688, 0.6596424579620361, 0.7100395560264587, 0.7604366540908813, 0.8108338117599487, 0.8612309694290161, 0.9116280674934387, 0.9620251655578613, 1.0124223232269287]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 10.0, 7.0, 4.0, 6.0, 5.0, 16.0, 18.0, 15.0, 20.0, 22.0, 21.0, 28.0, 33.0, 33.0, 25.0, 33.0, 31.0, 37.0, 41.0, 43.0, 52.0, 30.0, 45.0, 35.0, 26.0, 59.0, 38.0, 36.0, 29.0, 28.0, 28.0, 22.0, 26.0, 16.0, 14.0, 12.0, 3.0, 10.0, 8.0, 9.0, 8.0, 5.0, 5.0, 5.0, 2.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4538199305534363, -0.4384426176548004, -0.42306530475616455, -0.4076879918575287, -0.3923106789588928, -0.37693336606025696, -0.3615560531616211, -0.3461787700653076, -0.33080142736434937, -0.3154241144657135, -0.30004680156707764, -0.2846694886684418, -0.2692921757698059, -0.25391486287117004, -0.23853756487369537, -0.2231602519750595, -0.20778295397758484, -0.19240564107894897, -0.1770283281803131, -0.16165101528167725, -0.14627370238304138, -0.13089638948440552, -0.11551909148693085, -0.10014177858829498, -0.08476446568965912, -0.06938715279102325, -0.05400984361767769, -0.03863253444433212, -0.02325522154569626, -0.007877908647060394, 0.007499396800994873, 0.022876709699630737, 0.0382540225982666, 0.053631335496902466, 0.06900864839553833, 0.0843859538435936, 0.09976326674222946, 0.11514057964086533, 0.1305178850889206, 0.14589519798755646, 0.16127251088619232, 0.17664982378482819, 0.19202713668346405, 0.20740443468093872, 0.22278174757957458, 0.23815906047821045, 0.2535363733768463, 0.2689136862754822, 0.28429099917411804, 0.2996683120727539, 0.31504562497138977, 0.33042293787002563, 0.3458002507686615, 0.36117756366729736, 0.37655484676361084, 0.3919321894645691, 0.40730947256088257, 0.42268678545951843, 0.4380640983581543, 0.45344141125679016, 0.468818724155426, 0.4841960370540619, 0.49957334995269775, 0.5149506330490112, 0.5303279757499695]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 5.0, 8.0, 7.0, 19.0, 14.0, 16.0, 21.0, 12.0, 45.0, 57.0, 94.0, 194.0, 470.0, 1501.0, 6073.0, 30653.0, 236511.0, 2377247.0, 1387223.0, 129671.0, 18854.0, 3955.0, 963.0, 299.0, 115.0, 68.0, 37.0, 28.0, 24.0, 13.0, 16.0, 10.0, 12.0, 9.0, 11.0, 6.0, 5.0, 2.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15185546875, -0.14762115478515625, -0.1433868408203125, -0.13915252685546875, -0.134918212890625, -0.13068389892578125, -0.1264495849609375, -0.12221527099609375, -0.11798095703125, -0.11374664306640625, -0.1095123291015625, -0.10527801513671875, -0.101043701171875, -0.09680938720703125, -0.0925750732421875, -0.08834075927734375, -0.0841064453125, -0.07987213134765625, -0.0756378173828125, -0.07140350341796875, -0.067169189453125, -0.06293487548828125, -0.0587005615234375, -0.05446624755859375, -0.05023193359375, -0.04599761962890625, -0.0417633056640625, -0.03752899169921875, -0.033294677734375, -0.02906036376953125, -0.0248260498046875, -0.02059173583984375, -0.016357421875, -0.01212310791015625, -0.0078887939453125, -0.00365447998046875, 0.000579833984375, 0.00481414794921875, 0.0090484619140625, 0.01328277587890625, 0.01751708984375, 0.02175140380859375, 0.0259857177734375, 0.03022003173828125, 0.034454345703125, 0.03868865966796875, 0.0429229736328125, 0.04715728759765625, 0.0513916015625, 0.05562591552734375, 0.0598602294921875, 0.06409454345703125, 0.068328857421875, 0.07256317138671875, 0.0767974853515625, 0.08103179931640625, 0.08526611328125, 0.08950042724609375, 0.0937347412109375, 0.09796905517578125, 0.102203369140625, 0.10643768310546875, 0.1106719970703125, 0.11490631103515625, 0.119140625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 6.0, 11.0, 7.0, 15.0, 20.0, 17.0, 22.0, 22.0, 32.0, 23.0, 41.0, 41.0, 36.0, 50.0, 39.0, 51.0, 48.0, 59.0, 51.0, 47.0, 49.0, 52.0, 32.0, 31.0, 33.0, 30.0, 24.0, 14.0, 22.0, 14.0, 10.0, 10.0, 12.0, 5.0, 8.0, 2.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0738525390625, -0.07185745239257812, -0.06986236572265625, -0.06786727905273438, -0.0658721923828125, -0.06387710571289062, -0.06188201904296875, -0.059886932373046875, -0.057891845703125, -0.055896759033203125, -0.05390167236328125, -0.051906585693359375, -0.0499114990234375, -0.047916412353515625, -0.04592132568359375, -0.043926239013671875, -0.04193115234375, -0.039936065673828125, -0.03794097900390625, -0.035945892333984375, -0.0339508056640625, -0.031955718994140625, -0.02996063232421875, -0.027965545654296875, -0.025970458984375, -0.023975372314453125, -0.02198028564453125, -0.019985198974609375, -0.0179901123046875, -0.015995025634765625, -0.01399993896484375, -0.012004852294921875, -0.010009765625, -0.008014678955078125, -0.00601959228515625, -0.004024505615234375, -0.0020294189453125, -3.4332275390625e-05, 0.00196075439453125, 0.003955841064453125, 0.005950927734375, 0.007946014404296875, 0.00994110107421875, 0.011936187744140625, 0.0139312744140625, 0.015926361083984375, 0.01792144775390625, 0.019916534423828125, 0.02191162109375, 0.023906707763671875, 0.02590179443359375, 0.027896881103515625, 0.0298919677734375, 0.031887054443359375, 0.03388214111328125, 0.035877227783203125, 0.037872314453125, 0.039867401123046875, 0.04186248779296875, 0.043857574462890625, 0.0458526611328125, 0.047847747802734375, 0.04984283447265625, 0.051837921142578125, 0.0538330078125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 2.0, 5.0, 9.0, 14.0, 15.0, 28.0, 31.0, 41.0, 57.0, 95.0, 148.0, 182.0, 279.0, 471.0, 739.0, 1223.0, 2089.0, 3600.0, 6743.0, 12850.0, 27433.0, 61963.0, 153332.0, 408658.0, 1065639.0, 1426638.0, 622854.0, 232129.0, 90358.0, 38495.0, 17831.0, 8840.0, 4692.0, 2692.0, 1561.0, 952.0, 542.0, 362.0, 225.0, 169.0, 97.0, 66.0, 46.0, 25.0, 27.0, 17.0, 7.0, 6.0, 2.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07183837890625, -0.06929206848144531, -0.06674575805664062, -0.06419944763183594, -0.06165313720703125, -0.05910682678222656, -0.056560516357421875, -0.05401420593261719, -0.0514678955078125, -0.04892158508300781, -0.046375274658203125, -0.04382896423339844, -0.04128265380859375, -0.03873634338378906, -0.036190032958984375, -0.03364372253417969, -0.031097412109375, -0.028551101684570312, -0.026004791259765625, -0.023458480834960938, -0.02091217041015625, -0.018365859985351562, -0.015819549560546875, -0.013273239135742188, -0.0107269287109375, -0.008180618286132812, -0.005634307861328125, -0.0030879974365234375, -0.00054168701171875, 0.0020046234130859375, 0.004550933837890625, 0.0070972442626953125, 0.0096435546875, 0.012189865112304688, 0.014736175537109375, 0.017282485961914062, 0.01982879638671875, 0.022375106811523438, 0.024921417236328125, 0.027467727661132812, 0.0300140380859375, 0.03256034851074219, 0.035106658935546875, 0.03765296936035156, 0.04019927978515625, 0.04274559020996094, 0.045291900634765625, 0.04783821105957031, 0.050384521484375, 0.05293083190917969, 0.055477142333984375, 0.05802345275878906, 0.06056976318359375, 0.06311607360839844, 0.06566238403320312, 0.06820869445800781, 0.0707550048828125, 0.07330131530761719, 0.07584762573242188, 0.07839393615722656, 0.08094024658203125, 0.08348655700683594, 0.08603286743164062, 0.08857917785644531, 0.09112548828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 8.0, 10.0, 9.0, 23.0, 30.0, 40.0, 48.0, 71.0, 101.0, 135.0, 174.0, 283.0, 343.0, 395.0, 501.0, 457.0, 365.0, 285.0, 207.0, 157.0, 115.0, 70.0, 58.0, 45.0, 25.0, 19.0, 27.0, 13.0, 11.0, 8.0, 5.0, 6.0, 4.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.10491943359375, -0.1018819808959961, -0.09884452819824219, -0.09580707550048828, -0.09276962280273438, -0.08973217010498047, -0.08669471740722656, -0.08365726470947266, -0.08061981201171875, -0.07758235931396484, -0.07454490661621094, -0.07150745391845703, -0.06847000122070312, -0.06543254852294922, -0.06239509582519531, -0.059357643127441406, -0.0563201904296875, -0.053282737731933594, -0.05024528503417969, -0.04720783233642578, -0.044170379638671875, -0.04113292694091797, -0.03809547424316406, -0.035058021545410156, -0.03202056884765625, -0.028983116149902344, -0.025945663452148438, -0.02290821075439453, -0.019870758056640625, -0.01683330535888672, -0.013795852661132812, -0.010758399963378906, -0.007720947265625, -0.004683494567871094, -0.0016460418701171875, 0.0013914108276367188, 0.004428863525390625, 0.007466316223144531, 0.010503768920898438, 0.013541221618652344, 0.01657867431640625, 0.019616127014160156, 0.022653579711914062, 0.02569103240966797, 0.028728485107421875, 0.03176593780517578, 0.03480339050292969, 0.037840843200683594, 0.0408782958984375, 0.043915748596191406, 0.04695320129394531, 0.04999065399169922, 0.053028106689453125, 0.05606555938720703, 0.05910301208496094, 0.062140464782714844, 0.06517791748046875, 0.06821537017822266, 0.07125282287597656, 0.07429027557373047, 0.07732772827148438, 0.08036518096923828, 0.08340263366699219, 0.0864400863647461, 0.0894775390625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 34.0, 72.0, 109.0, 169.0, 206.0, 177.0, 136.0, 56.0, 30.0, 14.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9070184230804443, -1.8703745603561401, -1.833730697631836, -1.7970868349075317, -1.7604429721832275, -1.7237989902496338, -1.6871551275253296, -1.6505112648010254, -1.6138674020767212, -1.577223539352417, -1.5405796766281128, -1.5039358139038086, -1.4672918319702148, -1.4306479692459106, -1.3940041065216064, -1.3573602437973022, -1.320716381072998, -1.2840725183486938, -1.2474286556243896, -1.2107847929000854, -1.1741409301757812, -1.1374969482421875, -1.1008530855178833, -1.064209222793579, -1.027565360069275, -0.9909214973449707, -0.9542776346206665, -0.9176337122917175, -0.8809898495674133, -0.8443459868431091, -0.8077020645141602, -0.771058201789856, -0.7344144582748413, -0.6977705955505371, -0.6611267328262329, -0.6244828104972839, -0.5878389477729797, -0.5511950850486755, -0.5145511627197266, -0.47790729999542236, -0.44126343727111816, -0.40461957454681396, -0.3679756820201874, -0.3313317894935608, -0.2946879267692566, -0.2580440640449524, -0.2214001715183258, -0.18475627899169922, -0.14811241626739502, -0.11146853864192963, -0.07482466101646423, -0.03818078339099884, -0.0015369057655334473, 0.035106971859931946, 0.07175084948539734, 0.10839474201202393, 0.14503860473632812, 0.18168248236179352, 0.2183263599872589, 0.2549702525138855, 0.2916141152381897, 0.3282579779624939, 0.3649018704891205, 0.40154576301574707, 0.43818962574005127]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 7.0, 12.0, 12.0, 8.0, 21.0, 20.0, 20.0, 25.0, 22.0, 33.0, 27.0, 39.0, 30.0, 27.0, 38.0, 37.0, 49.0, 37.0, 34.0, 41.0, 46.0, 39.0, 34.0, 30.0, 37.0, 38.0, 29.0, 24.0, 26.0, 30.0, 23.0, 14.0, 19.0, 12.0, 9.0, 7.0, 8.0, 2.0, 4.0, 1.0, 4.0, 3.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3649511933326721, -0.3531569838523865, -0.34136274456977844, -0.3295685350894928, -0.31777432560920715, -0.3059801161289215, -0.2941858768463135, -0.28239166736602783, -0.2705974578857422, -0.25880324840545654, -0.2470090240240097, -0.23521479964256287, -0.22342059016227722, -0.21162636578083038, -0.19983214139938354, -0.1880379319190979, -0.17624370753765106, -0.16444948315620422, -0.15265527367591858, -0.14086104929447174, -0.1290668398141861, -0.11727261543273926, -0.10547839850187302, -0.09368418157100677, -0.08188996464014053, -0.07009574770927429, -0.05830153077840805, -0.04650731012225151, -0.03471309319138527, -0.022918876260519028, -0.011124655604362488, 0.0006695613265037537, 0.012463778257369995, 0.024257995188236237, 0.03605221211910248, 0.04784643277525902, 0.05964064970612526, 0.0714348703622818, 0.08322908729314804, 0.09502330422401428, 0.10681752115488052, 0.11861173808574677, 0.1304059624671936, 0.14220017194747925, 0.1539943963289261, 0.16578860580921173, 0.17758283019065857, 0.1893770396709442, 0.20117126405239105, 0.2129654884338379, 0.22475969791412354, 0.23655392229557037, 0.24834813177585602, 0.26014235615730286, 0.2719365656375885, 0.28373080492019653, 0.2955250144004822, 0.3073192238807678, 0.31911346316337585, 0.3309076726436615, 0.34270188212394714, 0.3544960916042328, 0.3662903308868408, 0.37808454036712646, 0.3898787498474121]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 12.0, 11.0, 16.0, 28.0, 59.0, 103.0, 154.0, 260.0, 490.0, 820.0, 1455.0, 2737.0, 4912.0, 8833.0, 16194.0, 30881.0, 60834.0, 133556.0, 271922.0, 265855.0, 127079.0, 57798.0, 29497.0, 15732.0, 8552.0, 4829.0, 2523.0, 1452.0, 791.0, 512.0, 255.0, 159.0, 73.0, 56.0, 39.0, 16.0, 19.0, 10.0, 5.0, 10.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08514404296875, -0.08209991455078125, -0.0790557861328125, -0.07601165771484375, -0.072967529296875, -0.06992340087890625, -0.0668792724609375, -0.06383514404296875, -0.060791015625, -0.05774688720703125, -0.0547027587890625, -0.05165863037109375, -0.048614501953125, -0.04557037353515625, -0.0425262451171875, -0.03948211669921875, -0.03643798828125, -0.03339385986328125, -0.0303497314453125, -0.02730560302734375, -0.024261474609375, -0.02121734619140625, -0.0181732177734375, -0.01512908935546875, -0.0120849609375, -0.00904083251953125, -0.0059967041015625, -0.00295257568359375, 9.1552734375e-05, 0.00313568115234375, 0.0061798095703125, 0.00922393798828125, 0.01226806640625, 0.01531219482421875, 0.0183563232421875, 0.02140045166015625, 0.024444580078125, 0.02748870849609375, 0.0305328369140625, 0.03357696533203125, 0.03662109375, 0.03966522216796875, 0.0427093505859375, 0.04575347900390625, 0.048797607421875, 0.05184173583984375, 0.0548858642578125, 0.05792999267578125, 0.06097412109375, 0.06401824951171875, 0.0670623779296875, 0.07010650634765625, 0.073150634765625, 0.07619476318359375, 0.0792388916015625, 0.08228302001953125, 0.0853271484375, 0.08837127685546875, 0.0914154052734375, 0.09445953369140625, 0.097503662109375, 0.10054779052734375, 0.1035919189453125, 0.10663604736328125, 0.10968017578125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 5.0, 12.0, 12.0, 13.0, 10.0, 23.0, 15.0, 18.0, 21.0, 34.0, 34.0, 36.0, 31.0, 48.0, 43.0, 48.0, 36.0, 44.0, 56.0, 50.0, 59.0, 39.0, 43.0, 40.0, 22.0, 32.0, 25.0, 18.0, 28.0, 20.0, 20.0, 9.0, 11.0, 11.0, 8.0, 5.0, 10.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06683349609375, -0.06491661071777344, -0.06299972534179688, -0.06108283996582031, -0.05916595458984375, -0.05724906921386719, -0.055332183837890625, -0.05341529846191406, -0.0514984130859375, -0.04958152770996094, -0.047664642333984375, -0.04574775695800781, -0.04383087158203125, -0.04191398620605469, -0.039997100830078125, -0.03808021545410156, -0.036163330078125, -0.03424644470214844, -0.032329559326171875, -0.030412673950195312, -0.02849578857421875, -0.026578903198242188, -0.024662017822265625, -0.022745132446289062, -0.0208282470703125, -0.018911361694335938, -0.016994476318359375, -0.015077590942382812, -0.01316070556640625, -0.011243820190429688, -0.009326934814453125, -0.0074100494384765625, -0.0054931640625, -0.0035762786865234375, -0.001659393310546875, 0.0002574920654296875, 0.00217437744140625, 0.0040912628173828125, 0.006008148193359375, 0.007925033569335938, 0.0098419189453125, 0.011758804321289062, 0.013675689697265625, 0.015592575073242188, 0.01750946044921875, 0.019426345825195312, 0.021343231201171875, 0.023260116577148438, 0.025177001953125, 0.027093887329101562, 0.029010772705078125, 0.030927658081054688, 0.03284454345703125, 0.03476142883300781, 0.036678314208984375, 0.03859519958496094, 0.0405120849609375, 0.04242897033691406, 0.044345855712890625, 0.04626274108886719, 0.04817962646484375, 0.05009651184082031, 0.052013397216796875, 0.05393028259277344, 0.05584716796875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 11.0, 10.0, 20.0, 9.0, 26.0, 26.0, 43.0, 74.0, 183.0, 574.0, 2133.0, 8934.0, 45182.0, 335341.0, 563942.0, 73774.0, 13725.0, 3208.0, 824.0, 250.0, 101.0, 54.0, 35.0, 18.0, 13.0, 13.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.305419921875, -0.29620361328125, -0.2869873046875, -0.27777099609375, -0.2685546875, -0.25933837890625, -0.2501220703125, -0.24090576171875, -0.231689453125, -0.22247314453125, -0.2132568359375, -0.20404052734375, -0.19482421875, -0.18560791015625, -0.1763916015625, -0.16717529296875, -0.157958984375, -0.14874267578125, -0.1395263671875, -0.13031005859375, -0.12109375, -0.11187744140625, -0.1026611328125, -0.09344482421875, -0.084228515625, -0.07501220703125, -0.0657958984375, -0.05657958984375, -0.04736328125, -0.03814697265625, -0.0289306640625, -0.01971435546875, -0.010498046875, -0.00128173828125, 0.0079345703125, 0.01715087890625, 0.0263671875, 0.03558349609375, 0.0447998046875, 0.05401611328125, 0.063232421875, 0.07244873046875, 0.0816650390625, 0.09088134765625, 0.10009765625, 0.10931396484375, 0.1185302734375, 0.12774658203125, 0.136962890625, 0.14617919921875, 0.1553955078125, 0.16461181640625, 0.173828125, 0.18304443359375, 0.1922607421875, 0.20147705078125, 0.210693359375, 0.21990966796875, 0.2291259765625, 0.23834228515625, 0.24755859375, 0.25677490234375, 0.2659912109375, 0.27520751953125, 0.284423828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 4.0, 5.0, 9.0, 12.0, 13.0, 26.0, 29.0, 34.0, 41.0, 35.0, 43.0, 55.0, 63.0, 78.0, 80.0, 54.0, 57.0, 49.0, 66.0, 45.0, 44.0, 25.0, 29.0, 25.0, 16.0, 17.0, 13.0, 8.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26708984375, -0.2583503723144531, -0.24961090087890625, -0.24087142944335938, -0.2321319580078125, -0.22339248657226562, -0.21465301513671875, -0.20591354370117188, -0.197174072265625, -0.18843460083007812, -0.17969512939453125, -0.17095565795898438, -0.1622161865234375, -0.15347671508789062, -0.14473724365234375, -0.13599777221679688, -0.12725830078125, -0.11851882934570312, -0.10977935791015625, -0.10103988647460938, -0.0923004150390625, -0.08356094360351562, -0.07482147216796875, -0.06608200073242188, -0.057342529296875, -0.048603057861328125, -0.03986358642578125, -0.031124114990234375, -0.0223846435546875, -0.013645172119140625, -0.00490570068359375, 0.003833770751953125, 0.0125732421875, 0.021312713623046875, 0.03005218505859375, 0.038791656494140625, 0.0475311279296875, 0.056270599365234375, 0.06501007080078125, 0.07374954223632812, 0.082489013671875, 0.09122848510742188, 0.09996795654296875, 0.10870742797851562, 0.1174468994140625, 0.12618637084960938, 0.13492584228515625, 0.14366531372070312, 0.15240478515625, 0.16114425659179688, 0.16988372802734375, 0.17862319946289062, 0.1873626708984375, 0.19610214233398438, 0.20484161376953125, 0.21358108520507812, 0.222320556640625, 0.23106002807617188, 0.23979949951171875, 0.24853897094726562, 0.2572784423828125, 0.2660179138183594, 0.27475738525390625, 0.2834968566894531, 0.292236328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 12.0, 17.0, 29.0, 48.0, 87.0, 151.0, 219.0, 379.0, 684.0, 1154.0, 2107.0, 3573.0, 6036.0, 10947.0, 19457.0, 36297.0, 77707.0, 193257.0, 340746.0, 195378.0, 78738.0, 36539.0, 19666.0, 10826.0, 6150.0, 3496.0, 2056.0, 1169.0, 693.0, 398.0, 223.0, 131.0, 68.0, 50.0, 27.0, 23.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06494140625, -0.0629434585571289, -0.06094551086425781, -0.05894756317138672, -0.056949615478515625, -0.05495166778564453, -0.05295372009277344, -0.050955772399902344, -0.04895782470703125, -0.046959877014160156, -0.04496192932128906, -0.04296398162841797, -0.040966033935546875, -0.03896808624267578, -0.03697013854980469, -0.034972190856933594, -0.0329742431640625, -0.030976295471191406, -0.028978347778320312, -0.02698040008544922, -0.024982452392578125, -0.02298450469970703, -0.020986557006835938, -0.018988609313964844, -0.01699066162109375, -0.014992713928222656, -0.012994766235351562, -0.010996818542480469, -0.008998870849609375, -0.007000923156738281, -0.0050029754638671875, -0.0030050277709960938, -0.001007080078125, 0.0009908676147460938, 0.0029888153076171875, 0.004986763000488281, 0.006984710693359375, 0.008982658386230469, 0.010980606079101562, 0.012978553771972656, 0.01497650146484375, 0.016974449157714844, 0.018972396850585938, 0.02097034454345703, 0.022968292236328125, 0.02496623992919922, 0.026964187622070312, 0.028962135314941406, 0.0309600830078125, 0.032958030700683594, 0.03495597839355469, 0.03695392608642578, 0.038951873779296875, 0.04094982147216797, 0.04294776916503906, 0.044945716857910156, 0.04694366455078125, 0.048941612243652344, 0.05093955993652344, 0.05293750762939453, 0.054935455322265625, 0.05693340301513672, 0.05893135070800781, 0.060929298400878906, 0.06292724609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 5.0, 8.0, 6.0, 29.0, 33.0, 51.0, 79.0, 96.0, 133.0, 151.0, 122.0, 89.0, 63.0, 30.0, 25.0, 24.0, 13.0, 8.0, 5.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.314018249511719e-05, -3.225449472665787e-05, -3.136880695819855e-05, -3.0483119189739227e-05, -2.9597431421279907e-05, -2.8711743652820587e-05, -2.7826055884361267e-05, -2.6940368115901947e-05, -2.6054680347442627e-05, -2.5168992578983307e-05, -2.4283304810523987e-05, -2.3397617042064667e-05, -2.2511929273605347e-05, -2.1626241505146027e-05, -2.0740553736686707e-05, -1.9854865968227386e-05, -1.8969178199768066e-05, -1.8083490431308746e-05, -1.7197802662849426e-05, -1.6312114894390106e-05, -1.5426427125930786e-05, -1.4540739357471466e-05, -1.3655051589012146e-05, -1.2769363820552826e-05, -1.1883676052093506e-05, -1.0997988283634186e-05, -1.0112300515174866e-05, -9.226612746715546e-06, -8.340924978256226e-06, -7.4552372097969055e-06, -6.5695494413375854e-06, -5.683861672878265e-06, -4.798173904418945e-06, -3.912486135959625e-06, -3.026798367500305e-06, -2.141110599040985e-06, -1.255422830581665e-06, -3.6973506212234497e-07, 5.159527063369751e-07, 1.4016404747962952e-06, 2.2873282432556152e-06, 3.1730160117149353e-06, 4.058703780174255e-06, 4.9443915486335754e-06, 5.8300793170928955e-06, 6.7157670855522156e-06, 7.601454854011536e-06, 8.487142622470856e-06, 9.372830390930176e-06, 1.0258518159389496e-05, 1.1144205927848816e-05, 1.2029893696308136e-05, 1.2915581464767456e-05, 1.3801269233226776e-05, 1.4686957001686096e-05, 1.5572644770145416e-05, 1.6458332538604736e-05, 1.7344020307064056e-05, 1.8229708075523376e-05, 1.9115395843982697e-05, 2.0001083612442017e-05, 2.0886771380901337e-05, 2.1772459149360657e-05, 2.2658146917819977e-05, 2.3543834686279297e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 2.0, 12.0, 15.0, 19.0, 29.0, 40.0, 80.0, 108.0, 219.0, 383.0, 625.0, 1200.0, 2365.0, 4818.0, 9394.0, 19441.0, 40475.0, 95215.0, 267482.0, 359931.0, 140261.0, 55596.0, 25494.0, 12396.0, 6306.0, 3127.0, 1574.0, 816.0, 441.0, 250.0, 148.0, 109.0, 58.0, 31.0, 37.0, 14.0, 9.0, 13.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0738525390625, -0.07162761688232422, -0.06940269470214844, -0.06717777252197266, -0.06495285034179688, -0.0627279281616211, -0.06050300598144531, -0.05827808380126953, -0.05605316162109375, -0.05382823944091797, -0.05160331726074219, -0.049378395080566406, -0.047153472900390625, -0.044928550720214844, -0.04270362854003906, -0.04047870635986328, -0.0382537841796875, -0.03602886199951172, -0.03380393981933594, -0.031579017639160156, -0.029354095458984375, -0.027129173278808594, -0.024904251098632812, -0.02267932891845703, -0.02045440673828125, -0.01822948455810547, -0.016004562377929688, -0.013779640197753906, -0.011554718017578125, -0.009329795837402344, -0.0071048736572265625, -0.004879951477050781, -0.002655029296875, -0.00043010711669921875, 0.0017948150634765625, 0.004019737243652344, 0.006244659423828125, 0.008469581604003906, 0.010694503784179688, 0.012919425964355469, 0.01514434814453125, 0.01736927032470703, 0.019594192504882812, 0.021819114685058594, 0.024044036865234375, 0.026268959045410156, 0.028493881225585938, 0.03071880340576172, 0.0329437255859375, 0.03516864776611328, 0.03739356994628906, 0.039618492126464844, 0.041843414306640625, 0.044068336486816406, 0.04629325866699219, 0.04851818084716797, 0.05074310302734375, 0.05296802520751953, 0.05519294738769531, 0.057417869567871094, 0.059642791748046875, 0.061867713928222656, 0.06409263610839844, 0.06631755828857422, 0.06854248046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 5.0, 5.0, 4.0, 10.0, 10.0, 11.0, 15.0, 22.0, 25.0, 31.0, 37.0, 62.0, 76.0, 90.0, 107.0, 104.0, 86.0, 72.0, 47.0, 31.0, 18.0, 18.0, 24.0, 16.0, 4.0, 8.0, 10.0, 11.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0882568359375, -0.08557510375976562, -0.08289337158203125, -0.08021163940429688, -0.0775299072265625, -0.07484817504882812, -0.07216644287109375, -0.06948471069335938, -0.066802978515625, -0.06412124633789062, -0.06143951416015625, -0.058757781982421875, -0.0560760498046875, -0.053394317626953125, -0.05071258544921875, -0.048030853271484375, -0.04534912109375, -0.042667388916015625, -0.03998565673828125, -0.037303924560546875, -0.0346221923828125, -0.031940460205078125, -0.02925872802734375, -0.026576995849609375, -0.023895263671875, -0.021213531494140625, -0.01853179931640625, -0.015850067138671875, -0.0131683349609375, -0.010486602783203125, -0.00780487060546875, -0.005123138427734375, -0.00244140625, 0.000240325927734375, 0.00292205810546875, 0.005603790283203125, 0.0082855224609375, 0.010967254638671875, 0.01364898681640625, 0.016330718994140625, 0.019012451171875, 0.021694183349609375, 0.02437591552734375, 0.027057647705078125, 0.0297393798828125, 0.032421112060546875, 0.03510284423828125, 0.037784576416015625, 0.04046630859375, 0.043148040771484375, 0.04582977294921875, 0.048511505126953125, 0.0511932373046875, 0.053874969482421875, 0.05655670166015625, 0.059238433837890625, 0.061920166015625, 0.06460189819335938, 0.06728363037109375, 0.06996536254882812, 0.0726470947265625, 0.07532882690429688, 0.07801055908203125, 0.08069229125976562, 0.0833740234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 23.0, 49.0, 110.0, 209.0, 223.0, 170.0, 121.0, 58.0, 27.0, 14.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43019184470176697, -0.3789558410644531, -0.3277198076248169, -0.27648380398750305, -0.22524778544902802, -0.17401176691055298, -0.12277576327323914, -0.0715397298336029, -0.020303726196289062, 0.030932288616895676, 0.08216830343008041, 0.13340431451797485, 0.1846403330564499, 0.23587635159492493, 0.28711235523223877, 0.338348388671875, 0.38958439230918884, 0.4408203959465027, 0.4920564293861389, 0.5432924032211304, 0.5945284366607666, 0.6457644701004028, 0.6970005035400391, 0.7482365369796753, 0.7994725108146667, 0.850708544254303, 0.9019445180892944, 0.9531805515289307, 1.004416584968567, 1.0556526184082031, 1.1068885326385498, 1.1581246852874756, 1.2093607187271118, 1.260596752166748, 1.3118327856063843, 1.3630688190460205, 1.4143047332763672, 1.4655407667160034, 1.5167768001556396, 1.5680128335952759, 1.619248867034912, 1.6704849004745483, 1.7217209339141846, 1.7729568481445312, 1.8241928815841675, 1.8754289150238037, 1.92666494846344, 1.9779009819030762, 2.029136896133423, 2.0803728103637695, 2.1316089630126953, 2.182844877243042, 2.2340810298919678, 2.2853169441223145, 2.3365530967712402, 2.387789011001587, 2.4390251636505127, 2.4902610778808594, 2.541497230529785, 2.592733144760132, 2.6439692974090576, 2.6952052116394043, 2.74644136428833, 2.7976772785186768, 2.8489131927490234]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 4.0, 7.0, 5.0, 5.0, 14.0, 13.0, 14.0, 23.0, 16.0, 29.0, 20.0, 33.0, 22.0, 34.0, 28.0, 45.0, 32.0, 51.0, 32.0, 42.0, 53.0, 50.0, 37.0, 34.0, 49.0, 36.0, 38.0, 33.0, 30.0, 22.0, 23.0, 18.0, 21.0, 17.0, 9.0, 15.0, 9.0, 11.0, 6.0, 5.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.6256731152534485, -0.6062715649604797, -0.5868699550628662, -0.5674684047698975, -0.5480668544769287, -0.5286652445793152, -0.5092636942863464, -0.4898621141910553, -0.47046053409576416, -0.451058954000473, -0.4316573739051819, -0.41225582361221313, -0.392854243516922, -0.37345266342163086, -0.3540511131286621, -0.33464953303337097, -0.31524795293807983, -0.2958463728427887, -0.27644479274749756, -0.2570432424545288, -0.23764166235923767, -0.21824008226394653, -0.1988385170698166, -0.17943695187568665, -0.1600353717803955, -0.14063379168510437, -0.12123222649097443, -0.10183065384626389, -0.08242908120155334, -0.0630275085568428, -0.04362593591213226, -0.02422437071800232, -0.004822850227355957, 0.014578722417354584, 0.033980295062065125, 0.053381867706775665, 0.0727834403514862, 0.09218501299619675, 0.11158658564090729, 0.13098815083503723, 0.15038973093032837, 0.1697913110256195, 0.18919287621974945, 0.2085944414138794, 0.22799602150917053, 0.24739760160446167, 0.2667991518974304, 0.28620073199272156, 0.3056023120880127, 0.32500389218330383, 0.34440547227859497, 0.3638070225715637, 0.38320860266685486, 0.402610182762146, 0.42201173305511475, 0.4414133131504059, 0.460814893245697, 0.48021647334098816, 0.4996180534362793, 0.519019603729248, 0.5384211540222168, 0.5578227639198303, 0.5772243142127991, 0.5966259241104126, 0.6160274744033813]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 13.0, 13.0, 20.0, 26.0, 36.0, 42.0, 65.0, 124.0, 251.0, 512.0, 1313.0, 3981.0, 14900.0, 68599.0, 417983.0, 2667071.0, 861735.0, 124112.0, 24203.0, 6101.0, 1772.0, 654.0, 272.0, 149.0, 98.0, 50.0, 41.0, 31.0, 20.0, 14.0, 18.0, 11.0, 12.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13720703125, -0.1328754425048828, -0.12854385375976562, -0.12421226501464844, -0.11988067626953125, -0.11554908752441406, -0.11121749877929688, -0.10688591003417969, -0.1025543212890625, -0.09822273254394531, -0.09389114379882812, -0.08955955505371094, -0.08522796630859375, -0.08089637756347656, -0.07656478881835938, -0.07223320007324219, -0.067901611328125, -0.06357002258300781, -0.059238433837890625, -0.05490684509277344, -0.05057525634765625, -0.04624366760253906, -0.041912078857421875, -0.03758049011230469, -0.0332489013671875, -0.028917312622070312, -0.024585723876953125, -0.020254135131835938, -0.01592254638671875, -0.011590957641601562, -0.007259368896484375, -0.0029277801513671875, 0.00140380859375, 0.0057353973388671875, 0.010066986083984375, 0.014398574829101562, 0.01873016357421875, 0.023061752319335938, 0.027393341064453125, 0.03172492980957031, 0.0360565185546875, 0.04038810729980469, 0.044719696044921875, 0.04905128479003906, 0.05338287353515625, 0.05771446228027344, 0.062046051025390625, 0.06637763977050781, 0.070709228515625, 0.07504081726074219, 0.07937240600585938, 0.08370399475097656, 0.08803558349609375, 0.09236717224121094, 0.09669876098632812, 0.10103034973144531, 0.1053619384765625, 0.10969352722167969, 0.11402511596679688, 0.11835670471191406, 0.12268829345703125, 0.12701988220214844, 0.13135147094726562, 0.1356830596923828, 0.1400146484375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 4.0, 9.0, 4.0, 6.0, 10.0, 13.0, 19.0, 11.0, 18.0, 26.0, 29.0, 34.0, 35.0, 33.0, 42.0, 40.0, 42.0, 55.0, 41.0, 54.0, 50.0, 33.0, 33.0, 35.0, 44.0, 38.0, 26.0, 29.0, 29.0, 16.0, 19.0, 24.0, 21.0, 15.0, 19.0, 11.0, 8.0, 9.0, 5.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.072021484375, -0.06996345520019531, -0.06790542602539062, -0.06584739685058594, -0.06378936767578125, -0.06173133850097656, -0.059673309326171875, -0.05761528015136719, -0.0555572509765625, -0.05349922180175781, -0.051441192626953125, -0.04938316345214844, -0.04732513427734375, -0.04526710510253906, -0.043209075927734375, -0.04115104675292969, -0.039093017578125, -0.03703498840332031, -0.034976959228515625, -0.03291893005371094, -0.03086090087890625, -0.028802871704101562, -0.026744842529296875, -0.024686813354492188, -0.0226287841796875, -0.020570755004882812, -0.018512725830078125, -0.016454696655273438, -0.01439666748046875, -0.012338638305664062, -0.010280609130859375, -0.008222579956054688, -0.00616455078125, -0.0041065216064453125, -0.002048492431640625, 9.5367431640625e-06, 0.00206756591796875, 0.0041255950927734375, 0.006183624267578125, 0.008241653442382812, 0.0102996826171875, 0.012357711791992188, 0.014415740966796875, 0.016473770141601562, 0.01853179931640625, 0.020589828491210938, 0.022647857666015625, 0.024705886840820312, 0.026763916015625, 0.028821945190429688, 0.030879974365234375, 0.03293800354003906, 0.03499603271484375, 0.03705406188964844, 0.039112091064453125, 0.04117012023925781, 0.0432281494140625, 0.04528617858886719, 0.047344207763671875, 0.04940223693847656, 0.05146026611328125, 0.05351829528808594, 0.055576324462890625, 0.05763435363769531, 0.0596923828125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 14.0, 10.0, 16.0, 56.0, 74.0, 112.0, 158.0, 243.0, 441.0, 805.0, 1553.0, 3165.0, 7275.0, 18158.0, 52679.0, 169908.0, 630648.0, 2001854.0, 945683.0, 246759.0, 72625.0, 24524.0, 9308.0, 3947.0, 1887.0, 951.0, 579.0, 312.0, 173.0, 120.0, 74.0, 63.0, 41.0, 16.0, 14.0, 7.0, 8.0, 6.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1683349609375, -0.16361236572265625, -0.1588897705078125, -0.15416717529296875, -0.149444580078125, -0.14472198486328125, -0.1399993896484375, -0.13527679443359375, -0.13055419921875, -0.12583160400390625, -0.1211090087890625, -0.11638641357421875, -0.111663818359375, -0.10694122314453125, -0.1022186279296875, -0.09749603271484375, -0.0927734375, -0.08805084228515625, -0.0833282470703125, -0.07860565185546875, -0.073883056640625, -0.06916046142578125, -0.0644378662109375, -0.05971527099609375, -0.05499267578125, -0.05027008056640625, -0.0455474853515625, -0.04082489013671875, -0.036102294921875, -0.03137969970703125, -0.0266571044921875, -0.02193450927734375, -0.0172119140625, -0.01248931884765625, -0.0077667236328125, -0.00304412841796875, 0.001678466796875, 0.00640106201171875, 0.0111236572265625, 0.01584625244140625, 0.02056884765625, 0.02529144287109375, 0.0300140380859375, 0.03473663330078125, 0.039459228515625, 0.04418182373046875, 0.0489044189453125, 0.05362701416015625, 0.058349609375, 0.06307220458984375, 0.0677947998046875, 0.07251739501953125, 0.077239990234375, 0.08196258544921875, 0.0866851806640625, 0.09140777587890625, 0.09613037109375, 0.10085296630859375, 0.1055755615234375, 0.11029815673828125, 0.115020751953125, 0.11974334716796875, 0.1244659423828125, 0.12918853759765625, 0.1339111328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 9.0, 13.0, 26.0, 38.0, 62.0, 100.0, 150.0, 234.0, 403.0, 657.0, 784.0, 559.0, 360.0, 244.0, 141.0, 92.0, 70.0, 46.0, 30.0, 12.0, 11.0, 12.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1470947265625, -0.1418895721435547, -0.13668441772460938, -0.13147926330566406, -0.12627410888671875, -0.12106895446777344, -0.11586380004882812, -0.11065864562988281, -0.1054534912109375, -0.10024833679199219, -0.09504318237304688, -0.08983802795410156, -0.08463287353515625, -0.07942771911621094, -0.07422256469726562, -0.06901741027832031, -0.063812255859375, -0.05860710144042969, -0.053401947021484375, -0.04819679260253906, -0.04299163818359375, -0.03778648376464844, -0.032581329345703125, -0.027376174926757812, -0.0221710205078125, -0.016965866088867188, -0.011760711669921875, -0.0065555572509765625, -0.00135040283203125, 0.0038547515869140625, 0.009059906005859375, 0.014265060424804688, 0.01947021484375, 0.024675369262695312, 0.029880523681640625, 0.03508567810058594, 0.04029083251953125, 0.04549598693847656, 0.050701141357421875, 0.05590629577636719, 0.0611114501953125, 0.06631660461425781, 0.07152175903320312, 0.07672691345214844, 0.08193206787109375, 0.08713722229003906, 0.09234237670898438, 0.09754753112792969, 0.102752685546875, 0.10795783996582031, 0.11316299438476562, 0.11836814880371094, 0.12357330322265625, 0.12877845764160156, 0.13398361206054688, 0.1391887664794922, 0.1443939208984375, 0.1495990753173828, 0.15480422973632812, 0.16000938415527344, 0.16521453857421875, 0.17041969299316406, 0.17562484741210938, 0.1808300018310547, 0.18603515625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 12.0, 23.0, 58.0, 96.0, 147.0, 171.0, 182.0, 143.0, 109.0, 33.0, 19.0, 13.0, 8.0, 5.0], "bins": [-2.1622724533081055, -2.123638391494751, -2.0850040912628174, -2.046370029449463, -2.0077357292175293, -1.9691016674041748, -1.9304674863815308, -1.8918333053588867, -1.8531992435455322, -1.8145650625228882, -1.7759308815002441, -1.7372968196868896, -1.6986626386642456, -1.6600284576416016, -1.6213942766189575, -1.5827600955963135, -1.5441259145736694, -1.5054917335510254, -1.4668575525283813, -1.4282234907150269, -1.3895893096923828, -1.3509551286697388, -1.3123209476470947, -1.2736867666244507, -1.2350525856018066, -1.1964184045791626, -1.1577842235565186, -1.119150161743164, -1.08051598072052, -1.041881799697876, -1.003247618675232, -0.9646134376525879, -0.925979495048523, -0.8873453140258789, -0.8487111926078796, -0.8100770115852356, -0.7714428901672363, -0.7328087091445923, -0.6941745281219482, -0.6555403470993042, -0.6169062256813049, -0.5782720446586609, -0.5396379232406616, -0.5010037422180176, -0.4623695909976959, -0.42373543977737427, -0.3851012587547302, -0.34646710753440857, -0.3078329563140869, -0.26919880509376526, -0.2305646389722824, -0.19193047285079956, -0.1532963216304779, -0.11466217041015625, -0.0760280042886734, -0.03739383816719055, 0.0012403130531311035, 0.039874471724033356, 0.07850863039493561, 0.11714278906583786, 0.1557769477367401, 0.19441109895706177, 0.23304526507854462, 0.27167943120002747, 0.3103135824203491]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 11.0, 7.0, 6.0, 13.0, 19.0, 20.0, 17.0, 19.0, 23.0, 15.0, 25.0, 24.0, 35.0, 34.0, 31.0, 31.0, 38.0, 50.0, 39.0, 40.0, 41.0, 49.0, 45.0, 43.0, 51.0, 33.0, 35.0, 24.0, 28.0, 24.0, 20.0, 18.0, 18.0, 15.0, 7.0, 5.0, 13.0, 10.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.40882408618927, -0.3959386348724365, -0.3830532133579254, -0.3701677620410919, -0.3572823405265808, -0.3443968892097473, -0.3315114378929138, -0.3186259865760803, -0.3057405650615692, -0.2928551137447357, -0.2799696922302246, -0.2670842409133911, -0.2541987895965576, -0.2413133680820465, -0.228427916765213, -0.2155424803495407, -0.2026570439338684, -0.1897716075181961, -0.1768861711025238, -0.1640007197856903, -0.151115283370018, -0.1382298469543457, -0.1253443956375122, -0.1124589592218399, -0.0995735228061676, -0.0866880863904953, -0.0738026425242424, -0.0609172023832798, -0.0480317622423172, -0.0351463258266449, -0.022260881960392, -0.009375438094139099, 0.003509998321533203, 0.016395438462495804, 0.029280878603458405, 0.042166318744421005, 0.055051758885383606, 0.06793719530105591, 0.08082263916730881, 0.0937080830335617, 0.10659351944923401, 0.11947895586490631, 0.1323643922805786, 0.1452498435974121, 0.1581352800130844, 0.1710207164287567, 0.1839061677455902, 0.1967916041612625, 0.20967704057693481, 0.22256247699260712, 0.23544791340827942, 0.24833336472511292, 0.261218786239624, 0.2741042375564575, 0.286989688873291, 0.2998751401901245, 0.3127605617046356, 0.3256460130214691, 0.3385314345359802, 0.3514168858528137, 0.3643023371696472, 0.3771877586841583, 0.3900732100009918, 0.40295863151550293, 0.4158440828323364]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 2.0, 6.0, 8.0, 17.0, 20.0, 55.0, 71.0, 146.0, 247.0, 411.0, 670.0, 1158.0, 2033.0, 3472.0, 5812.0, 10014.0, 16788.0, 29198.0, 55488.0, 128670.0, 307203.0, 269891.0, 106487.0, 48064.0, 26007.0, 14965.0, 8961.0, 5308.0, 2998.0, 1870.0, 1042.0, 610.0, 366.0, 194.0, 114.0, 79.0, 46.0, 27.0, 14.0, 5.0, 8.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.09983634948730469, -0.09670639038085938, -0.09357643127441406, -0.09044647216796875, -0.08731651306152344, -0.08418655395507812, -0.08105659484863281, -0.0779266357421875, -0.07479667663574219, -0.07166671752929688, -0.06853675842285156, -0.06540679931640625, -0.06227684020996094, -0.059146881103515625, -0.05601692199707031, -0.052886962890625, -0.04975700378417969, -0.046627044677734375, -0.04349708557128906, -0.04036712646484375, -0.03723716735839844, -0.034107208251953125, -0.030977249145507812, -0.0278472900390625, -0.024717330932617188, -0.021587371826171875, -0.018457412719726562, -0.01532745361328125, -0.012197494506835938, -0.009067535400390625, -0.0059375762939453125, -0.0028076171875, 0.0003223419189453125, 0.003452301025390625, 0.0065822601318359375, 0.00971221923828125, 0.012842178344726562, 0.015972137451171875, 0.019102096557617188, 0.0222320556640625, 0.025362014770507812, 0.028491973876953125, 0.03162193298339844, 0.03475189208984375, 0.03788185119628906, 0.041011810302734375, 0.04414176940917969, 0.047271728515625, 0.05040168762207031, 0.053531646728515625, 0.05666160583496094, 0.05979156494140625, 0.06292152404785156, 0.06605148315429688, 0.06918144226074219, 0.0723114013671875, 0.07544136047363281, 0.07857131958007812, 0.08170127868652344, 0.08483123779296875, 0.08796119689941406, 0.09109115600585938, 0.09422111511230469, 0.09735107421875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 6.0, 8.0, 14.0, 12.0, 14.0, 13.0, 23.0, 18.0, 23.0, 24.0, 25.0, 24.0, 34.0, 34.0, 43.0, 41.0, 38.0, 48.0, 37.0, 56.0, 44.0, 34.0, 34.0, 48.0, 27.0, 32.0, 35.0, 27.0, 19.0, 33.0, 19.0, 11.0, 18.0, 20.0, 11.0, 15.0, 7.0, 3.0, 11.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.06365966796875, -0.06169939041137695, -0.059739112854003906, -0.05777883529663086, -0.05581855773925781, -0.053858280181884766, -0.05189800262451172, -0.04993772506713867, -0.047977447509765625, -0.04601716995239258, -0.04405689239501953, -0.042096614837646484, -0.04013633728027344, -0.03817605972290039, -0.036215782165527344, -0.0342555046081543, -0.03229522705078125, -0.030334949493408203, -0.028374671936035156, -0.02641439437866211, -0.024454116821289062, -0.022493839263916016, -0.02053356170654297, -0.018573284149169922, -0.016613006591796875, -0.014652729034423828, -0.012692451477050781, -0.010732173919677734, -0.008771896362304688, -0.006811618804931641, -0.004851341247558594, -0.002891063690185547, -0.0009307861328125, 0.0010294914245605469, 0.0029897689819335938, 0.004950046539306641, 0.0069103240966796875, 0.008870601654052734, 0.010830879211425781, 0.012791156768798828, 0.014751434326171875, 0.016711711883544922, 0.01867198944091797, 0.020632266998291016, 0.022592544555664062, 0.02455282211303711, 0.026513099670410156, 0.028473377227783203, 0.03043365478515625, 0.0323939323425293, 0.034354209899902344, 0.03631448745727539, 0.03827476501464844, 0.040235042572021484, 0.04219532012939453, 0.04415559768676758, 0.046115875244140625, 0.04807615280151367, 0.05003643035888672, 0.051996707916259766, 0.05395698547363281, 0.05591726303100586, 0.057877540588378906, 0.05983781814575195, 0.061798095703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 3.0, 5.0, 9.0, 14.0, 16.0, 21.0, 24.0, 38.0, 47.0, 87.0, 167.0, 321.0, 730.0, 1716.0, 4052.0, 8771.0, 20307.0, 51518.0, 209932.0, 560299.0, 123580.0, 38186.0, 15913.0, 6961.0, 3136.0, 1357.0, 601.0, 322.0, 140.0, 91.0, 43.0, 27.0, 20.0, 22.0, 11.0, 7.0, 6.0, 13.0, 6.0, 4.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0], "bins": [-0.2093505859375, -0.2028789520263672, -0.19640731811523438, -0.18993568420410156, -0.18346405029296875, -0.17699241638183594, -0.17052078247070312, -0.1640491485595703, -0.1575775146484375, -0.1511058807373047, -0.14463424682617188, -0.13816261291503906, -0.13169097900390625, -0.12521934509277344, -0.11874771118164062, -0.11227607727050781, -0.105804443359375, -0.09933280944824219, -0.09286117553710938, -0.08638954162597656, -0.07991790771484375, -0.07344627380371094, -0.06697463989257812, -0.06050300598144531, -0.0540313720703125, -0.04755973815917969, -0.041088104248046875, -0.03461647033691406, -0.02814483642578125, -0.021673202514648438, -0.015201568603515625, -0.008729934692382812, -0.00225830078125, 0.0042133331298828125, 0.010684967041015625, 0.017156600952148438, 0.02362823486328125, 0.030099868774414062, 0.036571502685546875, 0.04304313659667969, 0.0495147705078125, 0.05598640441894531, 0.062458038330078125, 0.06892967224121094, 0.07540130615234375, 0.08187294006347656, 0.08834457397460938, 0.09481620788574219, 0.101287841796875, 0.10775947570800781, 0.11423110961914062, 0.12070274353027344, 0.12717437744140625, 0.13364601135253906, 0.14011764526367188, 0.1465892791748047, 0.1530609130859375, 0.1595325469970703, 0.16600418090820312, 0.17247581481933594, 0.17894744873046875, 0.18541908264160156, 0.19189071655273438, 0.1983623504638672, 0.204833984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 3.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 9.0, 15.0, 13.0, 17.0, 15.0, 24.0, 23.0, 23.0, 38.0, 45.0, 45.0, 49.0, 49.0, 61.0, 56.0, 61.0, 49.0, 48.0, 40.0, 45.0, 45.0, 46.0, 18.0, 23.0, 27.0, 20.0, 8.0, 17.0, 4.0, 5.0, 12.0, 2.0, 1.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.254150390625, -0.2465534210205078, -0.23895645141601562, -0.23135948181152344, -0.22376251220703125, -0.21616554260253906, -0.20856857299804688, -0.2009716033935547, -0.1933746337890625, -0.1857776641845703, -0.17818069458007812, -0.17058372497558594, -0.16298675537109375, -0.15538978576660156, -0.14779281616210938, -0.1401958465576172, -0.132598876953125, -0.1250019073486328, -0.11740493774414062, -0.10980796813964844, -0.10221099853515625, -0.09461402893066406, -0.08701705932617188, -0.07942008972167969, -0.0718231201171875, -0.06422615051269531, -0.056629180908203125, -0.04903221130371094, -0.04143524169921875, -0.03383827209472656, -0.026241302490234375, -0.018644332885742188, -0.01104736328125, -0.0034503936767578125, 0.004146575927734375, 0.011743545532226562, 0.01934051513671875, 0.026937484741210938, 0.034534454345703125, 0.04213142395019531, 0.0497283935546875, 0.05732536315917969, 0.06492233276367188, 0.07251930236816406, 0.08011627197265625, 0.08771324157714844, 0.09531021118164062, 0.10290718078613281, 0.110504150390625, 0.11810111999511719, 0.12569808959960938, 0.13329505920410156, 0.14089202880859375, 0.14848899841308594, 0.15608596801757812, 0.1636829376220703, 0.1712799072265625, 0.1788768768310547, 0.18647384643554688, 0.19407081604003906, 0.20166778564453125, 0.20926475524902344, 0.21686172485351562, 0.2244586944580078, 0.2320556640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 9.0, 11.0, 19.0, 28.0, 32.0, 62.0, 96.0, 122.0, 205.0, 328.0, 475.0, 723.0, 1143.0, 1762.0, 2791.0, 4424.0, 7087.0, 11223.0, 17460.0, 30339.0, 61708.0, 181607.0, 399651.0, 185038.0, 62883.0, 30635.0, 17898.0, 11147.0, 7120.0, 4569.0, 2909.0, 1790.0, 1105.0, 765.0, 462.0, 295.0, 226.0, 138.0, 81.0, 63.0, 36.0, 21.0, 23.0, 12.0, 6.0, 10.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.06256103515625, -0.06057548522949219, -0.058589935302734375, -0.05660438537597656, -0.05461883544921875, -0.05263328552246094, -0.050647735595703125, -0.04866218566894531, -0.0466766357421875, -0.04469108581542969, -0.042705535888671875, -0.04071998596191406, -0.03873443603515625, -0.03674888610839844, -0.034763336181640625, -0.03277778625488281, -0.030792236328125, -0.028806686401367188, -0.026821136474609375, -0.024835586547851562, -0.02285003662109375, -0.020864486694335938, -0.018878936767578125, -0.016893386840820312, -0.0149078369140625, -0.012922286987304688, -0.010936737060546875, -0.008951187133789062, -0.00696563720703125, -0.0049800872802734375, -0.002994537353515625, -0.0010089874267578125, 0.0009765625, 0.0029621124267578125, 0.004947662353515625, 0.0069332122802734375, 0.00891876220703125, 0.010904312133789062, 0.012889862060546875, 0.014875411987304688, 0.0168609619140625, 0.018846511840820312, 0.020832061767578125, 0.022817611694335938, 0.02480316162109375, 0.026788711547851562, 0.028774261474609375, 0.030759811401367188, 0.032745361328125, 0.03473091125488281, 0.036716461181640625, 0.03870201110839844, 0.04068756103515625, 0.04267311096191406, 0.044658660888671875, 0.04664421081542969, 0.0486297607421875, 0.05061531066894531, 0.052600860595703125, 0.05458641052246094, 0.05657196044921875, 0.05855751037597656, 0.060543060302734375, 0.06252861022949219, 0.06451416015625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 3.0, 10.0, 3.0, 16.0, 20.0, 23.0, 37.0, 50.0, 68.0, 106.0, 123.0, 124.0, 109.0, 72.0, 64.0, 41.0, 19.0, 23.0, 10.0, 7.0, 12.0, 8.0, 8.0, 3.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5987625122070312e-05, -2.5270506739616394e-05, -2.4553388357162476e-05, -2.3836269974708557e-05, -2.311915159225464e-05, -2.240203320980072e-05, -2.1684914827346802e-05, -2.0967796444892883e-05, -2.0250678062438965e-05, -1.9533559679985046e-05, -1.8816441297531128e-05, -1.809932291507721e-05, -1.738220453262329e-05, -1.6665086150169373e-05, -1.5947967767715454e-05, -1.5230849385261536e-05, -1.4513731002807617e-05, -1.3796612620353699e-05, -1.307949423789978e-05, -1.2362375855445862e-05, -1.1645257472991943e-05, -1.0928139090538025e-05, -1.0211020708084106e-05, -9.493902325630188e-06, -8.77678394317627e-06, -8.059665560722351e-06, -7.342547178268433e-06, -6.625428795814514e-06, -5.908310413360596e-06, -5.191192030906677e-06, -4.474073648452759e-06, -3.7569552659988403e-06, -3.039836883544922e-06, -2.3227185010910034e-06, -1.605600118637085e-06, -8.884817361831665e-07, -1.7136335372924805e-07, 5.457550287246704e-07, 1.2628734111785889e-06, 1.9799917936325073e-06, 2.6971101760864258e-06, 3.4142285585403442e-06, 4.131346940994263e-06, 4.848465323448181e-06, 5.5655837059021e-06, 6.282702088356018e-06, 6.9998204708099365e-06, 7.716938853263855e-06, 8.434057235717773e-06, 9.151175618171692e-06, 9.86829400062561e-06, 1.0585412383079529e-05, 1.1302530765533447e-05, 1.2019649147987366e-05, 1.2736767530441284e-05, 1.3453885912895203e-05, 1.4171004295349121e-05, 1.488812267780304e-05, 1.5605241060256958e-05, 1.6322359442710876e-05, 1.7039477825164795e-05, 1.7756596207618713e-05, 1.8473714590072632e-05, 1.919083297252655e-05, 1.990795135498047e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 8.0, 11.0, 9.0, 17.0, 22.0, 32.0, 63.0, 79.0, 148.0, 255.0, 537.0, 1179.0, 2540.0, 5842.0, 13567.0, 33374.0, 100064.0, 535175.0, 261089.0, 56229.0, 21669.0, 9269.0, 3923.0, 1785.0, 838.0, 394.0, 176.0, 108.0, 72.0, 31.0, 21.0, 11.0, 12.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1318359375, -0.12852096557617188, -0.12520599365234375, -0.12189102172851562, -0.1185760498046875, -0.11526107788085938, -0.11194610595703125, -0.10863113403320312, -0.105316162109375, -0.10200119018554688, -0.09868621826171875, -0.09537124633789062, -0.0920562744140625, -0.08874130249023438, -0.08542633056640625, -0.08211135864257812, -0.07879638671875, -0.07548141479492188, -0.07216644287109375, -0.06885147094726562, -0.0655364990234375, -0.062221527099609375, -0.05890655517578125, -0.055591583251953125, -0.052276611328125, -0.048961639404296875, -0.04564666748046875, -0.042331695556640625, -0.0390167236328125, -0.035701751708984375, -0.03238677978515625, -0.029071807861328125, -0.0257568359375, -0.022441864013671875, -0.01912689208984375, -0.015811920166015625, -0.0124969482421875, -0.009181976318359375, -0.00586700439453125, -0.002552032470703125, 0.000762939453125, 0.004077911376953125, 0.00739288330078125, 0.010707855224609375, 0.0140228271484375, 0.017337799072265625, 0.02065277099609375, 0.023967742919921875, 0.02728271484375, 0.030597686767578125, 0.03391265869140625, 0.037227630615234375, 0.0405426025390625, 0.043857574462890625, 0.04717254638671875, 0.050487518310546875, 0.053802490234375, 0.057117462158203125, 0.06043243408203125, 0.06374740600585938, 0.0670623779296875, 0.07037734985351562, 0.07369232177734375, 0.07700729370117188, 0.080322265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 4.0, 7.0, 6.0, 9.0, 11.0, 15.0, 11.0, 31.0, 43.0, 51.0, 87.0, 121.0, 156.0, 120.0, 87.0, 54.0, 42.0, 30.0, 19.0, 15.0, 12.0, 13.0, 8.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.094482421875, -0.09138202667236328, -0.08828163146972656, -0.08518123626708984, -0.08208084106445312, -0.0789804458618164, -0.07588005065917969, -0.07277965545654297, -0.06967926025390625, -0.06657886505126953, -0.06347846984863281, -0.060378074645996094, -0.057277679443359375, -0.054177284240722656, -0.05107688903808594, -0.04797649383544922, -0.0448760986328125, -0.04177570343017578, -0.03867530822753906, -0.035574913024902344, -0.032474517822265625, -0.029374122619628906, -0.026273727416992188, -0.02317333221435547, -0.02007293701171875, -0.01697254180908203, -0.013872146606445312, -0.010771751403808594, -0.007671356201171875, -0.004570960998535156, -0.0014705657958984375, 0.0016298294067382812, 0.004730224609375, 0.007830619812011719, 0.010931015014648438, 0.014031410217285156, 0.017131805419921875, 0.020232200622558594, 0.023332595825195312, 0.02643299102783203, 0.02953338623046875, 0.03263378143310547, 0.03573417663574219, 0.038834571838378906, 0.041934967041015625, 0.045035362243652344, 0.04813575744628906, 0.05123615264892578, 0.0543365478515625, 0.05743694305419922, 0.06053733825683594, 0.06363773345947266, 0.06673812866210938, 0.0698385238647461, 0.07293891906738281, 0.07603931427001953, 0.07913970947265625, 0.08224010467529297, 0.08534049987792969, 0.0884408950805664, 0.09154129028320312, 0.09464168548583984, 0.09774208068847656, 0.10084247589111328, 0.10394287109375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 8.0, 3.0, 8.0, 13.0, 18.0, 23.0, 22.0, 27.0, 32.0, 55.0, 41.0, 64.0, 58.0, 61.0, 79.0, 69.0, 91.0, 50.0, 52.0, 56.0, 35.0, 31.0, 27.0, 28.0, 16.0, 15.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.512471079826355, -0.4946480989456177, -0.476825088262558, -0.4590021073818207, -0.441179096698761, -0.4233561158180237, -0.4055331349372864, -0.3877101540565491, -0.3698871433734894, -0.3520641624927521, -0.3342411518096924, -0.3164181709289551, -0.2985951900482178, -0.2807721793651581, -0.2629491984844208, -0.24512620270252228, -0.22730320692062378, -0.20948021113872528, -0.19165721535682678, -0.17383423447608948, -0.15601123869419098, -0.13818824291229248, -0.12036525458097458, -0.10254226624965668, -0.08471927046775818, -0.06689627468585968, -0.04907328635454178, -0.03125029429793358, -0.013427302241325378, 0.00439569354057312, 0.02221868187189102, 0.04004167020320892, 0.05786466598510742, 0.07568766176700592, 0.09351065009832382, 0.11133363842964172, 0.12915663421154022, 0.14697962999343872, 0.16480261087417603, 0.18262560665607452, 0.20044860243797302, 0.21827159821987152, 0.23609459400177002, 0.2539175748825073, 0.27174055576324463, 0.2895635664463043, 0.3073865473270416, 0.3252095580101013, 0.3430325388908386, 0.3608555197715759, 0.3786785304546356, 0.3965015113353729, 0.4143245220184326, 0.4321475028991699, 0.4499704837799072, 0.46779346466064453, 0.4856164753437042, 0.5034394860267639, 0.5212624669075012, 0.5390854477882385, 0.5569084286689758, 0.5747314691543579, 0.5925544500350952, 0.6103774309158325, 0.6282004117965698]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 2.0, 4.0, 5.0, 5.0, 4.0, 10.0, 13.0, 9.0, 15.0, 15.0, 19.0, 12.0, 18.0, 30.0, 28.0, 25.0, 26.0, 27.0, 40.0, 33.0, 42.0, 51.0, 39.0, 36.0, 47.0, 43.0, 45.0, 38.0, 43.0, 42.0, 29.0, 24.0, 35.0, 25.0, 25.0, 19.0, 15.0, 10.0, 14.0, 5.0, 7.0, 4.0, 5.0, 3.0, 4.0, 8.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.6516975164413452, -0.6314100027084351, -0.6111224889755249, -0.5908349752426147, -0.5705474615097046, -0.5502600073814392, -0.529972493648529, -0.5096849799156189, -0.48939746618270874, -0.4691099524497986, -0.4488224387168884, -0.42853495478630066, -0.4082474410533905, -0.38795992732048035, -0.3676724433898926, -0.3473849296569824, -0.32709741592407227, -0.3068099021911621, -0.28652238845825195, -0.2662349045276642, -0.24594739079475403, -0.22565987706184387, -0.2053723782300949, -0.18508487939834595, -0.1647973656654358, -0.14450985193252563, -0.12422235310077667, -0.10393484681844711, -0.08364734053611755, -0.063359834253788, -0.043072327971458435, -0.022784829139709473, -0.002497255802154541, 0.01779025048017502, 0.03807775676250458, 0.05836526304483414, 0.0786527693271637, 0.09894027560949326, 0.11922778189182281, 0.13951528072357178, 0.15980279445648193, 0.1800903081893921, 0.20037780702114105, 0.22066530585289001, 0.24095281958580017, 0.2612403333187103, 0.2815278172492981, 0.30181533098220825, 0.3221028447151184, 0.34239035844802856, 0.3626778721809387, 0.3829653561115265, 0.40325286984443665, 0.4235403835773468, 0.44382786750793457, 0.4641153812408447, 0.4844028949737549, 0.504690408706665, 0.5249779224395752, 0.5452654361724854, 0.5655529499053955, 0.5858404040336609, 0.606127917766571, 0.6264154314994812, 0.6467029452323914]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 2.0, 8.0, 4.0, 8.0, 3.0, 11.0, 9.0, 11.0, 22.0, 20.0, 22.0, 46.0, 45.0, 56.0, 84.0, 133.0, 196.0, 404.0, 676.0, 1435.0, 2969.0, 6905.0, 16761.0, 44649.0, 130637.0, 442676.0, 2228677.0, 960116.0, 234601.0, 75875.0, 27468.0, 10708.0, 4550.0, 2038.0, 1019.0, 538.0, 323.0, 179.0, 110.0, 61.0, 58.0, 42.0, 26.0, 25.0, 17.0, 11.0, 13.0, 9.0, 2.0, 7.0, 5.0, 3.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.1126708984375, -0.10923099517822266, -0.10579109191894531, -0.10235118865966797, -0.09891128540039062, -0.09547138214111328, -0.09203147888183594, -0.0885915756225586, -0.08515167236328125, -0.0817117691040039, -0.07827186584472656, -0.07483196258544922, -0.07139205932617188, -0.06795215606689453, -0.06451225280761719, -0.061072349548339844, -0.0576324462890625, -0.054192543029785156, -0.05075263977050781, -0.04731273651123047, -0.043872833251953125, -0.04043292999267578, -0.03699302673339844, -0.033553123474121094, -0.03011322021484375, -0.026673316955566406, -0.023233413696289062, -0.01979351043701172, -0.016353607177734375, -0.012913703918457031, -0.009473800659179688, -0.006033897399902344, -0.002593994140625, 0.0008459091186523438, 0.0042858123779296875, 0.007725715637207031, 0.011165618896484375, 0.014605522155761719, 0.018045425415039062, 0.021485328674316406, 0.02492523193359375, 0.028365135192871094, 0.03180503845214844, 0.03524494171142578, 0.038684844970703125, 0.04212474822998047, 0.04556465148925781, 0.049004554748535156, 0.0524444580078125, 0.055884361267089844, 0.05932426452636719, 0.06276416778564453, 0.06620407104492188, 0.06964397430419922, 0.07308387756347656, 0.0765237808227539, 0.07996368408203125, 0.0834035873413086, 0.08684349060058594, 0.09028339385986328, 0.09372329711914062, 0.09716320037841797, 0.10060310363769531, 0.10404300689697266, 0.10748291015625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 4.0, 1.0, 11.0, 9.0, 7.0, 11.0, 15.0, 22.0, 19.0, 11.0, 13.0, 20.0, 31.0, 26.0, 31.0, 29.0, 45.0, 34.0, 47.0, 48.0, 44.0, 39.0, 49.0, 38.0, 39.0, 29.0, 29.0, 38.0, 40.0, 31.0, 28.0, 28.0, 17.0, 14.0, 8.0, 11.0, 17.0, 4.0, 16.0, 10.0, 7.0, 8.0, 2.0, 8.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.06451416015625, -0.06240272521972656, -0.060291290283203125, -0.05817985534667969, -0.05606842041015625, -0.05395698547363281, -0.051845550537109375, -0.04973411560058594, -0.0476226806640625, -0.04551124572753906, -0.043399810791015625, -0.04128837585449219, -0.03917694091796875, -0.03706550598144531, -0.034954071044921875, -0.03284263610839844, -0.030731201171875, -0.028619766235351562, -0.026508331298828125, -0.024396896362304688, -0.02228546142578125, -0.020174026489257812, -0.018062591552734375, -0.015951156616210938, -0.0138397216796875, -0.011728286743164062, -0.009616851806640625, -0.0075054168701171875, -0.00539398193359375, -0.0032825469970703125, -0.001171112060546875, 0.0009403228759765625, 0.0030517578125, 0.0051631927490234375, 0.007274627685546875, 0.009386062622070312, 0.01149749755859375, 0.013608932495117188, 0.015720367431640625, 0.017831802368164062, 0.0199432373046875, 0.022054672241210938, 0.024166107177734375, 0.026277542114257812, 0.02838897705078125, 0.030500411987304688, 0.032611846923828125, 0.03472328186035156, 0.036834716796875, 0.03894615173339844, 0.041057586669921875, 0.04316902160644531, 0.04528045654296875, 0.04739189147949219, 0.049503326416015625, 0.05161476135253906, 0.0537261962890625, 0.05583763122558594, 0.057949066162109375, 0.06006050109863281, 0.06217193603515625, 0.06428337097167969, 0.06639480590820312, 0.06850624084472656, 0.07061767578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 9.0, 19.0, 12.0, 17.0, 14.0, 25.0, 30.0, 73.0, 88.0, 117.0, 180.0, 290.0, 481.0, 752.0, 1437.0, 2570.0, 5368.0, 12002.0, 28989.0, 78566.0, 235346.0, 822218.0, 2114936.0, 603475.0, 181948.0, 61936.0, 23441.0, 9864.0, 4618.0, 2289.0, 1259.0, 737.0, 386.0, 242.0, 159.0, 102.0, 77.0, 58.0, 38.0, 33.0, 16.0, 18.0, 16.0, 8.0, 9.0, 7.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.18212890625, -0.1768321990966797, -0.17153549194335938, -0.16623878479003906, -0.16094207763671875, -0.15564537048339844, -0.15034866333007812, -0.1450519561767578, -0.1397552490234375, -0.1344585418701172, -0.12916183471679688, -0.12386512756347656, -0.11856842041015625, -0.11327171325683594, -0.10797500610351562, -0.10267829895019531, -0.097381591796875, -0.09208488464355469, -0.08678817749023438, -0.08149147033691406, -0.07619476318359375, -0.07089805603027344, -0.06560134887695312, -0.06030464172363281, -0.0550079345703125, -0.04971122741699219, -0.044414520263671875, -0.03911781311035156, -0.03382110595703125, -0.028524398803710938, -0.023227691650390625, -0.017930984497070312, -0.01263427734375, -0.0073375701904296875, -0.002040863037109375, 0.0032558441162109375, 0.00855255126953125, 0.013849258422851562, 0.019145965576171875, 0.024442672729492188, 0.0297393798828125, 0.03503608703613281, 0.040332794189453125, 0.04562950134277344, 0.05092620849609375, 0.05622291564941406, 0.061519622802734375, 0.06681632995605469, 0.072113037109375, 0.07740974426269531, 0.08270645141601562, 0.08800315856933594, 0.09329986572265625, 0.09859657287597656, 0.10389328002929688, 0.10918998718261719, 0.1144866943359375, 0.11978340148925781, 0.12508010864257812, 0.13037681579589844, 0.13567352294921875, 0.14097023010253906, 0.14626693725585938, 0.1515636444091797, 0.1568603515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 8.0, 6.0, 12.0, 23.0, 42.0, 69.0, 139.0, 215.0, 377.0, 814.0, 1087.0, 500.0, 323.0, 200.0, 115.0, 61.0, 42.0, 14.0, 19.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30224609375, -0.2950782775878906, -0.28791046142578125, -0.2807426452636719, -0.2735748291015625, -0.2664070129394531, -0.25923919677734375, -0.2520713806152344, -0.244903564453125, -0.23773574829101562, -0.23056793212890625, -0.22340011596679688, -0.2162322998046875, -0.20906448364257812, -0.20189666748046875, -0.19472885131835938, -0.18756103515625, -0.18039321899414062, -0.17322540283203125, -0.16605758666992188, -0.1588897705078125, -0.15172195434570312, -0.14455413818359375, -0.13738632202148438, -0.130218505859375, -0.12305068969726562, -0.11588287353515625, -0.10871505737304688, -0.1015472412109375, -0.09437942504882812, -0.08721160888671875, -0.08004379272460938, -0.0728759765625, -0.06570816040039062, -0.05854034423828125, -0.051372528076171875, -0.0442047119140625, -0.037036895751953125, -0.02986907958984375, -0.022701263427734375, -0.015533447265625, -0.008365631103515625, -0.00119781494140625, 0.005970001220703125, 0.0131378173828125, 0.020305633544921875, 0.02747344970703125, 0.034641265869140625, 0.04180908203125, 0.048976898193359375, 0.05614471435546875, 0.06331253051757812, 0.0704803466796875, 0.07764816284179688, 0.08481597900390625, 0.09198379516601562, 0.099151611328125, 0.10631942749023438, 0.11348724365234375, 0.12065505981445312, 0.1278228759765625, 0.13499069213867188, 0.14215850830078125, 0.14932632446289062, 0.156494140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 21.0, 33.0, 103.0, 143.0, 185.0, 198.0, 140.0, 103.0, 47.0, 25.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.316335678100586, -2.268930196762085, -2.221524477005005, -2.174118995666504, -2.126713275909424, -2.079307794570923, -2.0319020748138428, -1.9844965934753418, -1.9370908737182617, -1.8896852731704712, -1.8422796726226807, -1.7948740720748901, -1.7474684715270996, -1.700062870979309, -1.6526572704315186, -1.6052517890930176, -1.557846188545227, -1.5104405879974365, -1.463034987449646, -1.4156293869018555, -1.368223786354065, -1.3208181858062744, -1.2734127044677734, -1.2260069847106934, -1.1786015033721924, -1.1311959028244019, -1.0837903022766113, -1.0363847017288208, -0.9889791011810303, -0.9415735006332397, -0.894167959690094, -0.8467623591423035, -0.7993565797805786, -0.7519509792327881, -0.7045453786849976, -0.657139778137207, -0.6097341775894165, -0.562328577041626, -0.5149230360984802, -0.4675174355506897, -0.42011183500289917, -0.37270623445510864, -0.3253006339073181, -0.27789506316185, -0.23048946261405945, -0.18308386206626892, -0.13567829132080078, -0.08827269077301025, -0.04086709022521973, 0.006538502871990204, 0.053944095969200134, 0.10134968161582947, 0.14875528216362, 0.19616088271141052, 0.24356645345687866, 0.2909720540046692, 0.3383776545524597, 0.38578325510025024, 0.43318885564804077, 0.4805944263935089, 0.527999997138977, 0.5754055976867676, 0.6228111982345581, 0.6702167987823486, 0.7176223993301392]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 5.0, 5.0, 5.0, 8.0, 9.0, 17.0, 11.0, 17.0, 20.0, 20.0, 28.0, 18.0, 22.0, 41.0, 29.0, 35.0, 39.0, 42.0, 42.0, 48.0, 58.0, 43.0, 37.0, 33.0, 32.0, 34.0, 27.0, 44.0, 30.0, 24.0, 31.0, 26.0, 20.0, 15.0, 16.0, 12.0, 10.0, 18.0, 6.0, 5.0, 4.0, 7.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4193037748336792, -0.40633684396743774, -0.3933699131011963, -0.38040298223495483, -0.3674360513687134, -0.3544691205024719, -0.34150218963623047, -0.328535258769989, -0.31556832790374756, -0.3026013970375061, -0.28963446617126465, -0.2766675353050232, -0.26370060443878174, -0.2507336735725403, -0.23776674270629883, -0.22479981184005737, -0.21183288097381592, -0.19886595010757446, -0.185899019241333, -0.17293208837509155, -0.1599651575088501, -0.14699822664260864, -0.1340312957763672, -0.12106436491012573, -0.10809743404388428, -0.09513050317764282, -0.08216357231140137, -0.06919664144515991, -0.05622971057891846, -0.043262779712677, -0.030295848846435547, -0.017328917980194092, -0.004361987113952637, 0.008604943752288818, 0.021571874618530273, 0.03453880548477173, 0.047505736351013184, 0.06047266721725464, 0.0734395980834961, 0.08640652894973755, 0.099373459815979, 0.11234039068222046, 0.12530732154846191, 0.13827425241470337, 0.15124118328094482, 0.16420811414718628, 0.17717504501342773, 0.1901419758796692, 0.20310890674591064, 0.2160758376121521, 0.22904276847839355, 0.242009699344635, 0.25497663021087646, 0.2679435610771179, 0.2809104919433594, 0.29387742280960083, 0.3068443536758423, 0.31981128454208374, 0.3327782154083252, 0.34574514627456665, 0.3587120771408081, 0.37167900800704956, 0.384645938873291, 0.39761286973953247, 0.4105798006057739]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 9.0, 15.0, 24.0, 24.0, 35.0, 78.0, 97.0, 153.0, 216.0, 386.0, 503.0, 842.0, 1371.0, 2228.0, 3432.0, 5643.0, 9096.0, 14925.0, 24639.0, 41316.0, 72219.0, 138896.0, 241369.0, 218716.0, 117613.0, 62553.0, 36075.0, 21686.0, 13118.0, 8088.0, 4972.0, 3007.0, 1873.0, 1206.0, 724.0, 479.0, 309.0, 209.0, 139.0, 94.0, 54.0, 34.0, 28.0, 19.0, 10.0, 8.0, 7.0, 11.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.08154296875, -0.07906246185302734, -0.07658195495605469, -0.07410144805908203, -0.07162094116210938, -0.06914043426513672, -0.06665992736816406, -0.0641794204711914, -0.06169891357421875, -0.059218406677246094, -0.05673789978027344, -0.05425739288330078, -0.051776885986328125, -0.04929637908935547, -0.04681587219238281, -0.044335365295410156, -0.0418548583984375, -0.039374351501464844, -0.03689384460449219, -0.03441333770751953, -0.031932830810546875, -0.02945232391357422, -0.026971817016601562, -0.024491310119628906, -0.02201080322265625, -0.019530296325683594, -0.017049789428710938, -0.014569282531738281, -0.012088775634765625, -0.009608268737792969, -0.0071277618408203125, -0.004647254943847656, -0.002166748046875, 0.00031375885009765625, 0.0027942657470703125, 0.005274772644042969, 0.007755279541015625, 0.010235786437988281, 0.012716293334960938, 0.015196800231933594, 0.01767730712890625, 0.020157814025878906, 0.022638320922851562, 0.02511882781982422, 0.027599334716796875, 0.03007984161376953, 0.03256034851074219, 0.035040855407714844, 0.0375213623046875, 0.040001869201660156, 0.04248237609863281, 0.04496288299560547, 0.047443389892578125, 0.04992389678955078, 0.05240440368652344, 0.054884910583496094, 0.05736541748046875, 0.059845924377441406, 0.06232643127441406, 0.06480693817138672, 0.06728744506835938, 0.06976795196533203, 0.07224845886230469, 0.07472896575927734, 0.07720947265625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 11.0, 11.0, 9.0, 11.0, 12.0, 14.0, 18.0, 26.0, 24.0, 30.0, 30.0, 30.0, 41.0, 43.0, 33.0, 44.0, 40.0, 39.0, 44.0, 39.0, 51.0, 33.0, 41.0, 30.0, 39.0, 29.0, 25.0, 35.0, 25.0, 20.0, 17.0, 16.0, 9.0, 14.0, 15.0, 9.0, 13.0, 9.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0], "bins": [-0.07391357421875, -0.0716562271118164, -0.06939888000488281, -0.06714153289794922, -0.06488418579101562, -0.06262683868408203, -0.06036949157714844, -0.058112144470214844, -0.05585479736328125, -0.053597450256347656, -0.05134010314941406, -0.04908275604248047, -0.046825408935546875, -0.04456806182861328, -0.04231071472167969, -0.040053367614746094, -0.0377960205078125, -0.035538673400878906, -0.03328132629394531, -0.03102397918701172, -0.028766632080078125, -0.02650928497314453, -0.024251937866210938, -0.021994590759277344, -0.01973724365234375, -0.017479896545410156, -0.015222549438476562, -0.012965202331542969, -0.010707855224609375, -0.008450508117675781, -0.0061931610107421875, -0.003935813903808594, -0.001678466796875, 0.0005788803100585938, 0.0028362274169921875, 0.005093574523925781, 0.007350921630859375, 0.009608268737792969, 0.011865615844726562, 0.014122962951660156, 0.01638031005859375, 0.018637657165527344, 0.020895004272460938, 0.02315235137939453, 0.025409698486328125, 0.02766704559326172, 0.029924392700195312, 0.032181739807128906, 0.0344390869140625, 0.036696434020996094, 0.03895378112792969, 0.04121112823486328, 0.043468475341796875, 0.04572582244873047, 0.04798316955566406, 0.050240516662597656, 0.05249786376953125, 0.054755210876464844, 0.05701255798339844, 0.05926990509033203, 0.061527252197265625, 0.06378459930419922, 0.06604194641113281, 0.0682992935180664, 0.070556640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 8.0, 9.0, 4.0, 11.0, 21.0, 16.0, 20.0, 25.0, 25.0, 23.0, 58.0, 81.0, 210.0, 1019.0, 6075.0, 41189.0, 336142.0, 580959.0, 70076.0, 10299.0, 1597.0, 319.0, 114.0, 43.0, 31.0, 27.0, 26.0, 25.0, 18.0, 14.0, 8.0, 10.0, 9.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.375244140625, -0.36486053466796875, -0.3544769287109375, -0.34409332275390625, -0.333709716796875, -0.32332611083984375, -0.3129425048828125, -0.30255889892578125, -0.29217529296875, -0.28179168701171875, -0.2714080810546875, -0.26102447509765625, -0.250640869140625, -0.24025726318359375, -0.2298736572265625, -0.21949005126953125, -0.2091064453125, -0.19872283935546875, -0.1883392333984375, -0.17795562744140625, -0.167572021484375, -0.15718841552734375, -0.1468048095703125, -0.13642120361328125, -0.12603759765625, -0.11565399169921875, -0.1052703857421875, -0.09488677978515625, -0.084503173828125, -0.07411956787109375, -0.0637359619140625, -0.05335235595703125, -0.04296875, -0.03258514404296875, -0.0222015380859375, -0.01181793212890625, -0.001434326171875, 0.00894927978515625, 0.0193328857421875, 0.02971649169921875, 0.04010009765625, 0.05048370361328125, 0.0608673095703125, 0.07125091552734375, 0.081634521484375, 0.09201812744140625, 0.1024017333984375, 0.11278533935546875, 0.1231689453125, 0.13355255126953125, 0.1439361572265625, 0.15431976318359375, 0.164703369140625, 0.17508697509765625, 0.1854705810546875, 0.19585418701171875, 0.20623779296875, 0.21662139892578125, 0.2270050048828125, 0.23738861083984375, 0.247772216796875, 0.25815582275390625, 0.2685394287109375, 0.27892303466796875, 0.289306640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 9.0, 3.0, 7.0, 9.0, 7.0, 12.0, 17.0, 24.0, 20.0, 26.0, 33.0, 35.0, 34.0, 40.0, 34.0, 35.0, 54.0, 49.0, 39.0, 41.0, 40.0, 45.0, 44.0, 38.0, 42.0, 36.0, 27.0, 29.0, 27.0, 24.0, 18.0, 18.0, 10.0, 14.0, 9.0, 12.0, 8.0, 9.0, 4.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2607421875, -0.25278472900390625, -0.2448272705078125, -0.23686981201171875, -0.228912353515625, -0.22095489501953125, -0.2129974365234375, -0.20503997802734375, -0.19708251953125, -0.18912506103515625, -0.1811676025390625, -0.17321014404296875, -0.165252685546875, -0.15729522705078125, -0.1493377685546875, -0.14138031005859375, -0.1334228515625, -0.12546539306640625, -0.1175079345703125, -0.10955047607421875, -0.101593017578125, -0.09363555908203125, -0.0856781005859375, -0.07772064208984375, -0.06976318359375, -0.06180572509765625, -0.0538482666015625, -0.04589080810546875, -0.037933349609375, -0.02997589111328125, -0.0220184326171875, -0.01406097412109375, -0.006103515625, 0.00185394287109375, 0.0098114013671875, 0.01776885986328125, 0.025726318359375, 0.03368377685546875, 0.0416412353515625, 0.04959869384765625, 0.05755615234375, 0.06551361083984375, 0.0734710693359375, 0.08142852783203125, 0.089385986328125, 0.09734344482421875, 0.1053009033203125, 0.11325836181640625, 0.1212158203125, 0.12917327880859375, 0.1371307373046875, 0.14508819580078125, 0.153045654296875, 0.16100311279296875, 0.1689605712890625, 0.17691802978515625, 0.18487548828125, 0.19283294677734375, 0.2007904052734375, 0.20874786376953125, 0.216705322265625, 0.22466278076171875, 0.2326202392578125, 0.24057769775390625, 0.24853515625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 12.0, 7.0, 12.0, 18.0, 26.0, 51.0, 73.0, 128.0, 242.0, 455.0, 1104.0, 2721.0, 7887.0, 21971.0, 60903.0, 200255.0, 523663.0, 150259.0, 50020.0, 18289.0, 6298.0, 2293.0, 941.0, 418.0, 209.0, 131.0, 64.0, 43.0, 19.0, 18.0, 10.0, 6.0, 6.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09326171875, -0.08972930908203125, -0.0861968994140625, -0.08266448974609375, -0.079132080078125, -0.07559967041015625, -0.0720672607421875, -0.06853485107421875, -0.06500244140625, -0.06147003173828125, -0.0579376220703125, -0.05440521240234375, -0.050872802734375, -0.04734039306640625, -0.0438079833984375, -0.04027557373046875, -0.0367431640625, -0.03321075439453125, -0.0296783447265625, -0.02614593505859375, -0.022613525390625, -0.01908111572265625, -0.0155487060546875, -0.01201629638671875, -0.00848388671875, -0.00495147705078125, -0.0014190673828125, 0.00211334228515625, 0.005645751953125, 0.00917816162109375, 0.0127105712890625, 0.01624298095703125, 0.019775390625, 0.02330780029296875, 0.0268402099609375, 0.03037261962890625, 0.033905029296875, 0.03743743896484375, 0.0409698486328125, 0.04450225830078125, 0.04803466796875, 0.05156707763671875, 0.0550994873046875, 0.05863189697265625, 0.062164306640625, 0.06569671630859375, 0.0692291259765625, 0.07276153564453125, 0.0762939453125, 0.07982635498046875, 0.0833587646484375, 0.08689117431640625, 0.090423583984375, 0.09395599365234375, 0.0974884033203125, 0.10102081298828125, 0.10455322265625, 0.10808563232421875, 0.1116180419921875, 0.11515045166015625, 0.118682861328125, 0.12221527099609375, 0.1257476806640625, 0.12928009033203125, 0.1328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 8.0, 3.0, 11.0, 15.0, 15.0, 21.0, 35.0, 37.0, 50.0, 74.0, 125.0, 128.0, 107.0, 112.0, 78.0, 55.0, 24.0, 17.0, 27.0, 14.0, 8.0, 6.0, 6.0, 7.0, 4.0, 0.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.7894973754882812e-05, -2.717692404985428e-05, -2.6458874344825745e-05, -2.574082463979721e-05, -2.5022774934768677e-05, -2.4304725229740143e-05, -2.358667552471161e-05, -2.2868625819683075e-05, -2.215057611465454e-05, -2.1432526409626007e-05, -2.0714476704597473e-05, -1.999642699956894e-05, -1.9278377294540405e-05, -1.856032758951187e-05, -1.7842277884483337e-05, -1.7124228179454803e-05, -1.640617847442627e-05, -1.5688128769397736e-05, -1.4970079064369202e-05, -1.4252029359340668e-05, -1.3533979654312134e-05, -1.28159299492836e-05, -1.2097880244255066e-05, -1.1379830539226532e-05, -1.0661780834197998e-05, -9.943731129169464e-06, -9.22568142414093e-06, -8.507631719112396e-06, -7.789582014083862e-06, -7.071532309055328e-06, -6.3534826040267944e-06, -5.6354328989982605e-06, -4.9173831939697266e-06, -4.199333488941193e-06, -3.4812837839126587e-06, -2.7632340788841248e-06, -2.045184373855591e-06, -1.3271346688270569e-06, -6.09084963798523e-07, 1.0896474123001099e-07, 8.270144462585449e-07, 1.5450641512870789e-06, 2.263113856315613e-06, 2.9811635613441467e-06, 3.6992132663726807e-06, 4.417262971401215e-06, 5.1353126764297485e-06, 5.8533623814582825e-06, 6.571412086486816e-06, 7.28946179151535e-06, 8.007511496543884e-06, 8.725561201572418e-06, 9.443610906600952e-06, 1.0161660611629486e-05, 1.087971031665802e-05, 1.1597760021686554e-05, 1.2315809726715088e-05, 1.3033859431743622e-05, 1.3751909136772156e-05, 1.446995884180069e-05, 1.5188008546829224e-05, 1.5906058251857758e-05, 1.662410795688629e-05, 1.7342157661914825e-05, 1.806020736694336e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 11.0, 9.0, 16.0, 16.0, 30.0, 45.0, 49.0, 100.0, 155.0, 294.0, 805.0, 2281.0, 7447.0, 24077.0, 75842.0, 330017.0, 461963.0, 99592.0, 31350.0, 9571.0, 3006.0, 1003.0, 375.0, 156.0, 114.0, 54.0, 45.0, 39.0, 25.0, 17.0, 15.0, 11.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1197509765625, -0.11590194702148438, -0.11205291748046875, -0.10820388793945312, -0.1043548583984375, -0.10050582885742188, -0.09665679931640625, -0.09280776977539062, -0.088958740234375, -0.08510971069335938, -0.08126068115234375, -0.07741165161132812, -0.0735626220703125, -0.06971359252929688, -0.06586456298828125, -0.062015533447265625, -0.05816650390625, -0.054317474365234375, -0.05046844482421875, -0.046619415283203125, -0.0427703857421875, -0.038921356201171875, -0.03507232666015625, -0.031223297119140625, -0.027374267578125, -0.023525238037109375, -0.01967620849609375, -0.015827178955078125, -0.0119781494140625, -0.008129119873046875, -0.00428009033203125, -0.000431060791015625, 0.00341796875, 0.007266998291015625, 0.01111602783203125, 0.014965057373046875, 0.0188140869140625, 0.022663116455078125, 0.02651214599609375, 0.030361175537109375, 0.034210205078125, 0.038059234619140625, 0.04190826416015625, 0.045757293701171875, 0.0496063232421875, 0.053455352783203125, 0.05730438232421875, 0.061153411865234375, 0.06500244140625, 0.06885147094726562, 0.07270050048828125, 0.07654953002929688, 0.0803985595703125, 0.08424758911132812, 0.08809661865234375, 0.09194564819335938, 0.095794677734375, 0.09964370727539062, 0.10349273681640625, 0.10734176635742188, 0.1111907958984375, 0.11503982543945312, 0.11888885498046875, 0.12273788452148438, 0.1265869140625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 8.0, 9.0, 13.0, 8.0, 9.0, 29.0, 31.0, 32.0, 52.0, 84.0, 104.0, 152.0, 134.0, 106.0, 79.0, 41.0, 26.0, 23.0, 17.0, 10.0, 13.0, 13.0, 9.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.1632080078125, -0.1595630645751953, -0.15591812133789062, -0.15227317810058594, -0.14862823486328125, -0.14498329162597656, -0.14133834838867188, -0.1376934051513672, -0.1340484619140625, -0.1304035186767578, -0.12675857543945312, -0.12311363220214844, -0.11946868896484375, -0.11582374572753906, -0.11217880249023438, -0.10853385925292969, -0.104888916015625, -0.10124397277832031, -0.09759902954101562, -0.09395408630371094, -0.09030914306640625, -0.08666419982910156, -0.08301925659179688, -0.07937431335449219, -0.0757293701171875, -0.07208442687988281, -0.06843948364257812, -0.06479454040527344, -0.06114959716796875, -0.05750465393066406, -0.053859710693359375, -0.05021476745605469, -0.04656982421875, -0.04292488098144531, -0.039279937744140625, -0.03563499450683594, -0.03199005126953125, -0.028345108032226562, -0.024700164794921875, -0.021055221557617188, -0.0174102783203125, -0.013765335083007812, -0.010120391845703125, -0.0064754486083984375, -0.00283050537109375, 0.0008144378662109375, 0.004459381103515625, 0.008104324340820312, 0.011749267578125, 0.015394210815429688, 0.019039154052734375, 0.022684097290039062, 0.02632904052734375, 0.029973983764648438, 0.033618927001953125, 0.03726387023925781, 0.0409088134765625, 0.04455375671386719, 0.048198699951171875, 0.05184364318847656, 0.05548858642578125, 0.05913352966308594, 0.06277847290039062, 0.06642341613769531, 0.070068359375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 17.0, 228.0, 610.0, 151.0, 16.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5815100073814392, -0.41304612159729004, -0.24458226561546326, -0.07611840963363647, 0.0923454761505127, 0.26080936193466187, 0.42927318811416626, 0.5977371335029602, 0.7662009596824646, 0.9346648454666138, 1.1031286716461182, 1.271592617034912, 1.4400564432144165, 1.608520269393921, 1.7769842147827148, 1.9454481601715088, 2.1139118671417236, 2.2823758125305176, 2.4508395195007324, 2.6193034648895264, 2.7877674102783203, 2.956231117248535, 3.124695062637329, 3.293159008026123, 3.461622953414917, 3.630086898803711, 3.798550605773926, 3.9670145511627197, 4.135478496551514, 4.3039422035217285, 4.472406387329102, 4.640870094299316, 4.8093342781066895, 4.977797985076904, 5.146262168884277, 5.314725875854492, 5.483189582824707, 5.65165376663208, 5.820117473602295, 5.988581657409668, 6.157045364379883, 6.325509071350098, 6.493973255157471, 6.6624369621276855, 6.8309006690979, 6.999364852905273, 7.167828559875488, 7.336292266845703, 7.504755973815918, 7.673219680786133, 7.841683864593506, 8.010147094726562, 8.178611755371094, 8.347075462341309, 8.515539169311523, 8.684002876281738, 8.85246753692627, 9.020931243896484, 9.1893949508667, 9.357858657836914, 9.526323318481445, 9.69478702545166, 9.863250732421875, 10.03171443939209, 10.200178146362305]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 11.0, 9.0, 12.0, 13.0, 19.0, 20.0, 32.0, 32.0, 36.0, 34.0, 32.0, 37.0, 33.0, 43.0, 52.0, 42.0, 56.0, 42.0, 46.0, 41.0, 51.0, 49.0, 40.0, 37.0, 23.0, 22.0, 26.0, 22.0, 16.0, 13.0, 12.0, 7.0, 10.0, 5.0, 4.0, 3.0, 8.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.9348077774047852, -0.910399317741394, -0.8859908580780029, -0.8615823984146118, -0.8371739387512207, -0.8127654790878296, -0.7883570194244385, -0.7639485597610474, -0.7395401000976562, -0.7151316404342651, -0.690723180770874, -0.6663147211074829, -0.6419062614440918, -0.6174978017807007, -0.5930893421173096, -0.5686808824539185, -0.5442724227905273, -0.5198639631271362, -0.4954555034637451, -0.471047043800354, -0.4466385841369629, -0.4222301244735718, -0.39782166481018066, -0.37341320514678955, -0.34900474548339844, -0.3245962858200073, -0.3001878261566162, -0.2757793664932251, -0.251370906829834, -0.22696244716644287, -0.20255398750305176, -0.17814552783966064, -0.1537371277809143, -0.1293286681175232, -0.10492020845413208, -0.08051174879074097, -0.056103289127349854, -0.03169482946395874, -0.007286369800567627, 0.017122089862823486, 0.0415305495262146, 0.06593900918960571, 0.09034746885299683, 0.11475592851638794, 0.13916438817977905, 0.16357284784317017, 0.18798130750656128, 0.2123897671699524, 0.2367982268333435, 0.2612066864967346, 0.28561514616012573, 0.31002360582351685, 0.33443206548690796, 0.3588405251502991, 0.3832489848136902, 0.4076574444770813, 0.4320659041404724, 0.4564743638038635, 0.48088282346725464, 0.5052912831306458, 0.5296997427940369, 0.554108202457428, 0.5785166621208191, 0.6029251217842102, 0.6273335814476013]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 25.0, 25.0, 37.0, 61.0, 60.0, 119.0, 173.0, 256.0, 404.0, 660.0, 920.0, 1509.0, 2635.0, 4364.0, 7710.0, 14025.0, 26677.0, 53052.0, 110359.0, 251390.0, 662081.0, 1727467.0, 796818.0, 286748.0, 123556.0, 58372.0, 29318.0, 15286.0, 8211.0, 4762.0, 2679.0, 1643.0, 1014.0, 615.0, 393.0, 294.0, 155.0, 100.0, 85.0, 79.0, 43.0, 33.0, 20.0, 11.0, 10.0, 8.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08404541015625, -0.08129692077636719, -0.07854843139648438, -0.07579994201660156, -0.07305145263671875, -0.07030296325683594, -0.06755447387695312, -0.06480598449707031, -0.0620574951171875, -0.05930900573730469, -0.056560516357421875, -0.05381202697753906, -0.05106353759765625, -0.04831504821777344, -0.045566558837890625, -0.04281806945800781, -0.040069580078125, -0.03732109069824219, -0.034572601318359375, -0.03182411193847656, -0.02907562255859375, -0.026327133178710938, -0.023578643798828125, -0.020830154418945312, -0.0180816650390625, -0.015333175659179688, -0.012584686279296875, -0.009836196899414062, -0.00708770751953125, -0.0043392181396484375, -0.001590728759765625, 0.0011577606201171875, 0.00390625, 0.0066547393798828125, 0.009403228759765625, 0.012151718139648438, 0.01490020751953125, 0.017648696899414062, 0.020397186279296875, 0.023145675659179688, 0.0258941650390625, 0.028642654418945312, 0.031391143798828125, 0.03413963317871094, 0.03688812255859375, 0.03963661193847656, 0.042385101318359375, 0.04513359069824219, 0.047882080078125, 0.05063056945800781, 0.053379058837890625, 0.05612754821777344, 0.05887603759765625, 0.06162452697753906, 0.06437301635742188, 0.06712150573730469, 0.0698699951171875, 0.07261848449707031, 0.07536697387695312, 0.07811546325683594, 0.08086395263671875, 0.08361244201660156, 0.08636093139648438, 0.08910942077636719, 0.09185791015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 4.0, 11.0, 10.0, 8.0, 12.0, 10.0, 17.0, 12.0, 22.0, 24.0, 20.0, 27.0, 25.0, 39.0, 39.0, 45.0, 42.0, 41.0, 34.0, 49.0, 37.0, 49.0, 38.0, 36.0, 42.0, 37.0, 30.0, 31.0, 30.0, 21.0, 22.0, 24.0, 16.0, 21.0, 13.0, 14.0, 11.0, 6.0, 6.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.069091796875, -0.06666278839111328, -0.06423377990722656, -0.061804771423339844, -0.059375762939453125, -0.056946754455566406, -0.05451774597167969, -0.05208873748779297, -0.04965972900390625, -0.04723072052001953, -0.04480171203613281, -0.042372703552246094, -0.039943695068359375, -0.037514686584472656, -0.03508567810058594, -0.03265666961669922, -0.0302276611328125, -0.02779865264892578, -0.025369644165039062, -0.022940635681152344, -0.020511627197265625, -0.018082618713378906, -0.015653610229492188, -0.013224601745605469, -0.01079559326171875, -0.008366584777832031, -0.0059375762939453125, -0.0035085678100585938, -0.001079559326171875, 0.0013494491577148438, 0.0037784576416015625, 0.006207466125488281, 0.008636474609375, 0.011065483093261719, 0.013494491577148438, 0.015923500061035156, 0.018352508544921875, 0.020781517028808594, 0.023210525512695312, 0.02563953399658203, 0.02806854248046875, 0.03049755096435547, 0.03292655944824219, 0.035355567932128906, 0.037784576416015625, 0.040213584899902344, 0.04264259338378906, 0.04507160186767578, 0.0475006103515625, 0.04992961883544922, 0.05235862731933594, 0.054787635803222656, 0.057216644287109375, 0.059645652770996094, 0.06207466125488281, 0.06450366973876953, 0.06693267822265625, 0.06936168670654297, 0.07179069519042969, 0.0742197036743164, 0.07664871215820312, 0.07907772064208984, 0.08150672912597656, 0.08393573760986328, 0.08636474609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 2.0, 10.0, 7.0, 21.0, 35.0, 49.0, 59.0, 92.0, 144.0, 222.0, 348.0, 582.0, 994.0, 1834.0, 3625.0, 7466.0, 17286.0, 45523.0, 132692.0, 444661.0, 1847229.0, 1231068.0, 305510.0, 95198.0, 33644.0, 13326.0, 5983.0, 2852.0, 1534.0, 896.0, 481.0, 290.0, 194.0, 132.0, 111.0, 53.0, 40.0, 27.0, 26.0, 12.0, 7.0, 4.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1611328125, -0.155548095703125, -0.14996337890625, -0.144378662109375, -0.1387939453125, -0.133209228515625, -0.12762451171875, -0.122039794921875, -0.116455078125, -0.110870361328125, -0.10528564453125, -0.099700927734375, -0.0941162109375, -0.088531494140625, -0.08294677734375, -0.077362060546875, -0.07177734375, -0.066192626953125, -0.06060791015625, -0.055023193359375, -0.0494384765625, -0.043853759765625, -0.03826904296875, -0.032684326171875, -0.027099609375, -0.021514892578125, -0.01593017578125, -0.010345458984375, -0.0047607421875, 0.000823974609375, 0.00640869140625, 0.011993408203125, 0.017578125, 0.023162841796875, 0.02874755859375, 0.034332275390625, 0.0399169921875, 0.045501708984375, 0.05108642578125, 0.056671142578125, 0.062255859375, 0.067840576171875, 0.07342529296875, 0.079010009765625, 0.0845947265625, 0.090179443359375, 0.09576416015625, 0.101348876953125, 0.10693359375, 0.112518310546875, 0.11810302734375, 0.123687744140625, 0.1292724609375, 0.134857177734375, 0.14044189453125, 0.146026611328125, 0.151611328125, 0.157196044921875, 0.16278076171875, 0.168365478515625, 0.1739501953125, 0.179534912109375, 0.18511962890625, 0.190704345703125, 0.1962890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 5.0, 13.0, 13.0, 26.0, 31.0, 58.0, 66.0, 106.0, 194.0, 273.0, 473.0, 676.0, 770.0, 469.0, 308.0, 206.0, 119.0, 88.0, 54.0, 47.0, 26.0, 9.0, 14.0, 9.0, 2.0, 8.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.266845703125, -0.2601776123046875, -0.253509521484375, -0.2468414306640625, -0.24017333984375, -0.2335052490234375, -0.226837158203125, -0.2201690673828125, -0.2135009765625, -0.2068328857421875, -0.200164794921875, -0.1934967041015625, -0.18682861328125, -0.1801605224609375, -0.173492431640625, -0.1668243408203125, -0.16015625, -0.1534881591796875, -0.146820068359375, -0.1401519775390625, -0.13348388671875, -0.1268157958984375, -0.120147705078125, -0.1134796142578125, -0.1068115234375, -0.1001434326171875, -0.093475341796875, -0.0868072509765625, -0.08013916015625, -0.0734710693359375, -0.066802978515625, -0.0601348876953125, -0.053466796875, -0.0467987060546875, -0.040130615234375, -0.0334625244140625, -0.02679443359375, -0.0201263427734375, -0.013458251953125, -0.0067901611328125, -0.0001220703125, 0.0065460205078125, 0.013214111328125, 0.0198822021484375, 0.02655029296875, 0.0332183837890625, 0.039886474609375, 0.0465545654296875, 0.05322265625, 0.0598907470703125, 0.066558837890625, 0.0732269287109375, 0.07989501953125, 0.0865631103515625, 0.093231201171875, 0.0998992919921875, 0.1065673828125, 0.1132354736328125, 0.119903564453125, 0.1265716552734375, 0.13323974609375, 0.1399078369140625, 0.146575927734375, 0.1532440185546875, 0.159912109375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 8.0, 12.0, 25.0, 34.0, 53.0, 79.0, 90.0, 129.0, 143.0, 123.0, 104.0, 76.0, 45.0, 34.0, 27.0, 14.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7484586238861084, -1.7100229263305664, -1.6715872287750244, -1.633151650428772, -1.59471595287323, -1.556280255317688, -1.5178446769714355, -1.4794089794158936, -1.4409732818603516, -1.4025375843048096, -1.3641018867492676, -1.3256663084030151, -1.2872306108474731, -1.2487949132919312, -1.2103593349456787, -1.1719236373901367, -1.1334879398345947, -1.0950522422790527, -1.0566165447235107, -1.0181809663772583, -0.9797452688217163, -0.9413095712661743, -0.9028739333152771, -0.8644382953643799, -0.8260025978088379, -0.7875669002532959, -0.7491312623023987, -0.7106956243515015, -0.6722599267959595, -0.6338242292404175, -0.5953885912895203, -0.556952953338623, -0.5185173749923706, -0.480081707239151, -0.4416460394859314, -0.4032103717327118, -0.3647747039794922, -0.3263390362262726, -0.287903368473053, -0.24946770071983337, -0.21103203296661377, -0.17259636521339417, -0.13416069746017456, -0.09572502970695496, -0.05728936195373535, -0.018853694200515747, 0.019581973552703857, 0.05801764130592346, 0.09645330905914307, 0.13488897681236267, 0.17332464456558228, 0.21176031231880188, 0.2501959800720215, 0.2886316478252411, 0.3270673155784607, 0.3655029833316803, 0.4039386510848999, 0.4423743188381195, 0.4808099865913391, 0.5192456245422363, 0.5576813220977783, 0.5961170196533203, 0.6345526576042175, 0.6729882955551147, 0.7114239931106567]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 5.0, 3.0, 13.0, 11.0, 12.0, 11.0, 14.0, 13.0, 25.0, 36.0, 41.0, 23.0, 35.0, 43.0, 36.0, 44.0, 47.0, 36.0, 46.0, 39.0, 49.0, 45.0, 35.0, 33.0, 41.0, 30.0, 23.0, 30.0, 22.0, 28.0, 19.0, 18.0, 16.0, 17.0, 9.0, 12.0, 7.0, 11.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.570195198059082, -0.551947295665741, -0.5336993336677551, -0.5154514312744141, -0.4972034692764282, -0.47895556688308716, -0.4607076346874237, -0.44245970249176025, -0.4242117702960968, -0.40596383810043335, -0.3877159059047699, -0.36946797370910645, -0.3512200713157654, -0.33297210931777954, -0.3147242069244385, -0.296476274728775, -0.2782283425331116, -0.2599804103374481, -0.24173247814178467, -0.2234845608472824, -0.20523662865161896, -0.1869886964559555, -0.16874077916145325, -0.1504928469657898, -0.13224491477012634, -0.11399698257446289, -0.09574905782938004, -0.07750113308429718, -0.05925320088863373, -0.041005268692970276, -0.02275734394788742, -0.004509419202804565, 0.013738512992858887, 0.03198644146323204, 0.050234369933605194, 0.06848229467868805, 0.0867302268743515, 0.10497815907001495, 0.12322608381509781, 0.14147400856018066, 0.15972194075584412, 0.17796987295150757, 0.19621780514717102, 0.21446572244167328, 0.23271365463733673, 0.2509616017341614, 0.26920950412750244, 0.2874574363231659, 0.30570536851882935, 0.3239533007144928, 0.34220123291015625, 0.3604491651058197, 0.37869709730148315, 0.3969449996948242, 0.41519293189048767, 0.4334408640861511, 0.4516887962818146, 0.469936728477478, 0.4881846606731415, 0.5064325928688049, 0.524680495262146, 0.5429284572601318, 0.5611763596534729, 0.579424262046814, 0.5976722240447998]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 9.0, 5.0, 12.0, 31.0, 38.0, 61.0, 98.0, 120.0, 226.0, 300.0, 403.0, 672.0, 990.0, 1515.0, 2215.0, 3372.0, 4966.0, 7164.0, 10889.0, 16163.0, 25282.0, 40978.0, 69242.0, 121497.0, 199055.0, 208628.0, 133571.0, 76430.0, 44741.0, 27161.0, 17472.0, 11501.0, 7795.0, 5144.0, 3612.0, 2381.0, 1630.0, 1012.0, 727.0, 478.0, 327.0, 223.0, 146.0, 81.0, 68.0, 48.0, 35.0, 19.0, 11.0, 8.0, 6.0, 3.0, 0.0, 0.0, 5.0, 1.0], "bins": [-0.10711669921875, -0.10387897491455078, -0.10064125061035156, -0.09740352630615234, -0.09416580200195312, -0.0909280776977539, -0.08769035339355469, -0.08445262908935547, -0.08121490478515625, -0.07797718048095703, -0.07473945617675781, -0.0715017318725586, -0.06826400756835938, -0.06502628326416016, -0.06178855895996094, -0.05855083465576172, -0.0553131103515625, -0.05207538604736328, -0.04883766174316406, -0.045599937438964844, -0.042362213134765625, -0.039124488830566406, -0.03588676452636719, -0.03264904022216797, -0.02941131591796875, -0.02617359161376953, -0.022935867309570312, -0.019698143005371094, -0.016460418701171875, -0.013222694396972656, -0.009984970092773438, -0.006747245788574219, -0.003509521484375, -0.00027179718017578125, 0.0029659271240234375, 0.006203651428222656, 0.009441375732421875, 0.012679100036621094, 0.015916824340820312, 0.01915454864501953, 0.02239227294921875, 0.02562999725341797, 0.028867721557617188, 0.032105445861816406, 0.035343170166015625, 0.038580894470214844, 0.04181861877441406, 0.04505634307861328, 0.0482940673828125, 0.05153179168701172, 0.05476951599121094, 0.058007240295410156, 0.061244964599609375, 0.0644826889038086, 0.06772041320800781, 0.07095813751220703, 0.07419586181640625, 0.07743358612060547, 0.08067131042480469, 0.0839090347290039, 0.08714675903320312, 0.09038448333740234, 0.09362220764160156, 0.09685993194580078, 0.10009765625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 3.0, 5.0, 12.0, 13.0, 20.0, 10.0, 24.0, 21.0, 35.0, 27.0, 21.0, 23.0, 32.0, 35.0, 29.0, 37.0, 47.0, 40.0, 36.0, 40.0, 40.0, 49.0, 33.0, 38.0, 31.0, 38.0, 29.0, 42.0, 25.0, 26.0, 20.0, 17.0, 10.0, 16.0, 17.0, 11.0, 8.0, 8.0, 8.0, 4.0, 8.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06634521484375, -0.06409645080566406, -0.061847686767578125, -0.05959892272949219, -0.05735015869140625, -0.05510139465332031, -0.052852630615234375, -0.05060386657714844, -0.0483551025390625, -0.04610633850097656, -0.043857574462890625, -0.04160881042480469, -0.03936004638671875, -0.03711128234863281, -0.034862518310546875, -0.03261375427246094, -0.030364990234375, -0.028116226196289062, -0.025867462158203125, -0.023618698120117188, -0.02136993408203125, -0.019121170043945312, -0.016872406005859375, -0.014623641967773438, -0.0123748779296875, -0.010126113891601562, -0.007877349853515625, -0.0056285858154296875, -0.00337982177734375, -0.0011310577392578125, 0.001117706298828125, 0.0033664703369140625, 0.005615234375, 0.007863998413085938, 0.010112762451171875, 0.012361526489257812, 0.01461029052734375, 0.016859054565429688, 0.019107818603515625, 0.021356582641601562, 0.0236053466796875, 0.025854110717773438, 0.028102874755859375, 0.030351638793945312, 0.03260040283203125, 0.03484916687011719, 0.037097930908203125, 0.03934669494628906, 0.041595458984375, 0.04384422302246094, 0.046092987060546875, 0.04834175109863281, 0.05059051513671875, 0.05283927917480469, 0.055088043212890625, 0.05733680725097656, 0.0595855712890625, 0.06183433532714844, 0.06408309936523438, 0.06633186340332031, 0.06858062744140625, 0.07082939147949219, 0.07307815551757812, 0.07532691955566406, 0.07757568359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 8.0, 7.0, 7.0, 11.0, 7.0, 25.0, 27.0, 40.0, 63.0, 102.0, 141.0, 236.0, 406.0, 885.0, 1667.0, 3688.0, 8066.0, 17250.0, 36687.0, 83057.0, 200263.0, 347557.0, 198417.0, 81780.0, 36245.0, 16910.0, 7747.0, 3678.0, 1733.0, 772.0, 419.0, 205.0, 143.0, 86.0, 56.0, 46.0, 34.0, 24.0, 12.0, 5.0, 12.0, 9.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.14923477172851562, -0.14380645751953125, -0.13837814331054688, -0.1329498291015625, -0.12752151489257812, -0.12209320068359375, -0.11666488647460938, -0.111236572265625, -0.10580825805664062, -0.10037994384765625, -0.09495162963867188, -0.0895233154296875, -0.08409500122070312, -0.07866668701171875, -0.07323837280273438, -0.06781005859375, -0.062381744384765625, -0.05695343017578125, -0.051525115966796875, -0.0460968017578125, -0.040668487548828125, -0.03524017333984375, -0.029811859130859375, -0.024383544921875, -0.018955230712890625, -0.01352691650390625, -0.008098602294921875, -0.0026702880859375, 0.002758026123046875, 0.00818634033203125, 0.013614654541015625, 0.01904296875, 0.024471282958984375, 0.02989959716796875, 0.035327911376953125, 0.0407562255859375, 0.046184539794921875, 0.05161285400390625, 0.057041168212890625, 0.062469482421875, 0.06789779663085938, 0.07332611083984375, 0.07875442504882812, 0.0841827392578125, 0.08961105346679688, 0.09503936767578125, 0.10046768188476562, 0.10589599609375, 0.11132431030273438, 0.11675262451171875, 0.12218093872070312, 0.1276092529296875, 0.13303756713867188, 0.13846588134765625, 0.14389419555664062, 0.149322509765625, 0.15475082397460938, 0.16017913818359375, 0.16560745239257812, 0.1710357666015625, 0.17646408081054688, 0.18189239501953125, 0.18732070922851562, 0.1927490234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 5.0, 10.0, 14.0, 11.0, 8.0, 16.0, 22.0, 24.0, 27.0, 26.0, 32.0, 28.0, 37.0, 42.0, 44.0, 48.0, 44.0, 45.0, 40.0, 46.0, 44.0, 63.0, 45.0, 43.0, 44.0, 24.0, 22.0, 14.0, 30.0, 24.0, 11.0, 8.0, 9.0, 6.0, 8.0, 1.0, 4.0, 7.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.260986328125, -0.2518463134765625, -0.242706298828125, -0.2335662841796875, -0.22442626953125, -0.2152862548828125, -0.206146240234375, -0.1970062255859375, -0.1878662109375, -0.1787261962890625, -0.169586181640625, -0.1604461669921875, -0.15130615234375, -0.1421661376953125, -0.133026123046875, -0.1238861083984375, -0.11474609375, -0.1056060791015625, -0.096466064453125, -0.0873260498046875, -0.07818603515625, -0.0690460205078125, -0.059906005859375, -0.0507659912109375, -0.0416259765625, -0.0324859619140625, -0.023345947265625, -0.0142059326171875, -0.00506591796875, 0.0040740966796875, 0.013214111328125, 0.0223541259765625, 0.031494140625, 0.0406341552734375, 0.049774169921875, 0.0589141845703125, 0.06805419921875, 0.0771942138671875, 0.086334228515625, 0.0954742431640625, 0.1046142578125, 0.1137542724609375, 0.122894287109375, 0.1320343017578125, 0.14117431640625, 0.1503143310546875, 0.159454345703125, 0.1685943603515625, 0.177734375, 0.1868743896484375, 0.196014404296875, 0.2051544189453125, 0.21429443359375, 0.2234344482421875, 0.232574462890625, 0.2417144775390625, 0.2508544921875, 0.2599945068359375, 0.269134521484375, 0.2782745361328125, 0.28741455078125, 0.2965545654296875, 0.305694580078125, 0.3148345947265625, 0.323974609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 13.0, 18.0, 20.0, 35.0, 47.0, 69.0, 111.0, 173.0, 325.0, 579.0, 1173.0, 2280.0, 4579.0, 9528.0, 20199.0, 45106.0, 111347.0, 299643.0, 333591.0, 126458.0, 50194.0, 22392.0, 10403.0, 5069.0, 2426.0, 1210.0, 630.0, 387.0, 226.0, 121.0, 67.0, 39.0, 30.0, 21.0, 20.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1123046875, -0.1090078353881836, -0.10571098327636719, -0.10241413116455078, -0.09911727905273438, -0.09582042694091797, -0.09252357482910156, -0.08922672271728516, -0.08592987060546875, -0.08263301849365234, -0.07933616638183594, -0.07603931427001953, -0.07274246215820312, -0.06944561004638672, -0.06614875793457031, -0.0628519058227539, -0.0595550537109375, -0.056258201599121094, -0.05296134948730469, -0.04966449737548828, -0.046367645263671875, -0.04307079315185547, -0.03977394104003906, -0.036477088928222656, -0.03318023681640625, -0.029883384704589844, -0.026586532592773438, -0.02328968048095703, -0.019992828369140625, -0.01669597625732422, -0.013399124145507812, -0.010102272033691406, -0.006805419921875, -0.0035085678100585938, -0.0002117156982421875, 0.0030851364135742188, 0.006381988525390625, 0.009678840637207031, 0.012975692749023438, 0.016272544860839844, 0.01956939697265625, 0.022866249084472656, 0.026163101196289062, 0.02945995330810547, 0.032756805419921875, 0.03605365753173828, 0.03935050964355469, 0.042647361755371094, 0.0459442138671875, 0.049241065979003906, 0.05253791809082031, 0.05583477020263672, 0.059131622314453125, 0.06242847442626953, 0.06572532653808594, 0.06902217864990234, 0.07231903076171875, 0.07561588287353516, 0.07891273498535156, 0.08220958709716797, 0.08550643920898438, 0.08880329132080078, 0.09210014343261719, 0.0953969955444336, 0.09869384765625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 12.0, 4.0, 7.0, 9.0, 11.0, 11.0, 13.0, 17.0, 28.0, 37.0, 34.0, 49.0, 60.0, 85.0, 106.0, 95.0, 73.0, 72.0, 48.0, 56.0, 34.0, 27.0, 21.0, 14.0, 10.0, 9.0, 11.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.1517276763916016e-05, -2.080574631690979e-05, -2.0094215869903564e-05, -1.938268542289734e-05, -1.8671154975891113e-05, -1.7959624528884888e-05, -1.7248094081878662e-05, -1.6536563634872437e-05, -1.582503318786621e-05, -1.5113502740859985e-05, -1.440197229385376e-05, -1.3690441846847534e-05, -1.2978911399841309e-05, -1.2267380952835083e-05, -1.1555850505828857e-05, -1.0844320058822632e-05, -1.0132789611816406e-05, -9.42125916481018e-06, -8.709728717803955e-06, -7.99819827079773e-06, -7.286667823791504e-06, -6.575137376785278e-06, -5.863606929779053e-06, -5.152076482772827e-06, -4.4405460357666016e-06, -3.729015588760376e-06, -3.0174851417541504e-06, -2.305954694747925e-06, -1.5944242477416992e-06, -8.828938007354736e-07, -1.7136335372924805e-07, 5.401670932769775e-07, 1.2516975402832031e-06, 1.9632279872894287e-06, 2.6747584342956543e-06, 3.38628888130188e-06, 4.0978193283081055e-06, 4.809349775314331e-06, 5.520880222320557e-06, 6.232410669326782e-06, 6.943941116333008e-06, 7.655471563339233e-06, 8.367002010345459e-06, 9.078532457351685e-06, 9.79006290435791e-06, 1.0501593351364136e-05, 1.1213123798370361e-05, 1.1924654245376587e-05, 1.2636184692382812e-05, 1.3347715139389038e-05, 1.4059245586395264e-05, 1.477077603340149e-05, 1.5482306480407715e-05, 1.619383692741394e-05, 1.6905367374420166e-05, 1.761689782142639e-05, 1.8328428268432617e-05, 1.9039958715438843e-05, 1.975148916244507e-05, 2.0463019609451294e-05, 2.117455005645752e-05, 2.1886080503463745e-05, 2.259761095046997e-05, 2.3309141397476196e-05, 2.4020671844482422e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 8.0, 12.0, 24.0, 32.0, 45.0, 67.0, 104.0, 173.0, 272.0, 447.0, 806.0, 1280.0, 2406.0, 4493.0, 8563.0, 16644.0, 33022.0, 68741.0, 149148.0, 300922.0, 244350.0, 111093.0, 52496.0, 25464.0, 12867.0, 6702.0, 3678.0, 1983.0, 1104.0, 643.0, 341.0, 195.0, 156.0, 88.0, 50.0, 33.0, 28.0, 27.0, 9.0, 7.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.088134765625, -0.08552837371826172, -0.08292198181152344, -0.08031558990478516, -0.07770919799804688, -0.0751028060913086, -0.07249641418457031, -0.06989002227783203, -0.06728363037109375, -0.06467723846435547, -0.06207084655761719, -0.059464454650878906, -0.056858062744140625, -0.054251670837402344, -0.05164527893066406, -0.04903888702392578, -0.0464324951171875, -0.04382610321044922, -0.04121971130371094, -0.038613319396972656, -0.036006927490234375, -0.033400535583496094, -0.030794143676757812, -0.02818775177001953, -0.02558135986328125, -0.02297496795654297, -0.020368576049804688, -0.017762184143066406, -0.015155792236328125, -0.012549400329589844, -0.009943008422851562, -0.007336616516113281, -0.004730224609375, -0.0021238327026367188, 0.0004825592041015625, 0.0030889511108398438, 0.005695343017578125, 0.008301734924316406, 0.010908126831054688, 0.013514518737792969, 0.01612091064453125, 0.01872730255126953, 0.021333694458007812, 0.023940086364746094, 0.026546478271484375, 0.029152870178222656, 0.03175926208496094, 0.03436565399169922, 0.0369720458984375, 0.03957843780517578, 0.04218482971191406, 0.044791221618652344, 0.047397613525390625, 0.050004005432128906, 0.05261039733886719, 0.05521678924560547, 0.05782318115234375, 0.06042957305908203, 0.06303596496582031, 0.0656423568725586, 0.06824874877929688, 0.07085514068603516, 0.07346153259277344, 0.07606792449951172, 0.07867431640625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 1.0, 3.0, 4.0, 7.0, 6.0, 7.0, 10.0, 7.0, 14.0, 13.0, 18.0, 22.0, 25.0, 31.0, 36.0, 41.0, 59.0, 66.0, 76.0, 85.0, 87.0, 53.0, 58.0, 54.0, 38.0, 38.0, 29.0, 23.0, 12.0, 9.0, 19.0, 4.0, 12.0, 9.0, 5.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.10015869140625, -0.09710311889648438, -0.09404754638671875, -0.09099197387695312, -0.0879364013671875, -0.08488082885742188, -0.08182525634765625, -0.07876968383789062, -0.075714111328125, -0.07265853881835938, -0.06960296630859375, -0.06654739379882812, -0.0634918212890625, -0.060436248779296875, -0.05738067626953125, -0.054325103759765625, -0.05126953125, -0.048213958740234375, -0.04515838623046875, -0.042102813720703125, -0.0390472412109375, -0.035991668701171875, -0.03293609619140625, -0.029880523681640625, -0.026824951171875, -0.023769378662109375, -0.02071380615234375, -0.017658233642578125, -0.0146026611328125, -0.011547088623046875, -0.00849151611328125, -0.005435943603515625, -0.00238037109375, 0.000675201416015625, 0.00373077392578125, 0.006786346435546875, 0.0098419189453125, 0.012897491455078125, 0.01595306396484375, 0.019008636474609375, 0.022064208984375, 0.025119781494140625, 0.02817535400390625, 0.031230926513671875, 0.0342864990234375, 0.037342071533203125, 0.04039764404296875, 0.043453216552734375, 0.0465087890625, 0.049564361572265625, 0.05261993408203125, 0.055675506591796875, 0.0587310791015625, 0.061786651611328125, 0.06484222412109375, 0.06789779663085938, 0.070953369140625, 0.07400894165039062, 0.07706451416015625, 0.08012008666992188, 0.0831756591796875, 0.08623123168945312, 0.08928680419921875, 0.09234237670898438, 0.09539794921875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 11.0, 32.0, 132.0, 291.0, 313.0, 163.0, 55.0, 16.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.985721588134766, -5.870831489562988, -5.755941390991211, -5.641051769256592, -5.5261616706848145, -5.411271572113037, -5.296381950378418, -5.181491851806641, -5.066601753234863, -4.951711654663086, -4.836821556091309, -4.7219319343566895, -4.607041835784912, -4.492151737213135, -4.377262115478516, -4.262372016906738, -4.147481918334961, -4.032591819763184, -3.9177019596099854, -3.802812099456787, -3.6879220008850098, -3.5730319023132324, -3.458142042160034, -3.343252182006836, -3.2283620834350586, -3.1134719848632812, -2.998582124710083, -2.8836922645568848, -2.7688021659851074, -2.65391206741333, -2.539022207260132, -2.4241323471069336, -2.3092422485351562, -2.194352149963379, -2.0794622898101807, -1.9645723104476929, -1.849682331085205, -1.7347923517227173, -1.6199023723602295, -1.5050123929977417, -1.390122413635254, -1.2752324342727661, -1.1603424549102783, -1.0454524755477905, -0.9305624961853027, -0.8156725168228149, -0.7007825374603271, -0.5858925580978394, -0.47100257873535156, -0.35611259937286377, -0.24122262001037598, -0.12633264064788818, -0.01144266128540039, 0.1034473180770874, 0.2183372974395752, 0.333227276802063, 0.4481172561645508, 0.5630072355270386, 0.6778972148895264, 0.7927871942520142, 0.907677173614502, 1.0225671529769897, 1.1374571323394775, 1.2523471117019653, 1.3672370910644531]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 7.0, 8.0, 7.0, 14.0, 15.0, 6.0, 24.0, 24.0, 25.0, 28.0, 38.0, 33.0, 35.0, 34.0, 29.0, 45.0, 48.0, 46.0, 28.0, 48.0, 52.0, 43.0, 43.0, 45.0, 38.0, 40.0, 29.0, 24.0, 25.0, 21.0, 12.0, 16.0, 11.0, 11.0, 13.0, 2.0, 9.0, 6.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.0381935834884644, -1.0098590850830078, -0.981524646282196, -0.9531902074813843, -0.9248557090759277, -0.896521270275116, -0.8681868314743042, -0.8398523330688477, -0.8115178346633911, -0.7831833958625793, -0.7548488974571228, -0.726514458656311, -0.6981799602508545, -0.6698455214500427, -0.641511082649231, -0.6131765842437744, -0.5848421454429626, -0.5565077066421509, -0.5281732082366943, -0.49983876943588257, -0.471504271030426, -0.44316983222961426, -0.4148353636264801, -0.38650089502334595, -0.3581664264202118, -0.32983195781707764, -0.3014974892139435, -0.2731630206108093, -0.24482856690883636, -0.2164940983057022, -0.18815964460372925, -0.1598251760005951, -0.1314907670021057, -0.10315629839897156, -0.074821837246418, -0.04648737609386444, -0.018152907490730286, 0.01018156111240387, 0.03851601481437683, 0.06685048341751099, 0.09518495202064514, 0.1235194206237793, 0.15185388922691345, 0.1801883429288864, 0.20852281153202057, 0.23685728013515472, 0.2651917338371277, 0.29352620244026184, 0.321860671043396, 0.35019513964653015, 0.3785296082496643, 0.4068640470504761, 0.4351985454559326, 0.4635329842567444, 0.49186745285987854, 0.5202019214630127, 0.5485364198684692, 0.576870858669281, 0.6052053570747375, 0.6335397958755493, 0.6618742942810059, 0.6902087330818176, 0.7185431718826294, 0.7468776702880859, 0.7752121090888977]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 6.0, 8.0, 19.0, 20.0, 26.0, 43.0, 62.0, 99.0, 173.0, 330.0, 499.0, 984.0, 1741.0, 3106.0, 5608.0, 10671.0, 21989.0, 46339.0, 104562.0, 253107.0, 756947.0, 1907780.0, 668363.0, 231081.0, 95596.0, 42965.0, 20137.0, 10252.0, 5234.0, 2804.0, 1521.0, 897.0, 499.0, 306.0, 177.0, 113.0, 78.0, 53.0, 33.0, 24.0, 15.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10150146484375, -0.09805488586425781, -0.09460830688476562, -0.09116172790527344, -0.08771514892578125, -0.08426856994628906, -0.08082199096679688, -0.07737541198730469, -0.0739288330078125, -0.07048225402832031, -0.06703567504882812, -0.06358909606933594, -0.06014251708984375, -0.05669593811035156, -0.053249359130859375, -0.04980278015136719, -0.046356201171875, -0.04290962219238281, -0.039463043212890625, -0.03601646423339844, -0.03256988525390625, -0.029123306274414062, -0.025676727294921875, -0.022230148315429688, -0.0187835693359375, -0.015336990356445312, -0.011890411376953125, -0.008443832397460938, -0.00499725341796875, -0.0015506744384765625, 0.001895904541015625, 0.0053424835205078125, 0.0087890625, 0.012235641479492188, 0.015682220458984375, 0.019128799438476562, 0.02257537841796875, 0.026021957397460938, 0.029468536376953125, 0.03291511535644531, 0.0363616943359375, 0.03980827331542969, 0.043254852294921875, 0.04670143127441406, 0.05014801025390625, 0.05359458923339844, 0.057041168212890625, 0.06048774719238281, 0.063934326171875, 0.06738090515136719, 0.07082748413085938, 0.07427406311035156, 0.07772064208984375, 0.08116722106933594, 0.08461380004882812, 0.08806037902832031, 0.0915069580078125, 0.09495353698730469, 0.09840011596679688, 0.10184669494628906, 0.10529327392578125, 0.10873985290527344, 0.11218643188476562, 0.11563301086425781, 0.11907958984375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 11.0, 8.0, 19.0, 14.0, 19.0, 24.0, 15.0, 28.0, 34.0, 35.0, 32.0, 45.0, 38.0, 47.0, 43.0, 53.0, 45.0, 49.0, 48.0, 57.0, 58.0, 30.0, 38.0, 30.0, 29.0, 23.0, 20.0, 15.0, 14.0, 13.0, 12.0, 10.0, 11.0, 4.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07415771484375, -0.07134342193603516, -0.06852912902832031, -0.06571483612060547, -0.06290054321289062, -0.06008625030517578, -0.05727195739746094, -0.054457664489746094, -0.05164337158203125, -0.048829078674316406, -0.04601478576660156, -0.04320049285888672, -0.040386199951171875, -0.03757190704345703, -0.03475761413574219, -0.031943321228027344, -0.0291290283203125, -0.026314735412597656, -0.023500442504882812, -0.02068614959716797, -0.017871856689453125, -0.015057563781738281, -0.012243270874023438, -0.009428977966308594, -0.00661468505859375, -0.0038003921508789062, -0.0009860992431640625, 0.0018281936645507812, 0.004642486572265625, 0.007456779479980469, 0.010271072387695312, 0.013085365295410156, 0.015899658203125, 0.018713951110839844, 0.021528244018554688, 0.02434253692626953, 0.027156829833984375, 0.02997112274169922, 0.03278541564941406, 0.035599708557128906, 0.03841400146484375, 0.041228294372558594, 0.04404258728027344, 0.04685688018798828, 0.049671173095703125, 0.05248546600341797, 0.05529975891113281, 0.058114051818847656, 0.0609283447265625, 0.06374263763427734, 0.06655693054199219, 0.06937122344970703, 0.07218551635742188, 0.07499980926513672, 0.07781410217285156, 0.0806283950805664, 0.08344268798828125, 0.0862569808959961, 0.08907127380371094, 0.09188556671142578, 0.09469985961914062, 0.09751415252685547, 0.10032844543457031, 0.10314273834228516, 0.10595703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 6.0, 7.0, 5.0, 18.0, 28.0, 46.0, 55.0, 95.0, 140.0, 250.0, 342.0, 560.0, 910.0, 1509.0, 2570.0, 4678.0, 8840.0, 17218.0, 35153.0, 75772.0, 167144.0, 403065.0, 1174443.0, 1444951.0, 487722.0, 198271.0, 87477.0, 40871.0, 19633.0, 10041.0, 5254.0, 2861.0, 1678.0, 965.0, 601.0, 391.0, 256.0, 158.0, 103.0, 60.0, 52.0, 30.0, 25.0, 13.0, 10.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.130615234375, -0.12627601623535156, -0.12193679809570312, -0.11759757995605469, -0.11325836181640625, -0.10891914367675781, -0.10457992553710938, -0.10024070739746094, -0.0959014892578125, -0.09156227111816406, -0.08722305297851562, -0.08288383483886719, -0.07854461669921875, -0.07420539855957031, -0.06986618041992188, -0.06552696228027344, -0.061187744140625, -0.05684852600097656, -0.052509307861328125, -0.04817008972167969, -0.04383087158203125, -0.03949165344238281, -0.035152435302734375, -0.030813217163085938, -0.0264739990234375, -0.022134780883789062, -0.017795562744140625, -0.013456344604492188, -0.00911712646484375, -0.0047779083251953125, -0.000438690185546875, 0.0039005279541015625, 0.00823974609375, 0.012578964233398438, 0.016918182373046875, 0.021257400512695312, 0.02559661865234375, 0.029935836791992188, 0.034275054931640625, 0.03861427307128906, 0.0429534912109375, 0.04729270935058594, 0.051631927490234375, 0.05597114562988281, 0.06031036376953125, 0.06464958190917969, 0.06898880004882812, 0.07332801818847656, 0.077667236328125, 0.08200645446777344, 0.08634567260742188, 0.09068489074707031, 0.09502410888671875, 0.09936332702636719, 0.10370254516601562, 0.10804176330566406, 0.1123809814453125, 0.11672019958496094, 0.12105941772460938, 0.1253986358642578, 0.12973785400390625, 0.1340770721435547, 0.13841629028320312, 0.14275550842285156, 0.1470947265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 9.0, 14.0, 12.0, 20.0, 27.0, 49.0, 60.0, 107.0, 136.0, 161.0, 315.0, 475.0, 759.0, 650.0, 446.0, 281.0, 163.0, 114.0, 86.0, 63.0, 38.0, 14.0, 26.0, 16.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267578125, -0.26053810119628906, -0.2534980773925781, -0.2464580535888672, -0.23941802978515625, -0.2323780059814453, -0.22533798217773438, -0.21829795837402344, -0.2112579345703125, -0.20421791076660156, -0.19717788696289062, -0.1901378631591797, -0.18309783935546875, -0.1760578155517578, -0.16901779174804688, -0.16197776794433594, -0.154937744140625, -0.14789772033691406, -0.14085769653320312, -0.1338176727294922, -0.12677764892578125, -0.11973762512207031, -0.11269760131835938, -0.10565757751464844, -0.0986175537109375, -0.09157752990722656, -0.08453750610351562, -0.07749748229980469, -0.07045745849609375, -0.06341743469238281, -0.056377410888671875, -0.04933738708496094, -0.04229736328125, -0.03525733947753906, -0.028217315673828125, -0.021177291870117188, -0.01413726806640625, -0.0070972442626953125, -5.7220458984375e-05, 0.0069828033447265625, 0.0140228271484375, 0.021062850952148438, 0.028102874755859375, 0.03514289855957031, 0.04218292236328125, 0.04922294616699219, 0.056262969970703125, 0.06330299377441406, 0.070343017578125, 0.07738304138183594, 0.08442306518554688, 0.09146308898925781, 0.09850311279296875, 0.10554313659667969, 0.11258316040039062, 0.11962318420410156, 0.1266632080078125, 0.13370323181152344, 0.14074325561523438, 0.1477832794189453, 0.15482330322265625, 0.1618633270263672, 0.16890335083007812, 0.17594337463378906, 0.1829833984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 3.0, 4.0, 8.0, 17.0, 18.0, 28.0, 42.0, 53.0, 79.0, 108.0, 114.0, 117.0, 103.0, 84.0, 82.0, 44.0, 43.0, 18.0, 18.0, 12.0, 6.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9285476207733154, -0.8938480615615845, -0.8591485023498535, -0.8244490027427673, -0.7897494435310364, -0.7550498843193054, -0.7203503847122192, -0.6856508255004883, -0.6509512662887573, -0.6162517070770264, -0.5815521478652954, -0.5468526482582092, -0.5121530890464783, -0.4774535298347473, -0.44275400042533875, -0.4080544710159302, -0.3733549118041992, -0.33865535259246826, -0.3039558231830597, -0.2692562937736511, -0.23455673456192017, -0.1998571902513504, -0.16515764594078064, -0.13045810163021088, -0.09575855731964111, -0.06105901300907135, -0.026359468698501587, 0.008340075612068176, 0.04303961992263794, 0.0777391642332077, 0.11243870854377747, 0.14713825285434723, 0.18183791637420654, 0.2165374606847763, 0.25123700499534607, 0.28593653440475464, 0.3206360936164856, 0.35533565282821655, 0.3900351822376251, 0.4247347116470337, 0.45943427085876465, 0.4941338300704956, 0.5288333892822266, 0.5635328888893127, 0.5982324481010437, 0.6329320073127747, 0.6676315069198608, 0.7023310661315918, 0.7370306253433228, 0.7717301845550537, 0.8064297437667847, 0.8411292433738708, 0.8758288025856018, 0.9105283617973328, 0.945227861404419, 0.9799274206161499, 1.0146269798278809, 1.0493265390396118, 1.0840260982513428, 1.1187256574630737, 1.1534252166748047, 1.188124656677246, 1.222824215888977, 1.257523775100708, 1.292223334312439]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 8.0, 6.0, 4.0, 4.0, 6.0, 8.0, 9.0, 13.0, 16.0, 15.0, 18.0, 22.0, 25.0, 24.0, 19.0, 26.0, 23.0, 30.0, 28.0, 19.0, 30.0, 31.0, 41.0, 34.0, 37.0, 35.0, 34.0, 41.0, 34.0, 36.0, 38.0, 31.0, 33.0, 29.0, 32.0, 20.0, 21.0, 19.0, 23.0, 9.0, 17.0, 14.0, 16.0, 6.0, 3.0, 2.0, 6.0, 4.0, 3.0, 2.0, 2.0], "bins": [-0.6949673891067505, -0.6762309074401855, -0.6574944257736206, -0.6387579441070557, -0.6200214624404907, -0.6012850403785706, -0.5825485587120056, -0.5638120770454407, -0.5450755953788757, -0.5263391137123108, -0.5076026320457458, -0.4888661801815033, -0.47012969851493835, -0.4513932168483734, -0.43265676498413086, -0.4139202833175659, -0.395183801651001, -0.37644731998443604, -0.3577108383178711, -0.33897438645362854, -0.3202379047870636, -0.30150142312049866, -0.2827649712562561, -0.26402848958969116, -0.24529200792312622, -0.22655552625656128, -0.20781905949115753, -0.18908259272575378, -0.17034611105918884, -0.1516096293926239, -0.13287316262722015, -0.1141366958618164, -0.09540015459060669, -0.07666368037462234, -0.057927206158638, -0.039190731942653656, -0.02045425772666931, -0.001717783510684967, 0.017018690705299377, 0.035755157470703125, 0.054491639137268066, 0.07322811335325241, 0.09196458756923676, 0.1107010617852211, 0.12943753600120544, 0.14817401766777039, 0.16691048443317413, 0.18564695119857788, 0.20438343286514282, 0.22311991453170776, 0.2418563812971115, 0.26059284806251526, 0.2793293297290802, 0.29806581139564514, 0.3168022632598877, 0.33553874492645264, 0.3542752265930176, 0.3730117082595825, 0.39174818992614746, 0.41048464179039, 0.42922112345695496, 0.4479576051235199, 0.46669405698776245, 0.4854305386543274, 0.5041670203208923]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 15.0, 13.0, 26.0, 34.0, 66.0, 70.0, 132.0, 174.0, 227.0, 382.0, 571.0, 807.0, 1275.0, 1987.0, 3058.0, 4745.0, 7685.0, 12541.0, 21632.0, 38093.0, 77072.0, 194566.0, 342767.0, 179445.0, 71698.0, 36470.0, 20421.0, 12099.0, 7304.0, 4586.0, 2938.0, 1906.0, 1270.0, 853.0, 521.0, 359.0, 233.0, 169.0, 121.0, 75.0, 53.0, 40.0, 14.0, 19.0, 10.0, 6.0, 4.0, 8.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11572265625, -0.11165618896484375, -0.1075897216796875, -0.10352325439453125, -0.099456787109375, -0.09539031982421875, -0.0913238525390625, -0.08725738525390625, -0.08319091796875, -0.07912445068359375, -0.0750579833984375, -0.07099151611328125, -0.066925048828125, -0.06285858154296875, -0.0587921142578125, -0.05472564697265625, -0.0506591796875, -0.04659271240234375, -0.0425262451171875, -0.03845977783203125, -0.034393310546875, -0.03032684326171875, -0.0262603759765625, -0.02219390869140625, -0.01812744140625, -0.01406097412109375, -0.0099945068359375, -0.00592803955078125, -0.001861572265625, 0.00220489501953125, 0.0062713623046875, 0.01033782958984375, 0.014404296875, 0.01847076416015625, 0.0225372314453125, 0.02660369873046875, 0.030670166015625, 0.03473663330078125, 0.0388031005859375, 0.04286956787109375, 0.04693603515625, 0.05100250244140625, 0.0550689697265625, 0.05913543701171875, 0.063201904296875, 0.06726837158203125, 0.0713348388671875, 0.07540130615234375, 0.0794677734375, 0.08353424072265625, 0.0876007080078125, 0.09166717529296875, 0.095733642578125, 0.09980010986328125, 0.1038665771484375, 0.10793304443359375, 0.11199951171875, 0.11606597900390625, 0.1201324462890625, 0.12419891357421875, 0.128265380859375, 0.13233184814453125, 0.1363983154296875, 0.14046478271484375, 0.14453125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 4.0, 8.0, 1.0, 16.0, 7.0, 12.0, 15.0, 16.0, 16.0, 11.0, 16.0, 30.0, 24.0, 26.0, 23.0, 30.0, 38.0, 39.0, 39.0, 51.0, 47.0, 37.0, 53.0, 28.0, 46.0, 30.0, 42.0, 27.0, 35.0, 25.0, 36.0, 29.0, 28.0, 20.0, 17.0, 11.0, 11.0, 11.0, 9.0, 10.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07098388671875, -0.06868553161621094, -0.06638717651367188, -0.06408882141113281, -0.06179046630859375, -0.05949211120605469, -0.057193756103515625, -0.05489540100097656, -0.0525970458984375, -0.05029869079589844, -0.048000335693359375, -0.04570198059082031, -0.04340362548828125, -0.04110527038574219, -0.038806915283203125, -0.03650856018066406, -0.034210205078125, -0.03191184997558594, -0.029613494873046875, -0.027315139770507812, -0.02501678466796875, -0.022718429565429688, -0.020420074462890625, -0.018121719360351562, -0.0158233642578125, -0.013525009155273438, -0.011226654052734375, -0.008928298950195312, -0.00662994384765625, -0.0043315887451171875, -0.002033233642578125, 0.0002651214599609375, 0.0025634765625, 0.0048618316650390625, 0.007160186767578125, 0.009458541870117188, 0.01175689697265625, 0.014055252075195312, 0.016353607177734375, 0.018651962280273438, 0.0209503173828125, 0.023248672485351562, 0.025547027587890625, 0.027845382690429688, 0.03014373779296875, 0.03244209289550781, 0.034740447998046875, 0.03703880310058594, 0.039337158203125, 0.04163551330566406, 0.043933868408203125, 0.04623222351074219, 0.04853057861328125, 0.05082893371582031, 0.053127288818359375, 0.05542564392089844, 0.0577239990234375, 0.06002235412597656, 0.062320709228515625, 0.06461906433105469, 0.06691741943359375, 0.06921577453613281, 0.07151412963867188, 0.07381248474121094, 0.07611083984375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 9.0, 11.0, 12.0, 14.0, 30.0, 65.0, 88.0, 167.0, 307.0, 552.0, 1136.0, 2219.0, 4283.0, 8563.0, 17766.0, 38619.0, 104569.0, 375274.0, 334876.0, 91926.0, 35683.0, 16210.0, 7889.0, 3969.0, 2034.0, 1017.0, 544.0, 299.0, 155.0, 87.0, 65.0, 31.0, 18.0, 8.0, 16.0, 6.0, 9.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.19287109375, -0.18718910217285156, -0.18150711059570312, -0.1758251190185547, -0.17014312744140625, -0.1644611358642578, -0.15877914428710938, -0.15309715270996094, -0.1474151611328125, -0.14173316955566406, -0.13605117797851562, -0.1303691864013672, -0.12468719482421875, -0.11900520324707031, -0.11332321166992188, -0.10764122009277344, -0.101959228515625, -0.09627723693847656, -0.09059524536132812, -0.08491325378417969, -0.07923126220703125, -0.07354927062988281, -0.06786727905273438, -0.06218528747558594, -0.0565032958984375, -0.05082130432128906, -0.045139312744140625, -0.03945732116699219, -0.03377532958984375, -0.028093338012695312, -0.022411346435546875, -0.016729354858398438, -0.01104736328125, -0.0053653717041015625, 0.000316619873046875, 0.0059986114501953125, 0.01168060302734375, 0.017362594604492188, 0.023044586181640625, 0.028726577758789062, 0.0344085693359375, 0.04009056091308594, 0.045772552490234375, 0.05145454406738281, 0.05713653564453125, 0.06281852722167969, 0.06850051879882812, 0.07418251037597656, 0.079864501953125, 0.08554649353027344, 0.09122848510742188, 0.09691047668457031, 0.10259246826171875, 0.10827445983886719, 0.11395645141601562, 0.11963844299316406, 0.1253204345703125, 0.13100242614746094, 0.13668441772460938, 0.1423664093017578, 0.14804840087890625, 0.1537303924560547, 0.15941238403320312, 0.16509437561035156, 0.1707763671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 5.0, 4.0, 9.0, 4.0, 9.0, 10.0, 17.0, 9.0, 21.0, 20.0, 20.0, 25.0, 24.0, 34.0, 35.0, 33.0, 37.0, 46.0, 30.0, 46.0, 38.0, 39.0, 55.0, 35.0, 49.0, 47.0, 24.0, 40.0, 30.0, 32.0, 34.0, 21.0, 20.0, 20.0, 19.0, 13.0, 6.0, 6.0, 8.0, 5.0, 4.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-0.255615234375, -0.2485504150390625, -0.241485595703125, -0.2344207763671875, -0.22735595703125, -0.2202911376953125, -0.213226318359375, -0.2061614990234375, -0.1990966796875, -0.1920318603515625, -0.184967041015625, -0.1779022216796875, -0.17083740234375, -0.1637725830078125, -0.156707763671875, -0.1496429443359375, -0.142578125, -0.1355133056640625, -0.128448486328125, -0.1213836669921875, -0.11431884765625, -0.1072540283203125, -0.100189208984375, -0.0931243896484375, -0.0860595703125, -0.0789947509765625, -0.071929931640625, -0.0648651123046875, -0.05780029296875, -0.0507354736328125, -0.043670654296875, -0.0366058349609375, -0.029541015625, -0.0224761962890625, -0.015411376953125, -0.0083465576171875, -0.00128173828125, 0.0057830810546875, 0.012847900390625, 0.0199127197265625, 0.0269775390625, 0.0340423583984375, 0.041107177734375, 0.0481719970703125, 0.05523681640625, 0.0623016357421875, 0.069366455078125, 0.0764312744140625, 0.08349609375, 0.0905609130859375, 0.097625732421875, 0.1046905517578125, 0.11175537109375, 0.1188201904296875, 0.125885009765625, 0.1329498291015625, 0.1400146484375, 0.1470794677734375, 0.154144287109375, 0.1612091064453125, 0.16827392578125, 0.1753387451171875, 0.182403564453125, 0.1894683837890625, 0.196533203125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 11.0, 21.0, 36.0, 54.0, 81.0, 134.0, 234.0, 359.0, 676.0, 1218.0, 2284.0, 4206.0, 7942.0, 14875.0, 28701.0, 55492.0, 111615.0, 289614.0, 297350.0, 114967.0, 56186.0, 29357.0, 15319.0, 8164.0, 4305.0, 2358.0, 1315.0, 696.0, 437.0, 214.0, 137.0, 75.0, 47.0, 26.0, 17.0, 10.0, 8.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06463623046875, -0.06255245208740234, -0.06046867370605469, -0.05838489532470703, -0.056301116943359375, -0.05421733856201172, -0.05213356018066406, -0.050049781799316406, -0.04796600341796875, -0.045882225036621094, -0.04379844665527344, -0.04171466827392578, -0.039630889892578125, -0.03754711151123047, -0.03546333312988281, -0.033379554748535156, -0.0312957763671875, -0.029211997985839844, -0.027128219604492188, -0.02504444122314453, -0.022960662841796875, -0.02087688446044922, -0.018793106079101562, -0.016709327697753906, -0.01462554931640625, -0.012541770935058594, -0.010457992553710938, -0.008374214172363281, -0.006290435791015625, -0.004206657409667969, -0.0021228790283203125, -3.910064697265625e-05, 0.002044677734375, 0.004128456115722656, 0.0062122344970703125, 0.008296012878417969, 0.010379791259765625, 0.012463569641113281, 0.014547348022460938, 0.016631126403808594, 0.01871490478515625, 0.020798683166503906, 0.022882461547851562, 0.02496623992919922, 0.027050018310546875, 0.02913379669189453, 0.031217575073242188, 0.033301353454589844, 0.0353851318359375, 0.037468910217285156, 0.03955268859863281, 0.04163646697998047, 0.043720245361328125, 0.04580402374267578, 0.04788780212402344, 0.049971580505371094, 0.05205535888671875, 0.054139137268066406, 0.05622291564941406, 0.05830669403076172, 0.060390472412109375, 0.06247425079345703, 0.06455802917480469, 0.06664180755615234, 0.0687255859375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 8.0, 3.0, 2.0, 9.0, 5.0, 12.0, 13.0, 14.0, 23.0, 25.0, 29.0, 45.0, 66.0, 78.0, 82.0, 104.0, 126.0, 73.0, 75.0, 49.0, 34.0, 27.0, 19.0, 12.0, 14.0, 12.0, 8.0, 6.0, 3.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4437904357910156e-05, -2.369564026594162e-05, -2.2953376173973083e-05, -2.2211112082004547e-05, -2.146884799003601e-05, -2.0726583898067474e-05, -1.9984319806098938e-05, -1.92420557141304e-05, -1.8499791622161865e-05, -1.775752753019333e-05, -1.7015263438224792e-05, -1.6272999346256256e-05, -1.553073525428772e-05, -1.4788471162319183e-05, -1.4046207070350647e-05, -1.330394297838211e-05, -1.2561678886413574e-05, -1.1819414794445038e-05, -1.1077150702476501e-05, -1.0334886610507965e-05, -9.592622518539429e-06, -8.850358426570892e-06, -8.108094334602356e-06, -7.36583024263382e-06, -6.623566150665283e-06, -5.881302058696747e-06, -5.1390379667282104e-06, -4.396773874759674e-06, -3.6545097827911377e-06, -2.9122456908226013e-06, -2.169981598854065e-06, -1.4277175068855286e-06, -6.854534149169922e-07, 5.681067705154419e-08, 7.990747690200806e-07, 1.541338860988617e-06, 2.2836029529571533e-06, 3.0258670449256897e-06, 3.768131136894226e-06, 4.5103952288627625e-06, 5.252659320831299e-06, 5.994923412799835e-06, 6.737187504768372e-06, 7.479451596736908e-06, 8.221715688705444e-06, 8.96397978067398e-06, 9.706243872642517e-06, 1.0448507964611053e-05, 1.119077205657959e-05, 1.1933036148548126e-05, 1.2675300240516663e-05, 1.3417564332485199e-05, 1.4159828424453735e-05, 1.4902092516422272e-05, 1.5644356608390808e-05, 1.6386620700359344e-05, 1.712888479232788e-05, 1.7871148884296417e-05, 1.8613412976264954e-05, 1.935567706823349e-05, 2.0097941160202026e-05, 2.0840205252170563e-05, 2.15824693441391e-05, 2.2324733436107635e-05, 2.3066997528076172e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 5.0, 15.0, 6.0, 16.0, 23.0, 25.0, 47.0, 71.0, 87.0, 145.0, 219.0, 356.0, 613.0, 979.0, 1840.0, 3408.0, 6564.0, 12933.0, 26031.0, 52206.0, 112478.0, 280208.0, 308706.0, 125552.0, 57687.0, 28457.0, 14212.0, 7166.0, 3699.0, 1944.0, 1115.0, 609.0, 394.0, 250.0, 147.0, 106.0, 77.0, 47.0, 31.0, 30.0, 10.0, 11.0, 12.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0650634765625, -0.06289958953857422, -0.06073570251464844, -0.058571815490722656, -0.056407928466796875, -0.054244041442871094, -0.05208015441894531, -0.04991626739501953, -0.04775238037109375, -0.04558849334716797, -0.04342460632324219, -0.041260719299316406, -0.039096832275390625, -0.036932945251464844, -0.03476905822753906, -0.03260517120361328, -0.0304412841796875, -0.02827739715576172, -0.026113510131835938, -0.023949623107910156, -0.021785736083984375, -0.019621849060058594, -0.017457962036132812, -0.015294075012207031, -0.01313018798828125, -0.010966300964355469, -0.008802413940429688, -0.006638526916503906, -0.004474639892578125, -0.0023107528686523438, -0.0001468658447265625, 0.0020170211791992188, 0.004180908203125, 0.006344795227050781, 0.008508682250976562, 0.010672569274902344, 0.012836456298828125, 0.015000343322753906, 0.017164230346679688, 0.01932811737060547, 0.02149200439453125, 0.02365589141845703, 0.025819778442382812, 0.027983665466308594, 0.030147552490234375, 0.032311439514160156, 0.03447532653808594, 0.03663921356201172, 0.0388031005859375, 0.04096698760986328, 0.04313087463378906, 0.045294761657714844, 0.047458648681640625, 0.049622535705566406, 0.05178642272949219, 0.05395030975341797, 0.05611419677734375, 0.05827808380126953, 0.06044197082519531, 0.0626058578491211, 0.06476974487304688, 0.06693363189697266, 0.06909751892089844, 0.07126140594482422, 0.07342529296875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 8.0, 4.0, 7.0, 6.0, 8.0, 20.0, 20.0, 29.0, 23.0, 37.0, 59.0, 87.0, 92.0, 122.0, 113.0, 82.0, 69.0, 55.0, 34.0, 28.0, 22.0, 19.0, 11.0, 11.0, 9.0, 5.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.098876953125, -0.09610366821289062, -0.09333038330078125, -0.09055709838867188, -0.0877838134765625, -0.08501052856445312, -0.08223724365234375, -0.07946395874023438, -0.076690673828125, -0.07391738891601562, -0.07114410400390625, -0.06837081909179688, -0.0655975341796875, -0.06282424926757812, -0.06005096435546875, -0.057277679443359375, -0.05450439453125, -0.051731109619140625, -0.04895782470703125, -0.046184539794921875, -0.0434112548828125, -0.040637969970703125, -0.03786468505859375, -0.035091400146484375, -0.032318115234375, -0.029544830322265625, -0.02677154541015625, -0.023998260498046875, -0.0212249755859375, -0.018451690673828125, -0.01567840576171875, -0.012905120849609375, -0.0101318359375, -0.007358551025390625, -0.00458526611328125, -0.001811981201171875, 0.0009613037109375, 0.003734588623046875, 0.00650787353515625, 0.009281158447265625, 0.012054443359375, 0.014827728271484375, 0.01760101318359375, 0.020374298095703125, 0.0231475830078125, 0.025920867919921875, 0.02869415283203125, 0.031467437744140625, 0.03424072265625, 0.037014007568359375, 0.03978729248046875, 0.042560577392578125, 0.0453338623046875, 0.048107147216796875, 0.05088043212890625, 0.053653717041015625, 0.056427001953125, 0.059200286865234375, 0.06197357177734375, 0.06474685668945312, 0.0675201416015625, 0.07029342651367188, 0.07306671142578125, 0.07583999633789062, 0.07861328125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 32.0, 214.0, 448.0, 273.0, 35.0, 6.0, 4.0, 2.0], "bins": [-7.9451093673706055, -7.8094916343688965, -7.6738739013671875, -7.5382561683654785, -7.4026384353637695, -7.2670207023620605, -7.131402969360352, -6.995784759521484, -6.860167503356934, -6.724549770355225, -6.588932037353516, -6.453314304351807, -6.317696571350098, -6.182078838348389, -6.04646110534668, -5.9108428955078125, -5.7752251625061035, -5.6396074295043945, -5.5039896965026855, -5.368371963500977, -5.232754230499268, -5.097136497497559, -4.96151876449585, -4.825901031494141, -4.690282821655273, -4.5546650886535645, -4.4190473556518555, -4.2834296226501465, -4.1478118896484375, -4.0121941566467285, -3.8765761852264404, -3.7409584522247314, -3.6053409576416016, -3.4697232246398926, -3.3341054916381836, -3.1984877586364746, -3.0628700256347656, -2.9272522926330566, -2.7916343212127686, -2.6560165882110596, -2.5203988552093506, -2.3847811222076416, -2.2491633892059326, -2.1135456562042236, -1.977927803993225, -1.8423100709915161, -1.7066922187805176, -1.5710744857788086, -1.4354567527770996, -1.2998390197753906, -1.1642212867736816, -1.028603434562683, -0.8929857015609741, -0.7573679685592651, -0.6217501759529114, -0.4861323833465576, -0.35051459074020386, -0.21489682793617249, -0.07927906513214111, 0.05633869767189026, 0.19195646047592163, 0.3275741934776306, 0.4631919860839844, 0.5988097786903381, 0.7344275116920471]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 3.0, 5.0, 8.0, 10.0, 10.0, 16.0, 9.0, 17.0, 18.0, 24.0, 29.0, 29.0, 37.0, 37.0, 38.0, 37.0, 48.0, 47.0, 45.0, 50.0, 54.0, 48.0, 43.0, 43.0, 45.0, 36.0, 33.0, 23.0, 30.0, 25.0, 29.0, 15.0, 14.0, 6.0, 8.0, 9.0, 7.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5556581020355225, -0.5344499349594116, -0.513241708278656, -0.49203354120254517, -0.47082534432411194, -0.4496171474456787, -0.42840898036956787, -0.40720078349113464, -0.3859925866127014, -0.3647843897342682, -0.34357619285583496, -0.3223680257797241, -0.3011598289012909, -0.27995163202285767, -0.2587434649467468, -0.2375352680683136, -0.21632707118988037, -0.19511887431144714, -0.1739106923341751, -0.15270251035690308, -0.13149431347846985, -0.11028612405061722, -0.08907793462276459, -0.06786975264549255, -0.046661555767059326, -0.025453366339206696, -0.004245176911354065, 0.016963012516498566, 0.038171201944351196, 0.05937939137220383, 0.08058758080005646, 0.10179576277732849, 0.12300390005111694, 0.14421209692955017, 0.1654202789068222, 0.18662846088409424, 0.20783665776252747, 0.2290448546409607, 0.25025302171707153, 0.27146121859550476, 0.292669415473938, 0.3138776123523712, 0.33508580923080444, 0.3562939763069153, 0.3775021731853485, 0.39871037006378174, 0.4199185371398926, 0.4411267340183258, 0.46233493089675903, 0.48354312777519226, 0.5047513246536255, 0.5259594917297363, 0.5471676588058472, 0.5683758854866028, 0.5895840525627136, 0.6107922792434692, 0.6320004463195801, 0.6532086133956909, 0.6744168400764465, 0.6956250071525574, 0.716833233833313, 0.7380414009094238, 0.7592495679855347, 0.7804577350616455, 0.8016659617424011]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 2.0, 7.0, 9.0, 10.0, 8.0, 21.0, 33.0, 40.0, 86.0, 112.0, 184.0, 287.0, 494.0, 824.0, 1366.0, 2314.0, 4212.0, 7839.0, 14755.0, 29685.0, 62033.0, 136921.0, 340805.0, 1237631.0, 1630771.0, 418792.0, 161347.0, 72196.0, 34341.0, 17116.0, 8870.0, 4681.0, 2663.0, 1551.0, 872.0, 506.0, 355.0, 204.0, 115.0, 79.0, 53.0, 39.0, 20.0, 11.0, 7.0, 6.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.114990234375, -0.11151599884033203, -0.10804176330566406, -0.1045675277709961, -0.10109329223632812, -0.09761905670166016, -0.09414482116699219, -0.09067058563232422, -0.08719635009765625, -0.08372211456298828, -0.08024787902832031, -0.07677364349365234, -0.07329940795898438, -0.0698251724243164, -0.06635093688964844, -0.06287670135498047, -0.0594024658203125, -0.05592823028564453, -0.05245399475097656, -0.048979759216308594, -0.045505523681640625, -0.042031288146972656, -0.03855705261230469, -0.03508281707763672, -0.03160858154296875, -0.02813434600830078, -0.024660110473632812, -0.021185874938964844, -0.017711639404296875, -0.014237403869628906, -0.010763168334960938, -0.007288932800292969, -0.003814697265625, -0.00034046173095703125, 0.0031337738037109375, 0.006608009338378906, 0.010082244873046875, 0.013556480407714844, 0.017030715942382812, 0.02050495147705078, 0.02397918701171875, 0.02745342254638672, 0.030927658081054688, 0.034401893615722656, 0.037876129150390625, 0.041350364685058594, 0.04482460021972656, 0.04829883575439453, 0.0517730712890625, 0.05524730682373047, 0.05872154235839844, 0.062195777893066406, 0.06567001342773438, 0.06914424896240234, 0.07261848449707031, 0.07609272003173828, 0.07956695556640625, 0.08304119110107422, 0.08651542663574219, 0.08998966217041016, 0.09346389770507812, 0.0969381332397461, 0.10041236877441406, 0.10388660430908203, 0.10736083984375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 6.0, 7.0, 7.0, 3.0, 16.0, 16.0, 13.0, 16.0, 16.0, 20.0, 21.0, 19.0, 35.0, 22.0, 29.0, 36.0, 36.0, 45.0, 37.0, 54.0, 51.0, 35.0, 24.0, 49.0, 48.0, 35.0, 42.0, 39.0, 22.0, 29.0, 25.0, 16.0, 27.0, 25.0, 14.0, 5.0, 19.0, 9.0, 11.0, 6.0, 5.0, 6.0, 1.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0689697265625, -0.0666799545288086, -0.06439018249511719, -0.06210041046142578, -0.059810638427734375, -0.05752086639404297, -0.05523109436035156, -0.052941322326660156, -0.05065155029296875, -0.048361778259277344, -0.04607200622558594, -0.04378223419189453, -0.041492462158203125, -0.03920269012451172, -0.03691291809082031, -0.034623146057128906, -0.0323333740234375, -0.030043601989746094, -0.027753829956054688, -0.02546405792236328, -0.023174285888671875, -0.02088451385498047, -0.018594741821289062, -0.016304969787597656, -0.01401519775390625, -0.011725425720214844, -0.009435653686523438, -0.007145881652832031, -0.004856109619140625, -0.0025663375854492188, -0.0002765655517578125, 0.0020132064819335938, 0.004302978515625, 0.006592750549316406, 0.008882522583007812, 0.011172294616699219, 0.013462066650390625, 0.01575183868408203, 0.018041610717773438, 0.020331382751464844, 0.02262115478515625, 0.024910926818847656, 0.027200698852539062, 0.02949047088623047, 0.031780242919921875, 0.03407001495361328, 0.03635978698730469, 0.038649559020996094, 0.0409393310546875, 0.043229103088378906, 0.04551887512207031, 0.04780864715576172, 0.050098419189453125, 0.05238819122314453, 0.05467796325683594, 0.056967735290527344, 0.05925750732421875, 0.061547279357910156, 0.06383705139160156, 0.06612682342529297, 0.06841659545898438, 0.07070636749267578, 0.07299613952636719, 0.0752859115600586, 0.07757568359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 8.0, 13.0, 10.0, 30.0, 46.0, 80.0, 95.0, 160.0, 236.0, 385.0, 706.0, 1282.0, 2108.0, 3999.0, 7438.0, 14989.0, 31476.0, 69631.0, 161087.0, 410385.0, 1395952.0, 1392074.0, 407876.0, 160857.0, 69958.0, 31564.0, 15409.0, 7509.0, 3914.0, 2125.0, 1124.0, 664.0, 424.0, 250.0, 150.0, 75.0, 58.0, 47.0, 27.0, 14.0, 12.0, 9.0, 8.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.152587890625, -0.1480998992919922, -0.14361190795898438, -0.13912391662597656, -0.13463592529296875, -0.13014793395996094, -0.12565994262695312, -0.12117195129394531, -0.1166839599609375, -0.11219596862792969, -0.10770797729492188, -0.10321998596191406, -0.09873199462890625, -0.09424400329589844, -0.08975601196289062, -0.08526802062988281, -0.080780029296875, -0.07629203796386719, -0.07180404663085938, -0.06731605529785156, -0.06282806396484375, -0.05834007263183594, -0.053852081298828125, -0.04936408996582031, -0.0448760986328125, -0.04038810729980469, -0.035900115966796875, -0.03141212463378906, -0.02692413330078125, -0.022436141967773438, -0.017948150634765625, -0.013460159301757812, -0.00897216796875, -0.0044841766357421875, 3.814697265625e-06, 0.0044918060302734375, 0.00897979736328125, 0.013467788696289062, 0.017955780029296875, 0.022443771362304688, 0.0269317626953125, 0.03141975402832031, 0.035907745361328125, 0.04039573669433594, 0.04488372802734375, 0.04937171936035156, 0.053859710693359375, 0.05834770202636719, 0.062835693359375, 0.06732368469238281, 0.07181167602539062, 0.07629966735839844, 0.08078765869140625, 0.08527565002441406, 0.08976364135742188, 0.09425163269042969, 0.0987396240234375, 0.10322761535644531, 0.10771560668945312, 0.11220359802246094, 0.11669158935546875, 0.12117958068847656, 0.12566757202148438, 0.1301555633544922, 0.1346435546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 10.0, 6.0, 15.0, 13.0, 25.0, 37.0, 40.0, 47.0, 72.0, 86.0, 135.0, 156.0, 231.0, 300.0, 468.0, 635.0, 467.0, 376.0, 225.0, 174.0, 118.0, 100.0, 78.0, 57.0, 33.0, 34.0, 33.0, 24.0, 12.0, 18.0, 11.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17333984375, -0.16848182678222656, -0.16362380981445312, -0.1587657928466797, -0.15390777587890625, -0.1490497589111328, -0.14419174194335938, -0.13933372497558594, -0.1344757080078125, -0.12961769104003906, -0.12475967407226562, -0.11990165710449219, -0.11504364013671875, -0.11018562316894531, -0.10532760620117188, -0.10046958923339844, -0.095611572265625, -0.09075355529785156, -0.08589553833007812, -0.08103752136230469, -0.07617950439453125, -0.07132148742675781, -0.06646347045898438, -0.06160545349121094, -0.0567474365234375, -0.05188941955566406, -0.047031402587890625, -0.04217338562011719, -0.03731536865234375, -0.03245735168457031, -0.027599334716796875, -0.022741317749023438, -0.01788330078125, -0.013025283813476562, -0.008167266845703125, -0.0033092498779296875, 0.00154876708984375, 0.0064067840576171875, 0.011264801025390625, 0.016122817993164062, 0.0209808349609375, 0.025838851928710938, 0.030696868896484375, 0.03555488586425781, 0.04041290283203125, 0.04527091979980469, 0.050128936767578125, 0.05498695373535156, 0.059844970703125, 0.06470298767089844, 0.06956100463867188, 0.07441902160644531, 0.07927703857421875, 0.08413505554199219, 0.08899307250976562, 0.09385108947753906, 0.0987091064453125, 0.10356712341308594, 0.10842514038085938, 0.11328315734863281, 0.11814117431640625, 0.12299919128417969, 0.12785720825195312, 0.13271522521972656, 0.1375732421875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 16.0, 41.0, 53.0, 81.0, 92.0, 134.0, 141.0, 120.0, 102.0, 80.0, 54.0, 32.0, 22.0, 13.0, 7.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6839830875396729, -1.6435309648513794, -1.603078842163086, -1.5626267194747925, -1.522174596786499, -1.4817224740982056, -1.441270351409912, -1.4008182287216187, -1.3603661060333252, -1.3199139833450317, -1.2794618606567383, -1.2390097379684448, -1.1985576152801514, -1.158105492591858, -1.1176533699035645, -1.077201247215271, -1.0367491245269775, -0.9962970018386841, -0.9558448791503906, -0.9153927564620972, -0.8749406337738037, -0.8344885110855103, -0.7940363883972168, -0.7535842657089233, -0.7131321430206299, -0.6726800203323364, -0.632227897644043, -0.5917757749557495, -0.551323652267456, -0.5108715295791626, -0.47041940689086914, -0.4299672842025757, -0.3895151615142822, -0.34906303882598877, -0.3086109161376953, -0.26815879344940186, -0.2277066707611084, -0.18725454807281494, -0.14680242538452148, -0.10635030269622803, -0.06589818000793457, -0.025446057319641113, 0.015006065368652344, 0.0554581880569458, 0.09591031074523926, 0.13636243343353271, 0.17681455612182617, 0.21726667881011963, 0.2577188014984131, 0.29817092418670654, 0.338623046875, 0.37907516956329346, 0.4195272922515869, 0.45997941493988037, 0.5004315376281738, 0.5408836603164673, 0.5813357830047607, 0.6217879056930542, 0.6622400283813477, 0.7026921510696411, 0.7431442737579346, 0.783596396446228, 0.8240485191345215, 0.8645006418228149, 0.9049527645111084]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 12.0, 4.0, 9.0, 10.0, 9.0, 14.0, 13.0, 18.0, 18.0, 26.0, 25.0, 25.0, 38.0, 35.0, 40.0, 38.0, 39.0, 43.0, 40.0, 38.0, 43.0, 42.0, 32.0, 35.0, 41.0, 44.0, 44.0, 37.0, 28.0, 27.0, 24.0, 16.0, 17.0, 9.0, 13.0, 9.0, 10.0, 7.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4693639278411865, -0.45307642221450806, -0.4367889165878296, -0.42050138115882874, -0.40421387553215027, -0.3879263699054718, -0.37163883447647095, -0.3553513288497925, -0.339063823223114, -0.32277631759643555, -0.3064888119697571, -0.2902012765407562, -0.27391377091407776, -0.2576262652873993, -0.24133874475955963, -0.22505122423171997, -0.2087637186050415, -0.19247621297836304, -0.17618869245052338, -0.15990117192268372, -0.14361366629600525, -0.12732616066932678, -0.11103864014148712, -0.09475112706422806, -0.078463613986969, -0.06217610090970993, -0.04588858783245087, -0.029601074755191803, -0.01331356167793274, 0.0029739513993263245, 0.019261464476585388, 0.03554897755384445, 0.051836490631103516, 0.06812400370836258, 0.08441151678562164, 0.1006990298628807, 0.11698654294013977, 0.13327404856681824, 0.1495615690946579, 0.16584908962249756, 0.18213659524917603, 0.1984241008758545, 0.21471162140369415, 0.2309991419315338, 0.24728664755821228, 0.26357415318489075, 0.2798616886138916, 0.29614919424057007, 0.31243669986724854, 0.328724205493927, 0.34501171112060547, 0.3612992465496063, 0.3775867521762848, 0.39387425780296326, 0.4101617932319641, 0.4264492988586426, 0.44273680448532104, 0.4590243101119995, 0.475311815738678, 0.49159935116767883, 0.5078868865966797, 0.5241743922233582, 0.5404618978500366, 0.5567494034767151, 0.5730369091033936]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 8.0, 1.0, 9.0, 10.0, 19.0, 27.0, 32.0, 40.0, 86.0, 98.0, 157.0, 230.0, 332.0, 421.0, 693.0, 897.0, 1385.0, 1989.0, 2910.0, 4141.0, 6362.0, 9706.0, 15891.0, 28139.0, 58152.0, 133720.0, 267120.0, 260995.0, 127514.0, 55674.0, 27300.0, 15558.0, 9370.0, 6243.0, 4206.0, 2813.0, 1949.0, 1372.0, 938.0, 648.0, 436.0, 316.0, 208.0, 137.0, 96.0, 64.0, 58.0, 31.0, 22.0, 16.0, 7.0, 2.0, 4.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.109619140625, -0.10619068145751953, -0.10276222229003906, -0.0993337631225586, -0.09590530395507812, -0.09247684478759766, -0.08904838562011719, -0.08561992645263672, -0.08219146728515625, -0.07876300811767578, -0.07533454895019531, -0.07190608978271484, -0.06847763061523438, -0.0650491714477539, -0.06162071228027344, -0.05819225311279297, -0.0547637939453125, -0.05133533477783203, -0.04790687561035156, -0.044478416442871094, -0.041049957275390625, -0.037621498107910156, -0.03419303894042969, -0.03076457977294922, -0.02733612060546875, -0.02390766143798828, -0.020479202270507812, -0.017050743103027344, -0.013622283935546875, -0.010193824768066406, -0.0067653656005859375, -0.0033369064331054688, 9.1552734375e-05, 0.0035200119018554688, 0.0069484710693359375, 0.010376930236816406, 0.013805389404296875, 0.017233848571777344, 0.020662307739257812, 0.02409076690673828, 0.02751922607421875, 0.03094768524169922, 0.03437614440917969, 0.037804603576660156, 0.041233062744140625, 0.044661521911621094, 0.04808998107910156, 0.05151844024658203, 0.0549468994140625, 0.05837535858154297, 0.06180381774902344, 0.0652322769165039, 0.06866073608398438, 0.07208919525146484, 0.07551765441894531, 0.07894611358642578, 0.08237457275390625, 0.08580303192138672, 0.08923149108886719, 0.09265995025634766, 0.09608840942382812, 0.0995168685913086, 0.10294532775878906, 0.10637378692626953, 0.10980224609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 8.0, 9.0, 11.0, 11.0, 11.0, 11.0, 22.0, 23.0, 19.0, 26.0, 21.0, 22.0, 33.0, 45.0, 37.0, 35.0, 51.0, 44.0, 49.0, 47.0, 48.0, 42.0, 40.0, 31.0, 39.0, 28.0, 34.0, 24.0, 26.0, 27.0, 22.0, 15.0, 15.0, 14.0, 13.0, 14.0, 6.0, 8.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.073486328125, -0.07098865509033203, -0.06849098205566406, -0.0659933090209961, -0.06349563598632812, -0.060997962951660156, -0.05850028991699219, -0.05600261688232422, -0.05350494384765625, -0.05100727081298828, -0.04850959777832031, -0.046011924743652344, -0.043514251708984375, -0.041016578674316406, -0.03851890563964844, -0.03602123260498047, -0.0335235595703125, -0.03102588653564453, -0.028528213500976562, -0.026030540466308594, -0.023532867431640625, -0.021035194396972656, -0.018537521362304688, -0.01603984832763672, -0.01354217529296875, -0.011044502258300781, -0.008546829223632812, -0.006049156188964844, -0.003551483154296875, -0.0010538101196289062, 0.0014438629150390625, 0.003941535949707031, 0.006439208984375, 0.008936882019042969, 0.011434555053710938, 0.013932228088378906, 0.016429901123046875, 0.018927574157714844, 0.021425247192382812, 0.02392292022705078, 0.02642059326171875, 0.02891826629638672, 0.03141593933105469, 0.033913612365722656, 0.036411285400390625, 0.038908958435058594, 0.04140663146972656, 0.04390430450439453, 0.0464019775390625, 0.04889965057373047, 0.05139732360839844, 0.053894996643066406, 0.056392669677734375, 0.058890342712402344, 0.06138801574707031, 0.06388568878173828, 0.06638336181640625, 0.06888103485107422, 0.07137870788574219, 0.07387638092041016, 0.07637405395507812, 0.0788717269897461, 0.08136940002441406, 0.08386707305908203, 0.08636474609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 0.0, 5.0, 16.0, 14.0, 18.0, 29.0, 43.0, 73.0, 131.0, 257.0, 527.0, 1149.0, 2686.0, 5742.0, 13491.0, 38055.0, 164948.0, 540804.0, 208259.0, 45229.0, 15172.0, 6427.0, 2864.0, 1360.0, 581.0, 317.0, 152.0, 91.0, 35.0, 35.0, 11.0, 10.0, 5.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.229248046875, -0.22261619567871094, -0.21598434448242188, -0.2093524932861328, -0.20272064208984375, -0.1960887908935547, -0.18945693969726562, -0.18282508850097656, -0.1761932373046875, -0.16956138610839844, -0.16292953491210938, -0.1562976837158203, -0.14966583251953125, -0.1430339813232422, -0.13640213012695312, -0.12977027893066406, -0.123138427734375, -0.11650657653808594, -0.10987472534179688, -0.10324287414550781, -0.09661102294921875, -0.08997917175292969, -0.08334732055664062, -0.07671546936035156, -0.0700836181640625, -0.06345176696777344, -0.056819915771484375, -0.05018806457519531, -0.04355621337890625, -0.03692436218261719, -0.030292510986328125, -0.023660659790039062, -0.01702880859375, -0.010396957397460938, -0.003765106201171875, 0.0028667449951171875, 0.00949859619140625, 0.016130447387695312, 0.022762298583984375, 0.029394149780273438, 0.0360260009765625, 0.04265785217285156, 0.049289703369140625, 0.05592155456542969, 0.06255340576171875, 0.06918525695800781, 0.07581710815429688, 0.08244895935058594, 0.089080810546875, 0.09571266174316406, 0.10234451293945312, 0.10897636413574219, 0.11560821533203125, 0.12224006652832031, 0.12887191772460938, 0.13550376892089844, 0.1421356201171875, 0.14876747131347656, 0.15539932250976562, 0.1620311737060547, 0.16866302490234375, 0.1752948760986328, 0.18192672729492188, 0.18855857849121094, 0.1951904296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 5.0, 4.0, 11.0, 16.0, 11.0, 23.0, 9.0, 23.0, 17.0, 22.0, 20.0, 29.0, 42.0, 41.0, 33.0, 34.0, 41.0, 39.0, 33.0, 37.0, 45.0, 36.0, 41.0, 40.0, 38.0, 29.0, 28.0, 35.0, 33.0, 26.0, 23.0, 23.0, 17.0, 10.0, 20.0, 11.0, 17.0, 7.0, 6.0, 5.0, 3.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.225830078125, -0.2192535400390625, -0.212677001953125, -0.2061004638671875, -0.19952392578125, -0.1929473876953125, -0.186370849609375, -0.1797943115234375, -0.1732177734375, -0.1666412353515625, -0.160064697265625, -0.1534881591796875, -0.14691162109375, -0.1403350830078125, -0.133758544921875, -0.1271820068359375, -0.12060546875, -0.1140289306640625, -0.107452392578125, -0.1008758544921875, -0.09429931640625, -0.0877227783203125, -0.081146240234375, -0.0745697021484375, -0.0679931640625, -0.0614166259765625, -0.054840087890625, -0.0482635498046875, -0.04168701171875, -0.0351104736328125, -0.028533935546875, -0.0219573974609375, -0.015380859375, -0.0088043212890625, -0.002227783203125, 0.0043487548828125, 0.01092529296875, 0.0175018310546875, 0.024078369140625, 0.0306549072265625, 0.0372314453125, 0.0438079833984375, 0.050384521484375, 0.0569610595703125, 0.06353759765625, 0.0701141357421875, 0.076690673828125, 0.0832672119140625, 0.08984375, 0.0964202880859375, 0.102996826171875, 0.1095733642578125, 0.11614990234375, 0.1227264404296875, 0.129302978515625, 0.1358795166015625, 0.1424560546875, 0.1490325927734375, 0.155609130859375, 0.1621856689453125, 0.16876220703125, 0.1753387451171875, 0.181915283203125, 0.1884918212890625, 0.195068359375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 8.0, 13.0, 17.0, 25.0, 29.0, 49.0, 74.0, 109.0, 175.0, 267.0, 433.0, 675.0, 1164.0, 1906.0, 3303.0, 5698.0, 9802.0, 17369.0, 33135.0, 68768.0, 170764.0, 335505.0, 222910.0, 87313.0, 40649.0, 20879.0, 11615.0, 6392.0, 3852.0, 2221.0, 1302.0, 765.0, 486.0, 291.0, 177.0, 135.0, 89.0, 49.0, 40.0, 29.0, 17.0, 17.0, 16.0, 7.0, 5.0, 5.0, 1.0, 6.0, 0.0, 1.0], "bins": [-0.07135009765625, -0.06934833526611328, -0.06734657287597656, -0.06534481048583984, -0.06334304809570312, -0.061341285705566406, -0.05933952331542969, -0.05733776092529297, -0.05533599853515625, -0.05333423614501953, -0.05133247375488281, -0.049330711364746094, -0.047328948974609375, -0.045327186584472656, -0.04332542419433594, -0.04132366180419922, -0.0393218994140625, -0.03732013702392578, -0.03531837463378906, -0.033316612243652344, -0.031314849853515625, -0.029313087463378906, -0.027311325073242188, -0.02530956268310547, -0.02330780029296875, -0.02130603790283203, -0.019304275512695312, -0.017302513122558594, -0.015300750732421875, -0.013298988342285156, -0.011297225952148438, -0.009295463562011719, -0.007293701171875, -0.005291938781738281, -0.0032901763916015625, -0.0012884140014648438, 0.000713348388671875, 0.0027151107788085938, 0.0047168731689453125, 0.006718635559082031, 0.00872039794921875, 0.010722160339355469, 0.012723922729492188, 0.014725685119628906, 0.016727447509765625, 0.018729209899902344, 0.020730972290039062, 0.02273273468017578, 0.0247344970703125, 0.02673625946044922, 0.028738021850585938, 0.030739784240722656, 0.032741546630859375, 0.034743309020996094, 0.03674507141113281, 0.03874683380126953, 0.04074859619140625, 0.04275035858154297, 0.04475212097167969, 0.046753883361816406, 0.048755645751953125, 0.050757408142089844, 0.05275917053222656, 0.05476093292236328, 0.0567626953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 5.0, 4.0, 11.0, 12.0, 10.0, 18.0, 32.0, 46.0, 72.0, 96.0, 134.0, 127.0, 133.0, 96.0, 55.0, 42.0, 28.0, 21.0, 11.0, 12.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.3736228942871094e-05, -3.292318433523178e-05, -3.211013972759247e-05, -3.1297095119953156e-05, -3.0484050512313843e-05, -2.967100590467453e-05, -2.8857961297035217e-05, -2.8044916689395905e-05, -2.7231872081756592e-05, -2.641882747411728e-05, -2.5605782866477966e-05, -2.4792738258838654e-05, -2.397969365119934e-05, -2.3166649043560028e-05, -2.2353604435920715e-05, -2.1540559828281403e-05, -2.072751522064209e-05, -1.9914470613002777e-05, -1.9101426005363464e-05, -1.828838139772415e-05, -1.747533679008484e-05, -1.6662292182445526e-05, -1.5849247574806213e-05, -1.50362029671669e-05, -1.4223158359527588e-05, -1.3410113751888275e-05, -1.2597069144248962e-05, -1.178402453660965e-05, -1.0970979928970337e-05, -1.0157935321331024e-05, -9.344890713691711e-06, -8.531846106052399e-06, -7.718801498413086e-06, -6.905756890773773e-06, -6.0927122831344604e-06, -5.279667675495148e-06, -4.466623067855835e-06, -3.6535784602165222e-06, -2.8405338525772095e-06, -2.0274892449378967e-06, -1.214444637298584e-06, -4.0140002965927124e-07, 4.116445779800415e-07, 1.2246891856193542e-06, 2.037733793258667e-06, 2.8507784008979797e-06, 3.6638230085372925e-06, 4.476867616176605e-06, 5.289912223815918e-06, 6.102956831455231e-06, 6.9160014390945435e-06, 7.729046046733856e-06, 8.542090654373169e-06, 9.355135262012482e-06, 1.0168179869651794e-05, 1.0981224477291107e-05, 1.179426908493042e-05, 1.2607313692569733e-05, 1.3420358300209045e-05, 1.4233402907848358e-05, 1.5046447515487671e-05, 1.5859492123126984e-05, 1.6672536730766296e-05, 1.748558133840561e-05, 1.8298625946044922e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 0.0, 0.0, 4.0, 2.0, 5.0, 7.0, 14.0, 36.0, 27.0, 45.0, 72.0, 117.0, 156.0, 290.0, 503.0, 989.0, 1780.0, 3752.0, 7980.0, 17303.0, 40231.0, 104049.0, 279107.0, 346631.0, 147725.0, 54380.0, 22982.0, 10481.0, 4809.0, 2294.0, 1236.0, 648.0, 357.0, 193.0, 123.0, 77.0, 54.0, 32.0, 23.0, 12.0, 12.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08050537109375, -0.0780782699584961, -0.07565116882324219, -0.07322406768798828, -0.07079696655273438, -0.06836986541748047, -0.06594276428222656, -0.06351566314697266, -0.06108856201171875, -0.058661460876464844, -0.05623435974121094, -0.05380725860595703, -0.051380157470703125, -0.04895305633544922, -0.04652595520019531, -0.044098854064941406, -0.0416717529296875, -0.039244651794433594, -0.03681755065917969, -0.03439044952392578, -0.031963348388671875, -0.02953624725341797, -0.027109146118164062, -0.024682044982910156, -0.02225494384765625, -0.019827842712402344, -0.017400741577148438, -0.014973640441894531, -0.012546539306640625, -0.010119438171386719, -0.0076923370361328125, -0.005265235900878906, -0.002838134765625, -0.00041103363037109375, 0.0020160675048828125, 0.004443168640136719, 0.006870269775390625, 0.009297370910644531, 0.011724472045898438, 0.014151573181152344, 0.01657867431640625, 0.019005775451660156, 0.021432876586914062, 0.02385997772216797, 0.026287078857421875, 0.02871417999267578, 0.031141281127929688, 0.033568382263183594, 0.0359954833984375, 0.038422584533691406, 0.04084968566894531, 0.04327678680419922, 0.045703887939453125, 0.04813098907470703, 0.05055809020996094, 0.052985191345214844, 0.05541229248046875, 0.057839393615722656, 0.06026649475097656, 0.06269359588623047, 0.06512069702148438, 0.06754779815673828, 0.06997489929199219, 0.0724020004272461, 0.0748291015625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 3.0, 9.0, 12.0, 8.0, 10.0, 20.0, 28.0, 24.0, 26.0, 40.0, 67.0, 71.0, 129.0, 100.0, 100.0, 82.0, 71.0, 57.0, 26.0, 25.0, 20.0, 22.0, 8.0, 6.0, 10.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08551025390625, -0.08263206481933594, -0.07975387573242188, -0.07687568664550781, -0.07399749755859375, -0.07111930847167969, -0.06824111938476562, -0.06536293029785156, -0.0624847412109375, -0.05960655212402344, -0.056728363037109375, -0.05385017395019531, -0.05097198486328125, -0.04809379577636719, -0.045215606689453125, -0.04233741760253906, -0.039459228515625, -0.03658103942871094, -0.033702850341796875, -0.030824661254882812, -0.02794647216796875, -0.025068283081054688, -0.022190093994140625, -0.019311904907226562, -0.0164337158203125, -0.013555526733398438, -0.010677337646484375, -0.0077991485595703125, -0.00492095947265625, -0.0020427703857421875, 0.000835418701171875, 0.0037136077880859375, 0.006591796875, 0.009469985961914062, 0.012348175048828125, 0.015226364135742188, 0.01810455322265625, 0.020982742309570312, 0.023860931396484375, 0.026739120483398438, 0.0296173095703125, 0.03249549865722656, 0.035373687744140625, 0.03825187683105469, 0.04113006591796875, 0.04400825500488281, 0.046886444091796875, 0.04976463317871094, 0.052642822265625, 0.05552101135253906, 0.058399200439453125, 0.06127738952636719, 0.06415557861328125, 0.06703376770019531, 0.06991195678710938, 0.07279014587402344, 0.0756683349609375, 0.07854652404785156, 0.08142471313476562, 0.08430290222167969, 0.08718109130859375, 0.09005928039550781, 0.09293746948242188, 0.09581565856933594, 0.09869384765625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 17.0, 26.0, 38.0, 28.0, 62.0, 94.0, 84.0, 83.0, 93.0, 98.0, 81.0, 84.0, 60.0, 42.0, 31.0, 25.0, 17.0, 9.0, 6.0, 2.0, 4.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7377037405967712, -0.7131842374801636, -0.6886647343635559, -0.6641452312469482, -0.6396256685256958, -0.6151061654090881, -0.5905866622924805, -0.5660671591758728, -0.5415476560592651, -0.5170281529426575, -0.4925086200237274, -0.46798911690711975, -0.4434695839881897, -0.41895008087158203, -0.39443057775497437, -0.3699110746383667, -0.34539151191711426, -0.3208720088005066, -0.29635247588157654, -0.27183297276496887, -0.2473134547472, -0.22279393672943115, -0.1982744336128235, -0.17375491559505463, -0.14923539757728577, -0.1247158795595169, -0.10019636899232864, -0.07567685842514038, -0.05115734040737152, -0.02663782238960266, -0.002118319272994995, 0.022401198744773865, 0.0469207763671875, 0.07144029438495636, 0.09595980495214462, 0.12047931551933289, 0.14499883353710175, 0.1695183515548706, 0.19403785467147827, 0.21855737268924713, 0.243076890707016, 0.26759639382362366, 0.2921159267425537, 0.3166354298591614, 0.34115493297576904, 0.3656744658946991, 0.39019396901130676, 0.4147135019302368, 0.4392330050468445, 0.46375250816345215, 0.4882720410823822, 0.5127915143966675, 0.5373110771179199, 0.5618305802345276, 0.5863500833511353, 0.6108695864677429, 0.6353890895843506, 0.6599085927009583, 0.6844280958175659, 0.7089476585388184, 0.733467161655426, 0.7579866647720337, 0.7825061678886414, 0.807025671005249, 0.8315452337265015]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 1.0, 5.0, 9.0, 3.0, 3.0, 4.0, 12.0, 12.0, 11.0, 14.0, 16.0, 18.0, 18.0, 16.0, 16.0, 33.0, 32.0, 27.0, 30.0, 37.0, 30.0, 32.0, 32.0, 34.0, 33.0, 39.0, 34.0, 38.0, 34.0, 38.0, 31.0, 33.0, 38.0, 27.0, 32.0, 28.0, 18.0, 18.0, 12.0, 21.0, 15.0, 15.0, 12.0, 9.0, 8.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.5534484386444092, -0.5368196368217468, -0.5201908349990845, -0.5035620927810669, -0.48693329095840454, -0.4703044891357422, -0.4536757171154022, -0.43704694509506226, -0.4204181432723999, -0.40378934144973755, -0.3871605694293976, -0.3705317974090576, -0.35390299558639526, -0.3372741937637329, -0.32064542174339294, -0.304016649723053, -0.2873878479003906, -0.27075904607772827, -0.2541302740573883, -0.23750148713588715, -0.220872700214386, -0.20424391329288483, -0.18761512637138367, -0.1709863394498825, -0.15435755252838135, -0.1377287656068802, -0.12109997868537903, -0.10447119176387787, -0.08784240484237671, -0.07121361792087555, -0.05458483099937439, -0.03795604407787323, -0.021327316761016846, -0.004698529839515686, 0.011930257081985474, 0.028559044003486633, 0.04518783092498779, 0.06181661784648895, 0.07844540476799011, 0.09507419168949127, 0.11170297861099243, 0.1283317655324936, 0.14496055245399475, 0.1615893393754959, 0.17821812629699707, 0.19484691321849823, 0.2114757001399994, 0.22810448706150055, 0.2447332739830017, 0.26136207580566406, 0.27799084782600403, 0.294619619846344, 0.31124842166900635, 0.3278772234916687, 0.34450599551200867, 0.36113476753234863, 0.377763569355011, 0.39439237117767334, 0.4110211431980133, 0.42764991521835327, 0.4442787170410156, 0.460907518863678, 0.47753629088401794, 0.4941650629043579, 0.5107938647270203]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 5.0, 8.0, 18.0, 18.0, 33.0, 53.0, 92.0, 142.0, 220.0, 386.0, 589.0, 1043.0, 1787.0, 3357.0, 6646.0, 13162.0, 28560.0, 65710.0, 160987.0, 430974.0, 1417250.0, 1368515.0, 414983.0, 157679.0, 65154.0, 28410.0, 13469.0, 6734.0, 3659.0, 1969.0, 1044.0, 622.0, 380.0, 206.0, 135.0, 91.0, 52.0, 39.0, 33.0, 18.0, 8.0, 7.0, 11.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.11187744140625, -0.1080179214477539, -0.10415840148925781, -0.10029888153076172, -0.09643936157226562, -0.09257984161376953, -0.08872032165527344, -0.08486080169677734, -0.08100128173828125, -0.07714176177978516, -0.07328224182128906, -0.06942272186279297, -0.06556320190429688, -0.06170368194580078, -0.05784416198730469, -0.053984642028808594, -0.0501251220703125, -0.046265602111816406, -0.04240608215332031, -0.03854656219482422, -0.034687042236328125, -0.03082752227783203, -0.026968002319335938, -0.023108482360839844, -0.01924896240234375, -0.015389442443847656, -0.011529922485351562, -0.007670402526855469, -0.003810882568359375, 4.863739013671875e-05, 0.0039081573486328125, 0.007767677307128906, 0.011627197265625, 0.015486717224121094, 0.019346237182617188, 0.02320575714111328, 0.027065277099609375, 0.03092479705810547, 0.03478431701660156, 0.038643836975097656, 0.04250335693359375, 0.046362876892089844, 0.05022239685058594, 0.05408191680908203, 0.057941436767578125, 0.06180095672607422, 0.06566047668457031, 0.0695199966430664, 0.0733795166015625, 0.0772390365600586, 0.08109855651855469, 0.08495807647705078, 0.08881759643554688, 0.09267711639404297, 0.09653663635253906, 0.10039615631103516, 0.10425567626953125, 0.10811519622802734, 0.11197471618652344, 0.11583423614501953, 0.11969375610351562, 0.12355327606201172, 0.1274127960205078, 0.1312723159790039, 0.1351318359375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 4.0, 2.0, 6.0, 4.0, 5.0, 9.0, 16.0, 8.0, 12.0, 27.0, 15.0, 20.0, 28.0, 29.0, 37.0, 23.0, 48.0, 31.0, 44.0, 35.0, 35.0, 43.0, 38.0, 34.0, 43.0, 39.0, 46.0, 36.0, 25.0, 38.0, 35.0, 24.0, 32.0, 24.0, 20.0, 12.0, 15.0, 9.0, 11.0, 12.0, 6.0, 5.0, 4.0, 3.0, 6.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.074951171875, -0.07263565063476562, -0.07032012939453125, -0.06800460815429688, -0.0656890869140625, -0.06337356567382812, -0.06105804443359375, -0.058742523193359375, -0.056427001953125, -0.054111480712890625, -0.05179595947265625, -0.049480438232421875, -0.0471649169921875, -0.044849395751953125, -0.04253387451171875, -0.040218353271484375, -0.03790283203125, -0.035587310791015625, -0.03327178955078125, -0.030956268310546875, -0.0286407470703125, -0.026325225830078125, -0.02400970458984375, -0.021694183349609375, -0.019378662109375, -0.017063140869140625, -0.01474761962890625, -0.012432098388671875, -0.0101165771484375, -0.007801055908203125, -0.00548553466796875, -0.003170013427734375, -0.0008544921875, 0.001461029052734375, 0.00377655029296875, 0.006092071533203125, 0.0084075927734375, 0.010723114013671875, 0.01303863525390625, 0.015354156494140625, 0.017669677734375, 0.019985198974609375, 0.02230072021484375, 0.024616241455078125, 0.0269317626953125, 0.029247283935546875, 0.03156280517578125, 0.033878326416015625, 0.03619384765625, 0.038509368896484375, 0.04082489013671875, 0.043140411376953125, 0.0454559326171875, 0.047771453857421875, 0.05008697509765625, 0.052402496337890625, 0.054718017578125, 0.057033538818359375, 0.05934906005859375, 0.061664581298828125, 0.0639801025390625, 0.06629562377929688, 0.06861114501953125, 0.07092666625976562, 0.0732421875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 13.0, 15.0, 30.0, 42.0, 67.0, 95.0, 223.0, 366.0, 698.0, 1396.0, 2973.0, 6727.0, 16157.0, 40317.0, 106633.0, 301393.0, 1021096.0, 1849073.0, 551466.0, 183055.0, 67024.0, 26147.0, 10587.0, 4572.0, 2006.0, 986.0, 535.0, 222.0, 143.0, 94.0, 46.0, 34.0, 19.0, 11.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13037109375, -0.12558937072753906, -0.12080764770507812, -0.11602592468261719, -0.11124420166015625, -0.10646247863769531, -0.10168075561523438, -0.09689903259277344, -0.0921173095703125, -0.08733558654785156, -0.08255386352539062, -0.07777214050292969, -0.07299041748046875, -0.06820869445800781, -0.06342697143554688, -0.05864524841308594, -0.053863525390625, -0.04908180236816406, -0.044300079345703125, -0.03951835632324219, -0.03473663330078125, -0.029954910278320312, -0.025173187255859375, -0.020391464233398438, -0.0156097412109375, -0.010828018188476562, -0.006046295166015625, -0.0012645721435546875, 0.00351715087890625, 0.008298873901367188, 0.013080596923828125, 0.017862319946289062, 0.02264404296875, 0.027425765991210938, 0.032207489013671875, 0.03698921203613281, 0.04177093505859375, 0.04655265808105469, 0.051334381103515625, 0.05611610412597656, 0.0608978271484375, 0.06567955017089844, 0.07046127319335938, 0.07524299621582031, 0.08002471923828125, 0.08480644226074219, 0.08958816528320312, 0.09436988830566406, 0.099151611328125, 0.10393333435058594, 0.10871505737304688, 0.11349678039550781, 0.11827850341796875, 0.12306022644042969, 0.12784194946289062, 0.13262367248535156, 0.1374053955078125, 0.14218711853027344, 0.14696884155273438, 0.1517505645751953, 0.15653228759765625, 0.1613140106201172, 0.16609573364257812, 0.17087745666503906, 0.1756591796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 11.0, 19.0, 26.0, 29.0, 40.0, 48.0, 76.0, 87.0, 115.0, 144.0, 245.0, 307.0, 422.0, 645.0, 478.0, 384.0, 258.0, 178.0, 143.0, 104.0, 78.0, 62.0, 38.0, 38.0, 28.0, 11.0, 15.0, 10.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1990966796875, -0.1936798095703125, -0.188262939453125, -0.1828460693359375, -0.17742919921875, -0.1720123291015625, -0.166595458984375, -0.1611785888671875, -0.15576171875, -0.1503448486328125, -0.144927978515625, -0.1395111083984375, -0.13409423828125, -0.1286773681640625, -0.123260498046875, -0.1178436279296875, -0.1124267578125, -0.1070098876953125, -0.101593017578125, -0.0961761474609375, -0.09075927734375, -0.0853424072265625, -0.079925537109375, -0.0745086669921875, -0.069091796875, -0.0636749267578125, -0.058258056640625, -0.0528411865234375, -0.04742431640625, -0.0420074462890625, -0.036590576171875, -0.0311737060546875, -0.0257568359375, -0.0203399658203125, -0.014923095703125, -0.0095062255859375, -0.00408935546875, 0.0013275146484375, 0.006744384765625, 0.0121612548828125, 0.017578125, 0.0229949951171875, 0.028411865234375, 0.0338287353515625, 0.03924560546875, 0.0446624755859375, 0.050079345703125, 0.0554962158203125, 0.0609130859375, 0.0663299560546875, 0.071746826171875, 0.0771636962890625, 0.08258056640625, 0.0879974365234375, 0.093414306640625, 0.0988311767578125, 0.104248046875, 0.1096649169921875, 0.115081787109375, 0.1204986572265625, 0.12591552734375, 0.1313323974609375, 0.136749267578125, 0.1421661376953125, 0.1475830078125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 13.0, 15.0, 27.0, 44.0, 87.0, 95.0, 107.0, 112.0, 134.0, 106.0, 73.0, 52.0, 45.0, 29.0, 17.0, 10.0, 10.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7024692296981812, -0.6666556596755981, -0.6308421492576599, -0.5950285792350769, -0.5592150688171387, -0.5234014987945557, -0.48758795857429504, -0.4517744183540344, -0.4159608781337738, -0.3801473379135132, -0.34433379769325256, -0.30852025747299194, -0.27270668745040894, -0.2368931621313095, -0.2010796070098877, -0.16526606678962708, -0.12945252656936646, -0.09363898634910583, -0.05782543867826462, -0.0220118910074234, 0.01380164921283722, 0.04961518943309784, 0.08542874455451965, 0.12124228477478027, 0.1570558249950409, 0.1928693652153015, 0.22868290543556213, 0.26449644565582275, 0.30031001567840576, 0.336123526096344, 0.371937096118927, 0.4077506363391876, 0.44356417655944824, 0.47937771677970886, 0.5151912569999695, 0.5510048270225525, 0.5868183374404907, 0.6226319074630737, 0.6584454774856567, 0.694258987903595, 0.7300724983215332, 0.7658860683441162, 0.8016995787620544, 0.8375131487846375, 0.8733266592025757, 0.9091402292251587, 0.9449537992477417, 0.9807673096656799, 1.0165808200836182, 1.0523943901062012, 1.0882079601287842, 1.1240214109420776, 1.1598349809646606, 1.1956485509872437, 1.2314621210098267, 1.2672755718231201, 1.3030892610549927, 1.3389028310775757, 1.3747164011001587, 1.4105298519134521, 1.4463434219360352, 1.4821569919586182, 1.5179705619812012, 1.5537841320037842, 1.5895975828170776]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 3.0, 7.0, 8.0, 17.0, 13.0, 22.0, 19.0, 13.0, 24.0, 24.0, 21.0, 21.0, 25.0, 40.0, 40.0, 34.0, 28.0, 35.0, 37.0, 36.0, 39.0, 41.0, 30.0, 41.0, 35.0, 39.0, 33.0, 30.0, 31.0, 19.0, 26.0, 33.0, 19.0, 23.0, 13.0, 15.0, 7.0, 10.0, 10.0, 6.0, 4.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.5141424536705017, -0.497933566570282, -0.48172470927238464, -0.4655158221721649, -0.4493069648742676, -0.43309807777404785, -0.4168891906738281, -0.4006803035736084, -0.38447144627571106, -0.36826255917549133, -0.352053701877594, -0.33584481477737427, -0.31963592767715454, -0.3034270703792572, -0.2872181832790375, -0.27100932598114014, -0.2548004388809204, -0.23859156668186188, -0.22238269448280334, -0.20617380738258362, -0.18996493518352509, -0.17375606298446655, -0.15754717588424683, -0.1413383036851883, -0.12512943148612976, -0.10892055928707123, -0.0927116796374321, -0.07650279998779297, -0.060293927788734436, -0.0440850555896759, -0.027876175940036774, -0.011667296290397644, 0.004541575908660889, 0.02075045183300972, 0.03695932775735855, 0.05316820368170738, 0.06937707960605621, 0.08558595180511475, 0.10179483145475388, 0.118003711104393, 0.13421258330345154, 0.15042145550251007, 0.1666303277015686, 0.18283921480178833, 0.19904808700084686, 0.2152569591999054, 0.23146584630012512, 0.24767471849918365, 0.2638835906982422, 0.2800924777984619, 0.29630133509635925, 0.312510222196579, 0.3287190794944763, 0.34492796659469604, 0.36113685369491577, 0.3773457407951355, 0.39355459809303284, 0.40976348519325256, 0.4259723424911499, 0.44218122959136963, 0.45839011669158936, 0.4745989739894867, 0.4908078610897064, 0.5070167183876038, 0.5232256054878235]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 12.0, 22.0, 37.0, 35.0, 63.0, 98.0, 154.0, 236.0, 303.0, 434.0, 589.0, 857.0, 1117.0, 1642.0, 2242.0, 3105.0, 4101.0, 5675.0, 8170.0, 11961.0, 19198.0, 36120.0, 90420.0, 260828.0, 340574.0, 139635.0, 49772.0, 23935.0, 14133.0, 9381.0, 6522.0, 4660.0, 3447.0, 2514.0, 1878.0, 1324.0, 998.0, 684.0, 501.0, 402.0, 260.0, 176.0, 117.0, 85.0, 37.0, 37.0, 21.0, 13.0, 16.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.1455078125, -0.14112472534179688, -0.13674163818359375, -0.13235855102539062, -0.1279754638671875, -0.12359237670898438, -0.11920928955078125, -0.11482620239257812, -0.110443115234375, -0.10606002807617188, -0.10167694091796875, -0.09729385375976562, -0.0929107666015625, -0.08852767944335938, -0.08414459228515625, -0.07976150512695312, -0.07537841796875, -0.07099533081054688, -0.06661224365234375, -0.062229156494140625, -0.0578460693359375, -0.053462982177734375, -0.04907989501953125, -0.044696807861328125, -0.040313720703125, -0.035930633544921875, -0.03154754638671875, -0.027164459228515625, -0.0227813720703125, -0.018398284912109375, -0.01401519775390625, -0.009632110595703125, -0.0052490234375, -0.000865936279296875, 0.00351715087890625, 0.007900238037109375, 0.0122833251953125, 0.016666412353515625, 0.02104949951171875, 0.025432586669921875, 0.029815673828125, 0.034198760986328125, 0.03858184814453125, 0.042964935302734375, 0.0473480224609375, 0.051731109619140625, 0.05611419677734375, 0.060497283935546875, 0.06488037109375, 0.06926345825195312, 0.07364654541015625, 0.07802963256835938, 0.0824127197265625, 0.08679580688476562, 0.09117889404296875, 0.09556198120117188, 0.099945068359375, 0.10432815551757812, 0.10871124267578125, 0.11309432983398438, 0.1174774169921875, 0.12186050415039062, 0.12624359130859375, 0.13062667846679688, 0.135009765625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 10.0, 5.0, 4.0, 10.0, 11.0, 19.0, 20.0, 18.0, 21.0, 27.0, 23.0, 20.0, 34.0, 47.0, 32.0, 46.0, 37.0, 41.0, 42.0, 53.0, 50.0, 42.0, 48.0, 45.0, 34.0, 32.0, 27.0, 30.0, 28.0, 20.0, 14.0, 19.0, 14.0, 15.0, 15.0, 9.0, 8.0, 8.0, 5.0, 5.0, 1.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08038330078125, -0.07783889770507812, -0.07529449462890625, -0.07275009155273438, -0.0702056884765625, -0.06766128540039062, -0.06511688232421875, -0.06257247924804688, -0.060028076171875, -0.057483673095703125, -0.05493927001953125, -0.052394866943359375, -0.0498504638671875, -0.047306060791015625, -0.04476165771484375, -0.042217254638671875, -0.0396728515625, -0.037128448486328125, -0.03458404541015625, -0.032039642333984375, -0.0294952392578125, -0.026950836181640625, -0.02440643310546875, -0.021862030029296875, -0.019317626953125, -0.016773223876953125, -0.01422882080078125, -0.011684417724609375, -0.0091400146484375, -0.006595611572265625, -0.00405120849609375, -0.001506805419921875, 0.00103759765625, 0.003582000732421875, 0.00612640380859375, 0.008670806884765625, 0.0112152099609375, 0.013759613037109375, 0.01630401611328125, 0.018848419189453125, 0.021392822265625, 0.023937225341796875, 0.02648162841796875, 0.029026031494140625, 0.0315704345703125, 0.034114837646484375, 0.03665924072265625, 0.039203643798828125, 0.041748046875, 0.044292449951171875, 0.04683685302734375, 0.049381256103515625, 0.0519256591796875, 0.054470062255859375, 0.05701446533203125, 0.059558868408203125, 0.062103271484375, 0.06464767456054688, 0.06719207763671875, 0.06973648071289062, 0.0722808837890625, 0.07482528686523438, 0.07736968994140625, 0.07991409301757812, 0.08245849609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 15.0, 10.0, 19.0, 22.0, 35.0, 61.0, 67.0, 135.0, 235.0, 417.0, 873.0, 1744.0, 3752.0, 7946.0, 17616.0, 40351.0, 153816.0, 585710.0, 161217.0, 40844.0, 17816.0, 8195.0, 3826.0, 1850.0, 884.0, 428.0, 261.0, 132.0, 99.0, 53.0, 42.0, 18.0, 16.0, 12.0, 7.0, 7.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2529296875, -0.24538230895996094, -0.23783493041992188, -0.2302875518798828, -0.22274017333984375, -0.2151927947998047, -0.20764541625976562, -0.20009803771972656, -0.1925506591796875, -0.18500328063964844, -0.17745590209960938, -0.1699085235595703, -0.16236114501953125, -0.1548137664794922, -0.14726638793945312, -0.13971900939941406, -0.132171630859375, -0.12462425231933594, -0.11707687377929688, -0.10952949523925781, -0.10198211669921875, -0.09443473815917969, -0.08688735961914062, -0.07933998107910156, -0.0717926025390625, -0.06424522399902344, -0.056697845458984375, -0.04915046691894531, -0.04160308837890625, -0.03405570983886719, -0.026508331298828125, -0.018960952758789062, -0.01141357421875, -0.0038661956787109375, 0.003681182861328125, 0.011228561401367188, 0.01877593994140625, 0.026323318481445312, 0.033870697021484375, 0.04141807556152344, 0.0489654541015625, 0.05651283264160156, 0.06406021118164062, 0.07160758972167969, 0.07915496826171875, 0.08670234680175781, 0.09424972534179688, 0.10179710388183594, 0.109344482421875, 0.11689186096191406, 0.12443923950195312, 0.1319866180419922, 0.13953399658203125, 0.1470813751220703, 0.15462875366210938, 0.16217613220214844, 0.1697235107421875, 0.17727088928222656, 0.18481826782226562, 0.1923656463623047, 0.19991302490234375, 0.2074604034423828, 0.21500778198242188, 0.22255516052246094, 0.2301025390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 7.0, 5.0, 3.0, 5.0, 6.0, 16.0, 8.0, 16.0, 15.0, 19.0, 26.0, 23.0, 21.0, 31.0, 33.0, 30.0, 27.0, 36.0, 42.0, 44.0, 48.0, 40.0, 32.0, 39.0, 55.0, 21.0, 33.0, 34.0, 26.0, 31.0, 31.0, 29.0, 30.0, 17.0, 17.0, 19.0, 14.0, 13.0, 11.0, 12.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.222900390625, -0.21584320068359375, -0.2087860107421875, -0.20172882080078125, -0.194671630859375, -0.18761444091796875, -0.1805572509765625, -0.17350006103515625, -0.16644287109375, -0.15938568115234375, -0.1523284912109375, -0.14527130126953125, -0.138214111328125, -0.13115692138671875, -0.1240997314453125, -0.11704254150390625, -0.1099853515625, -0.10292816162109375, -0.0958709716796875, -0.08881378173828125, -0.081756591796875, -0.07469940185546875, -0.0676422119140625, -0.06058502197265625, -0.05352783203125, -0.04647064208984375, -0.0394134521484375, -0.03235626220703125, -0.025299072265625, -0.01824188232421875, -0.0111846923828125, -0.00412750244140625, 0.0029296875, 0.00998687744140625, 0.0170440673828125, 0.02410125732421875, 0.031158447265625, 0.03821563720703125, 0.0452728271484375, 0.05233001708984375, 0.05938720703125, 0.06644439697265625, 0.0735015869140625, 0.08055877685546875, 0.087615966796875, 0.09467315673828125, 0.1017303466796875, 0.10878753662109375, 0.1158447265625, 0.12290191650390625, 0.1299591064453125, 0.13701629638671875, 0.144073486328125, 0.15113067626953125, 0.1581878662109375, 0.16524505615234375, 0.17230224609375, 0.17935943603515625, 0.1864166259765625, 0.19347381591796875, 0.200531005859375, 0.20758819580078125, 0.2146453857421875, 0.22170257568359375, 0.228759765625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 5.0, 15.0, 17.0, 21.0, 23.0, 19.0, 60.0, 64.0, 99.0, 155.0, 222.0, 374.0, 523.0, 790.0, 1155.0, 1844.0, 2809.0, 4019.0, 6138.0, 9550.0, 16587.0, 36088.0, 107074.0, 378094.0, 322748.0, 88128.0, 31023.0, 15028.0, 8791.0, 5658.0, 3949.0, 2500.0, 1714.0, 1113.0, 774.0, 462.0, 280.0, 237.0, 128.0, 88.0, 67.0, 44.0, 27.0, 21.0, 13.0, 8.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.0732421875, -0.07079410552978516, -0.06834602355957031, -0.06589794158935547, -0.06344985961914062, -0.06100177764892578, -0.05855369567871094, -0.056105613708496094, -0.05365753173828125, -0.051209449768066406, -0.04876136779785156, -0.04631328582763672, -0.043865203857421875, -0.04141712188720703, -0.03896903991699219, -0.036520957946777344, -0.0340728759765625, -0.031624794006347656, -0.029176712036132812, -0.02672863006591797, -0.024280548095703125, -0.02183246612548828, -0.019384384155273438, -0.016936302185058594, -0.01448822021484375, -0.012040138244628906, -0.009592056274414062, -0.007143974304199219, -0.004695892333984375, -0.0022478103637695312, 0.0002002716064453125, 0.0026483535766601562, 0.005096435546875, 0.007544517517089844, 0.009992599487304688, 0.012440681457519531, 0.014888763427734375, 0.01733684539794922, 0.019784927368164062, 0.022233009338378906, 0.02468109130859375, 0.027129173278808594, 0.029577255249023438, 0.03202533721923828, 0.034473419189453125, 0.03692150115966797, 0.03936958312988281, 0.041817665100097656, 0.0442657470703125, 0.046713829040527344, 0.04916191101074219, 0.05160999298095703, 0.054058074951171875, 0.05650615692138672, 0.05895423889160156, 0.061402320861816406, 0.06385040283203125, 0.0662984848022461, 0.06874656677246094, 0.07119464874267578, 0.07364273071289062, 0.07609081268310547, 0.07853889465332031, 0.08098697662353516, 0.08343505859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 4.0, 3.0, 11.0, 8.0, 12.0, 12.0, 7.0, 24.0, 23.0, 65.0, 82.0, 155.0, 189.0, 148.0, 74.0, 42.0, 36.0, 20.0, 16.0, 10.0, 6.0, 1.0, 6.0, 5.0, 6.0, 4.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.944469451904297e-05, -2.850312739610672e-05, -2.756156027317047e-05, -2.6619993150234222e-05, -2.5678426027297974e-05, -2.4736858904361725e-05, -2.3795291781425476e-05, -2.2853724658489227e-05, -2.191215753555298e-05, -2.097059041261673e-05, -2.002902328968048e-05, -1.9087456166744232e-05, -1.8145889043807983e-05, -1.7204321920871735e-05, -1.6262754797935486e-05, -1.5321187674999237e-05, -1.4379620552062988e-05, -1.343805342912674e-05, -1.249648630619049e-05, -1.1554919183254242e-05, -1.0613352060317993e-05, -9.671784937381744e-06, -8.730217814445496e-06, -7.788650691509247e-06, -6.847083568572998e-06, -5.905516445636749e-06, -4.9639493227005005e-06, -4.022382199764252e-06, -3.080815076828003e-06, -2.139247953891754e-06, -1.1976808309555054e-06, -2.561137080192566e-07, 6.854534149169922e-07, 1.627020537853241e-06, 2.5685876607894897e-06, 3.5101547837257385e-06, 4.451721906661987e-06, 5.393289029598236e-06, 6.334856152534485e-06, 7.276423275470734e-06, 8.217990398406982e-06, 9.159557521343231e-06, 1.010112464427948e-05, 1.1042691767215729e-05, 1.1984258890151978e-05, 1.2925826013088226e-05, 1.3867393136024475e-05, 1.4808960258960724e-05, 1.5750527381896973e-05, 1.669209450483322e-05, 1.763366162776947e-05, 1.857522875070572e-05, 1.9516795873641968e-05, 2.0458362996578217e-05, 2.1399930119514465e-05, 2.2341497242450714e-05, 2.3283064365386963e-05, 2.422463148832321e-05, 2.516619861125946e-05, 2.610776573419571e-05, 2.7049332857131958e-05, 2.7990899980068207e-05, 2.8932467103004456e-05, 2.9874034225940704e-05, 3.081560134887695e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 8.0, 4.0, 10.0, 16.0, 30.0, 47.0, 65.0, 102.0, 175.0, 272.0, 505.0, 834.0, 1703.0, 3062.0, 6087.0, 12123.0, 29335.0, 106443.0, 377236.0, 360183.0, 98569.0, 27633.0, 11659.0, 5724.0, 3040.0, 1584.0, 884.0, 498.0, 281.0, 141.0, 107.0, 69.0, 44.0, 28.0, 17.0, 16.0, 7.0, 5.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0748291015625, -0.07205486297607422, -0.06928062438964844, -0.06650638580322266, -0.06373214721679688, -0.060957908630371094, -0.05818367004394531, -0.05540943145751953, -0.05263519287109375, -0.04986095428466797, -0.04708671569824219, -0.044312477111816406, -0.041538238525390625, -0.038763999938964844, -0.03598976135253906, -0.03321552276611328, -0.0304412841796875, -0.02766704559326172, -0.024892807006835938, -0.022118568420410156, -0.019344329833984375, -0.016570091247558594, -0.013795852661132812, -0.011021614074707031, -0.00824737548828125, -0.005473136901855469, -0.0026988983154296875, 7.534027099609375e-05, 0.002849578857421875, 0.005623817443847656, 0.008398056030273438, 0.011172294616699219, 0.013946533203125, 0.01672077178955078, 0.019495010375976562, 0.022269248962402344, 0.025043487548828125, 0.027817726135253906, 0.030591964721679688, 0.03336620330810547, 0.03614044189453125, 0.03891468048095703, 0.04168891906738281, 0.044463157653808594, 0.047237396240234375, 0.050011634826660156, 0.05278587341308594, 0.05556011199951172, 0.0583343505859375, 0.06110858917236328, 0.06388282775878906, 0.06665706634521484, 0.06943130493164062, 0.0722055435180664, 0.07497978210449219, 0.07775402069091797, 0.08052825927734375, 0.08330249786376953, 0.08607673645019531, 0.0888509750366211, 0.09162521362304688, 0.09439945220947266, 0.09717369079589844, 0.09994792938232422, 0.10272216796875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 2.0, 9.0, 7.0, 14.0, 22.0, 44.0, 59.0, 59.0, 87.0, 89.0, 105.0, 109.0, 88.0, 79.0, 61.0, 35.0, 32.0, 19.0, 12.0, 15.0, 15.0, 8.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09814453125, -0.09505748748779297, -0.09197044372558594, -0.0888833999633789, -0.08579635620117188, -0.08270931243896484, -0.07962226867675781, -0.07653522491455078, -0.07344818115234375, -0.07036113739013672, -0.06727409362792969, -0.06418704986572266, -0.061100006103515625, -0.058012962341308594, -0.05492591857910156, -0.05183887481689453, -0.0487518310546875, -0.04566478729248047, -0.04257774353027344, -0.039490699768066406, -0.036403656005859375, -0.033316612243652344, -0.030229568481445312, -0.02714252471923828, -0.02405548095703125, -0.02096843719482422, -0.017881393432617188, -0.014794349670410156, -0.011707305908203125, -0.008620262145996094, -0.0055332183837890625, -0.0024461746215820312, 0.000640869140625, 0.0037279129028320312, 0.0068149566650390625, 0.009902000427246094, 0.012989044189453125, 0.016076087951660156, 0.019163131713867188, 0.02225017547607422, 0.02533721923828125, 0.02842426300048828, 0.03151130676269531, 0.034598350524902344, 0.037685394287109375, 0.040772438049316406, 0.04385948181152344, 0.04694652557373047, 0.0500335693359375, 0.05312061309814453, 0.05620765686035156, 0.059294700622558594, 0.062381744384765625, 0.06546878814697266, 0.06855583190917969, 0.07164287567138672, 0.07472991943359375, 0.07781696319580078, 0.08090400695800781, 0.08399105072021484, 0.08707809448242188, 0.0901651382446289, 0.09325218200683594, 0.09633922576904297, 0.09942626953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 9.0, 11.0, 13.0, 29.0, 29.0, 39.0, 62.0, 88.0, 105.0, 101.0, 95.0, 109.0, 83.0, 72.0, 45.0, 28.0, 27.0, 18.0, 7.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8294528722763062, -0.8005977869033813, -0.7717427611351013, -0.7428876757621765, -0.7140326499938965, -0.6851775646209717, -0.6563225388526917, -0.6274674534797668, -0.5986124277114868, -0.569757342338562, -0.540902316570282, -0.5120472311973572, -0.48319220542907715, -0.45433712005615234, -0.4254820942878723, -0.3966270089149475, -0.3677719533443451, -0.3389168977737427, -0.31006184220314026, -0.28120678663253784, -0.2523517310619354, -0.22349666059017181, -0.1946416050195694, -0.16578654944896698, -0.13693149387836456, -0.10807643830776215, -0.07922138273715973, -0.050366319715976715, -0.021511264145374298, 0.007343798875808716, 0.03619885444641113, 0.06505391001701355, 0.09390896558761597, 0.12276402115821838, 0.1516190767288208, 0.18047413229942322, 0.20932918787002563, 0.23818425834178925, 0.26703929901123047, 0.2958943843841553, 0.3247494101524353, 0.3536044657230377, 0.38245952129364014, 0.41131457686424255, 0.44016963243484497, 0.4690247178077698, 0.4978797435760498, 0.5267348289489746, 0.5555899143218994, 0.5844449996948242, 0.6133000254631042, 0.642155110836029, 0.6710101366043091, 0.6998652219772339, 0.7287202477455139, 0.7575753331184387, 0.7864303588867188, 0.8152854442596436, 0.8441404700279236, 0.8729955554008484, 0.9018505811691284, 0.9307056665420532, 0.9595606923103333, 0.9884157776832581, 1.017270803451538]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 14.0, 7.0, 12.0, 10.0, 18.0, 31.0, 26.0, 27.0, 26.0, 31.0, 29.0, 33.0, 35.0, 42.0, 42.0, 38.0, 42.0, 36.0, 34.0, 45.0, 46.0, 37.0, 37.0, 32.0, 36.0, 38.0, 25.0, 23.0, 28.0, 25.0, 18.0, 9.0, 11.0, 10.0, 8.0, 8.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.7734276652336121, -0.7516672611236572, -0.7299067974090576, -0.7081463932991028, -0.686385989189148, -0.6646255254745483, -0.6428651213645935, -0.6211047172546387, -0.5993442535400391, -0.5775838494300842, -0.5558233857154846, -0.5340629816055298, -0.512302577495575, -0.49054214358329773, -0.4687817096710205, -0.4470213055610657, -0.42526090145111084, -0.4035004675388336, -0.3817400634288788, -0.35997962951660156, -0.33821922540664673, -0.3164587914943695, -0.2946983575820923, -0.27293795347213745, -0.25117751955986023, -0.2294171005487442, -0.20765668153762817, -0.18589624762535095, -0.16413582861423492, -0.1423754096031189, -0.12061497569084167, -0.09885455667972565, -0.0770941972732544, -0.05533377453684807, -0.03357335180044174, -0.011812925338745117, 0.00994749367237091, 0.03170791268348694, 0.05346834659576416, 0.07522876560688019, 0.09698918461799622, 0.11874960362911224, 0.14051002264022827, 0.1622704565525055, 0.18403087556362152, 0.20579129457473755, 0.22755172848701477, 0.2493121474981308, 0.2710725665092468, 0.29283300042152405, 0.3145934045314789, 0.3363538384437561, 0.35811424255371094, 0.37987467646598816, 0.4016351103782654, 0.4233955144882202, 0.44515594840049744, 0.46691638231277466, 0.4886767864227295, 0.5104372501373291, 0.5321976542472839, 0.5539580583572388, 0.5757185220718384, 0.5974789261817932, 0.619239330291748]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 10.0, 31.0, 28.0, 35.0, 51.0, 83.0, 139.0, 184.0, 279.0, 434.0, 615.0, 1091.0, 1733.0, 2969.0, 5336.0, 10625.0, 20989.0, 43596.0, 95458.0, 223266.0, 604057.0, 1578377.0, 999220.0, 343729.0, 138885.0, 62249.0, 29023.0, 14332.0, 7526.0, 3985.0, 2259.0, 1299.0, 801.0, 544.0, 315.0, 227.0, 143.0, 123.0, 59.0, 65.0, 33.0, 18.0, 19.0, 17.0, 3.0, 9.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0994873046875, -0.09624958038330078, -0.09301185607910156, -0.08977413177490234, -0.08653640747070312, -0.0832986831665039, -0.08006095886230469, -0.07682323455810547, -0.07358551025390625, -0.07034778594970703, -0.06711006164550781, -0.0638723373413086, -0.060634613037109375, -0.057396888732910156, -0.05415916442871094, -0.05092144012451172, -0.0476837158203125, -0.04444599151611328, -0.04120826721191406, -0.037970542907714844, -0.034732818603515625, -0.031495094299316406, -0.028257369995117188, -0.02501964569091797, -0.02178192138671875, -0.01854419708251953, -0.015306472778320312, -0.012068748474121094, -0.008831024169921875, -0.005593299865722656, -0.0023555755615234375, 0.0008821487426757812, 0.004119873046875, 0.007357597351074219, 0.010595321655273438, 0.013833045959472656, 0.017070770263671875, 0.020308494567871094, 0.023546218872070312, 0.02678394317626953, 0.03002166748046875, 0.03325939178466797, 0.03649711608886719, 0.039734840393066406, 0.042972564697265625, 0.046210289001464844, 0.04944801330566406, 0.05268573760986328, 0.0559234619140625, 0.05916118621826172, 0.06239891052246094, 0.06563663482666016, 0.06887435913085938, 0.0721120834350586, 0.07534980773925781, 0.07858753204345703, 0.08182525634765625, 0.08506298065185547, 0.08830070495605469, 0.0915384292602539, 0.09477615356445312, 0.09801387786865234, 0.10125160217285156, 0.10448932647705078, 0.10772705078125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 13.0, 4.0, 6.0, 12.0, 10.0, 22.0, 11.0, 26.0, 20.0, 16.0, 30.0, 29.0, 31.0, 32.0, 36.0, 47.0, 45.0, 51.0, 46.0, 43.0, 42.0, 41.0, 41.0, 40.0, 38.0, 31.0, 34.0, 28.0, 34.0, 23.0, 17.0, 21.0, 10.0, 17.0, 6.0, 16.0, 11.0, 3.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0897216796875, -0.08702754974365234, -0.08433341979980469, -0.08163928985595703, -0.07894515991210938, -0.07625102996826172, -0.07355690002441406, -0.0708627700805664, -0.06816864013671875, -0.0654745101928711, -0.06278038024902344, -0.06008625030517578, -0.057392120361328125, -0.05469799041748047, -0.05200386047363281, -0.049309730529785156, -0.0466156005859375, -0.043921470642089844, -0.04122734069824219, -0.03853321075439453, -0.035839080810546875, -0.03314495086669922, -0.030450820922851562, -0.027756690979003906, -0.02506256103515625, -0.022368431091308594, -0.019674301147460938, -0.01698017120361328, -0.014286041259765625, -0.011591911315917969, -0.008897781372070312, -0.006203651428222656, -0.003509521484375, -0.0008153915405273438, 0.0018787384033203125, 0.004572868347167969, 0.007266998291015625, 0.009961128234863281, 0.012655258178710938, 0.015349388122558594, 0.01804351806640625, 0.020737648010253906, 0.023431777954101562, 0.02612590789794922, 0.028820037841796875, 0.03151416778564453, 0.03420829772949219, 0.036902427673339844, 0.0395965576171875, 0.042290687561035156, 0.04498481750488281, 0.04767894744873047, 0.050373077392578125, 0.05306720733642578, 0.05576133728027344, 0.058455467224121094, 0.06114959716796875, 0.0638437271118164, 0.06653785705566406, 0.06923198699951172, 0.07192611694335938, 0.07462024688720703, 0.07731437683105469, 0.08000850677490234, 0.08270263671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 8.0, 12.0, 15.0, 29.0, 45.0, 75.0, 152.0, 275.0, 638.0, 1418.0, 3666.0, 11605.0, 42099.0, 174306.0, 957842.0, 2450810.0, 425551.0, 91693.0, 23311.0, 6660.0, 2276.0, 928.0, 418.0, 193.0, 124.0, 41.0, 34.0, 20.0, 18.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16064453125, -0.15343475341796875, -0.1462249755859375, -0.13901519775390625, -0.131805419921875, -0.12459564208984375, -0.1173858642578125, -0.11017608642578125, -0.10296630859375, -0.09575653076171875, -0.0885467529296875, -0.08133697509765625, -0.074127197265625, -0.06691741943359375, -0.0597076416015625, -0.05249786376953125, -0.0452880859375, -0.03807830810546875, -0.0308685302734375, -0.02365875244140625, -0.016448974609375, -0.00923919677734375, -0.0020294189453125, 0.00518035888671875, 0.01239013671875, 0.01959991455078125, 0.0268096923828125, 0.03401947021484375, 0.041229248046875, 0.04843902587890625, 0.0556488037109375, 0.06285858154296875, 0.070068359375, 0.07727813720703125, 0.0844879150390625, 0.09169769287109375, 0.098907470703125, 0.10611724853515625, 0.1133270263671875, 0.12053680419921875, 0.12774658203125, 0.13495635986328125, 0.1421661376953125, 0.14937591552734375, 0.156585693359375, 0.16379547119140625, 0.1710052490234375, 0.17821502685546875, 0.1854248046875, 0.19263458251953125, 0.1998443603515625, 0.20705413818359375, 0.214263916015625, 0.22147369384765625, 0.2286834716796875, 0.23589324951171875, 0.24310302734375, 0.25031280517578125, 0.2575225830078125, 0.26473236083984375, 0.271942138671875, 0.27915191650390625, 0.2863616943359375, 0.29357147216796875, 0.30078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 5.0, 18.0, 11.0, 21.0, 30.0, 39.0, 48.0, 65.0, 99.0, 118.0, 165.0, 233.0, 343.0, 486.0, 665.0, 552.0, 357.0, 235.0, 159.0, 129.0, 92.0, 56.0, 39.0, 29.0, 25.0, 11.0, 19.0, 10.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2318115234375, -0.2254657745361328, -0.21912002563476562, -0.21277427673339844, -0.20642852783203125, -0.20008277893066406, -0.19373703002929688, -0.1873912811279297, -0.1810455322265625, -0.1746997833251953, -0.16835403442382812, -0.16200828552246094, -0.15566253662109375, -0.14931678771972656, -0.14297103881835938, -0.1366252899169922, -0.130279541015625, -0.12393379211425781, -0.11758804321289062, -0.11124229431152344, -0.10489654541015625, -0.09855079650878906, -0.09220504760742188, -0.08585929870605469, -0.0795135498046875, -0.07316780090332031, -0.06682205200195312, -0.06047630310058594, -0.05413055419921875, -0.04778480529785156, -0.041439056396484375, -0.03509330749511719, -0.02874755859375, -0.022401809692382812, -0.016056060791015625, -0.009710311889648438, -0.00336456298828125, 0.0029811859130859375, 0.009326934814453125, 0.015672683715820312, 0.0220184326171875, 0.028364181518554688, 0.034709930419921875, 0.04105567932128906, 0.04740142822265625, 0.05374717712402344, 0.060092926025390625, 0.06643867492675781, 0.072784423828125, 0.07913017272949219, 0.08547592163085938, 0.09182167053222656, 0.09816741943359375, 0.10451316833496094, 0.11085891723632812, 0.11720466613769531, 0.1235504150390625, 0.1298961639404297, 0.13624191284179688, 0.14258766174316406, 0.14893341064453125, 0.15527915954589844, 0.16162490844726562, 0.1679706573486328, 0.17431640625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 13.0, 28.0, 45.0, 65.0, 87.0, 109.0, 152.0, 123.0, 118.0, 89.0, 57.0, 50.0, 23.0, 10.0, 12.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0661143064498901, -1.0239194631576538, -0.981724739074707, -0.9395298957824707, -0.8973351716995239, -0.8551403284072876, -0.812945544719696, -0.7707507610321045, -0.7285559773445129, -0.6863611936569214, -0.6441664099693298, -0.6019716262817383, -0.559776782989502, -0.5175820589065552, -0.47538721561431885, -0.4331924319267273, -0.39099764823913574, -0.3488028645515442, -0.30660808086395264, -0.2644132673740387, -0.22221848368644714, -0.1800236999988556, -0.13782888650894165, -0.0956341028213501, -0.053439319133758545, -0.011244527995586395, 0.030950263142585754, 0.0731450617313385, 0.11533984541893005, 0.1575346291065216, 0.19972944259643555, 0.2419242262840271, 0.2841188907623291, 0.32631367444992065, 0.3685084581375122, 0.41070327162742615, 0.4528980553150177, 0.49509283900260925, 0.5372876524925232, 0.5794824361801147, 0.6216772198677063, 0.6638720035552979, 0.7060667872428894, 0.748261570930481, 0.7904564142227173, 0.8326511383056641, 0.8748459815979004, 0.9170407652854919, 0.9592355489730835, 1.0014303922653198, 1.0436251163482666, 1.085819959640503, 1.1280146837234497, 1.170209527015686, 1.2124042510986328, 1.2545990943908691, 1.2967939376831055, 1.3389887809753418, 1.3811835050582886, 1.423378348350525, 1.4655730724334717, 1.507767915725708, 1.5499627590179443, 1.5921574831008911, 1.634352207183838]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 13.0, 7.0, 8.0, 13.0, 11.0, 14.0, 20.0, 21.0, 34.0, 30.0, 34.0, 36.0, 39.0, 52.0, 51.0, 50.0, 61.0, 50.0, 46.0, 43.0, 44.0, 50.0, 40.0, 36.0, 35.0, 32.0, 27.0, 23.0, 28.0, 13.0, 15.0, 11.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6467407941818237, -0.6221418976783752, -0.5975430011749268, -0.5729441046714783, -0.5483452081680298, -0.5237463116645813, -0.4991474449634552, -0.4745485484600067, -0.4499496519565582, -0.42535075545310974, -0.40075185894966125, -0.37615299224853516, -0.35155409574508667, -0.3269551992416382, -0.3023563027381897, -0.2777574062347412, -0.2531585097312927, -0.22855961322784424, -0.20396071672439575, -0.17936183512210846, -0.15476293861865997, -0.1301640421152115, -0.1055651605129242, -0.08096626400947571, -0.05636736750602722, -0.031768474727869034, -0.007169581949710846, 0.017429307103157043, 0.04202820360660553, 0.06662710011005402, 0.09122598171234131, 0.1158248782157898, 0.14042383432388306, 0.16502273082733154, 0.18962162733078003, 0.21422050893306732, 0.2388194054365158, 0.2634183168411255, 0.2880171835422516, 0.3126160800457001, 0.33721497654914856, 0.36181387305259705, 0.38641276955604553, 0.41101163625717163, 0.4356105327606201, 0.4602094292640686, 0.4848083257675171, 0.5094072222709656, 0.5340061187744141, 0.5586050152778625, 0.583203911781311, 0.6078028082847595, 0.632401704788208, 0.6570006012916565, 0.681599497795105, 0.7061983346939087, 0.730797290802002, 0.7553961873054504, 0.7799950838088989, 0.8045939803123474, 0.8291928768157959, 0.8537917733192444, 0.8783906698226929, 0.9029895067214966, 0.9275884032249451]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 5.0, 18.0, 31.0, 43.0, 94.0, 119.0, 246.0, 478.0, 767.0, 1374.0, 2421.0, 4165.0, 7135.0, 12589.0, 22234.0, 47564.0, 177692.0, 480145.0, 188798.0, 49569.0, 22695.0, 12853.0, 7447.0, 4325.0, 2500.0, 1370.0, 800.0, 462.0, 245.0, 135.0, 78.0, 47.0, 26.0, 23.0, 12.0, 12.0, 3.0, 6.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.20654296875, -0.20019149780273438, -0.19384002685546875, -0.18748855590820312, -0.1811370849609375, -0.17478561401367188, -0.16843414306640625, -0.16208267211914062, -0.155731201171875, -0.14937973022460938, -0.14302825927734375, -0.13667678833007812, -0.1303253173828125, -0.12397384643554688, -0.11762237548828125, -0.11127090454101562, -0.10491943359375, -0.09856796264648438, -0.09221649169921875, -0.08586502075195312, -0.0795135498046875, -0.07316207885742188, -0.06681060791015625, -0.060459136962890625, -0.054107666015625, -0.047756195068359375, -0.04140472412109375, -0.035053253173828125, -0.0287017822265625, -0.022350311279296875, -0.01599884033203125, -0.009647369384765625, -0.0032958984375, 0.003055572509765625, 0.00940704345703125, 0.015758514404296875, 0.0221099853515625, 0.028461456298828125, 0.03481292724609375, 0.041164398193359375, 0.047515869140625, 0.053867340087890625, 0.06021881103515625, 0.06657028198242188, 0.0729217529296875, 0.07927322387695312, 0.08562469482421875, 0.09197616577148438, 0.09832763671875, 0.10467910766601562, 0.11103057861328125, 0.11738204956054688, 0.1237335205078125, 0.13008499145507812, 0.13643646240234375, 0.14278793334960938, 0.149139404296875, 0.15549087524414062, 0.16184234619140625, 0.16819381713867188, 0.1745452880859375, 0.18089675903320312, 0.18724822998046875, 0.19359970092773438, 0.199951171875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 8.0, 12.0, 15.0, 14.0, 19.0, 18.0, 17.0, 27.0, 26.0, 34.0, 36.0, 29.0, 44.0, 41.0, 40.0, 42.0, 49.0, 55.0, 40.0, 41.0, 60.0, 46.0, 34.0, 31.0, 29.0, 25.0, 31.0, 17.0, 25.0, 23.0, 19.0, 17.0, 7.0, 7.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.09814453125, -0.09541130065917969, -0.09267807006835938, -0.08994483947753906, -0.08721160888671875, -0.08447837829589844, -0.08174514770507812, -0.07901191711425781, -0.0762786865234375, -0.07354545593261719, -0.07081222534179688, -0.06807899475097656, -0.06534576416015625, -0.06261253356933594, -0.059879302978515625, -0.05714607238769531, -0.054412841796875, -0.05167961120605469, -0.048946380615234375, -0.04621315002441406, -0.04347991943359375, -0.04074668884277344, -0.038013458251953125, -0.03528022766113281, -0.0325469970703125, -0.029813766479492188, -0.027080535888671875, -0.024347305297851562, -0.02161407470703125, -0.018880844116210938, -0.016147613525390625, -0.013414382934570312, -0.01068115234375, -0.007947921752929688, -0.005214691162109375, -0.0024814605712890625, 0.00025177001953125, 0.0029850006103515625, 0.005718231201171875, 0.008451461791992188, 0.0111846923828125, 0.013917922973632812, 0.016651153564453125, 0.019384384155273438, 0.02211761474609375, 0.024850845336914062, 0.027584075927734375, 0.030317306518554688, 0.033050537109375, 0.03578376770019531, 0.038516998291015625, 0.04125022888183594, 0.04398345947265625, 0.04671669006347656, 0.049449920654296875, 0.05218315124511719, 0.0549163818359375, 0.05764961242675781, 0.060382843017578125, 0.06311607360839844, 0.06584930419921875, 0.06858253479003906, 0.07131576538085938, 0.07404899597167969, 0.0767822265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 9.0, 3.0, 8.0, 12.0, 20.0, 37.0, 52.0, 80.0, 130.0, 265.0, 491.0, 952.0, 2325.0, 5832.0, 15261.0, 40981.0, 212865.0, 624743.0, 97727.0, 28284.0, 10958.0, 4249.0, 1695.0, 706.0, 360.0, 199.0, 126.0, 69.0, 51.0, 31.0, 14.0, 13.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.310546875, -0.3014984130859375, -0.292449951171875, -0.2834014892578125, -0.27435302734375, -0.2653045654296875, -0.256256103515625, -0.2472076416015625, -0.2381591796875, -0.2291107177734375, -0.220062255859375, -0.2110137939453125, -0.20196533203125, -0.1929168701171875, -0.183868408203125, -0.1748199462890625, -0.165771484375, -0.1567230224609375, -0.147674560546875, -0.1386260986328125, -0.12957763671875, -0.1205291748046875, -0.111480712890625, -0.1024322509765625, -0.0933837890625, -0.0843353271484375, -0.075286865234375, -0.0662384033203125, -0.05718994140625, -0.0481414794921875, -0.039093017578125, -0.0300445556640625, -0.02099609375, -0.0119476318359375, -0.002899169921875, 0.0061492919921875, 0.01519775390625, 0.0242462158203125, 0.033294677734375, 0.0423431396484375, 0.0513916015625, 0.0604400634765625, 0.069488525390625, 0.0785369873046875, 0.08758544921875, 0.0966339111328125, 0.105682373046875, 0.1147308349609375, 0.123779296875, 0.1328277587890625, 0.141876220703125, 0.1509246826171875, 0.15997314453125, 0.1690216064453125, 0.178070068359375, 0.1871185302734375, 0.1961669921875, 0.2052154541015625, 0.214263916015625, 0.2233123779296875, 0.23236083984375, 0.2414093017578125, 0.250457763671875, 0.2595062255859375, 0.2685546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 2.0, 9.0, 16.0, 15.0, 11.0, 25.0, 16.0, 19.0, 32.0, 32.0, 29.0, 49.0, 52.0, 42.0, 36.0, 48.0, 59.0, 43.0, 63.0, 53.0, 39.0, 35.0, 39.0, 38.0, 37.0, 19.0, 20.0, 22.0, 21.0, 21.0, 13.0, 12.0, 7.0, 6.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2861328125, -0.27712249755859375, -0.2681121826171875, -0.25910186767578125, -0.250091552734375, -0.24108123779296875, -0.2320709228515625, -0.22306060791015625, -0.21405029296875, -0.20503997802734375, -0.1960296630859375, -0.18701934814453125, -0.178009033203125, -0.16899871826171875, -0.1599884033203125, -0.15097808837890625, -0.1419677734375, -0.13295745849609375, -0.1239471435546875, -0.11493682861328125, -0.105926513671875, -0.09691619873046875, -0.0879058837890625, -0.07889556884765625, -0.06988525390625, -0.06087493896484375, -0.0518646240234375, -0.04285430908203125, -0.033843994140625, -0.02483367919921875, -0.0158233642578125, -0.00681304931640625, 0.002197265625, 0.01120758056640625, 0.0202178955078125, 0.02922821044921875, 0.038238525390625, 0.04724884033203125, 0.0562591552734375, 0.06526947021484375, 0.07427978515625, 0.08329010009765625, 0.0923004150390625, 0.10131072998046875, 0.110321044921875, 0.11933135986328125, 0.1283416748046875, 0.13735198974609375, 0.1463623046875, 0.15537261962890625, 0.1643829345703125, 0.17339324951171875, 0.182403564453125, 0.19141387939453125, 0.2004241943359375, 0.20943450927734375, 0.21844482421875, 0.22745513916015625, 0.2364654541015625, 0.24547576904296875, 0.254486083984375, 0.26349639892578125, 0.2725067138671875, 0.28151702880859375, 0.29052734375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 8.0, 9.0, 15.0, 16.0, 18.0, 29.0, 54.0, 54.0, 121.0, 139.0, 187.0, 339.0, 525.0, 782.0, 1247.0, 1838.0, 2955.0, 4394.0, 7070.0, 11623.0, 18558.0, 31072.0, 56238.0, 123253.0, 284180.0, 264043.0, 111059.0, 52534.0, 29092.0, 17453.0, 10805.0, 6755.0, 4312.0, 2743.0, 1744.0, 1131.0, 747.0, 477.0, 326.0, 184.0, 132.0, 73.0, 74.0, 39.0, 31.0, 23.0, 13.0, 16.0, 4.0, 2.0, 2.0, 6.0, 5.0, 0.0, 3.0, 1.0], "bins": [-0.052947998046875, -0.051340579986572266, -0.04973316192626953, -0.0481257438659668, -0.04651832580566406, -0.04491090774536133, -0.043303489685058594, -0.04169607162475586, -0.040088653564453125, -0.03848123550415039, -0.036873817443847656, -0.03526639938354492, -0.03365898132324219, -0.03205156326293945, -0.03044414520263672, -0.028836727142333984, -0.02722930908203125, -0.025621891021728516, -0.02401447296142578, -0.022407054901123047, -0.020799636840820312, -0.019192218780517578, -0.017584800720214844, -0.01597738265991211, -0.014369964599609375, -0.01276254653930664, -0.011155128479003906, -0.009547710418701172, -0.007940292358398438, -0.006332874298095703, -0.004725456237792969, -0.0031180381774902344, -0.0015106201171875, 9.679794311523438e-05, 0.0017042160034179688, 0.003311634063720703, 0.0049190521240234375, 0.006526470184326172, 0.008133888244628906, 0.00974130630493164, 0.011348724365234375, 0.01295614242553711, 0.014563560485839844, 0.016170978546142578, 0.017778396606445312, 0.019385814666748047, 0.02099323272705078, 0.022600650787353516, 0.02420806884765625, 0.025815486907958984, 0.02742290496826172, 0.029030323028564453, 0.030637741088867188, 0.03224515914916992, 0.033852577209472656, 0.03545999526977539, 0.037067413330078125, 0.03867483139038086, 0.040282249450683594, 0.04188966751098633, 0.04349708557128906, 0.0451045036315918, 0.04671192169189453, 0.048319339752197266, 0.0499267578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 3.0, 4.0, 8.0, 9.0, 11.0, 9.0, 22.0, 23.0, 55.0, 78.0, 159.0, 137.0, 161.0, 96.0, 58.0, 44.0, 24.0, 16.0, 14.0, 19.0, 8.0, 10.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.540515899658203e-05, -3.441330045461655e-05, -3.342144191265106e-05, -3.242958337068558e-05, -3.143772482872009e-05, -3.0445866286754608e-05, -2.9454007744789124e-05, -2.846214920282364e-05, -2.7470290660858154e-05, -2.647843211889267e-05, -2.5486573576927185e-05, -2.44947150349617e-05, -2.3502856492996216e-05, -2.251099795103073e-05, -2.1519139409065247e-05, -2.0527280867099762e-05, -1.9535422325134277e-05, -1.8543563783168793e-05, -1.7551705241203308e-05, -1.6559846699237823e-05, -1.556798815727234e-05, -1.4576129615306854e-05, -1.358427107334137e-05, -1.2592412531375885e-05, -1.16005539894104e-05, -1.0608695447444916e-05, -9.616836905479431e-06, -8.624978363513947e-06, -7.633119821548462e-06, -6.641261279582977e-06, -5.649402737617493e-06, -4.657544195652008e-06, -3.6656856536865234e-06, -2.673827111721039e-06, -1.6819685697555542e-06, -6.901100277900696e-07, 3.0174851417541504e-07, 1.2936070561408997e-06, 2.2854655981063843e-06, 3.277324140071869e-06, 4.2691826820373535e-06, 5.261041224002838e-06, 6.252899765968323e-06, 7.244758307933807e-06, 8.236616849899292e-06, 9.228475391864777e-06, 1.0220333933830261e-05, 1.1212192475795746e-05, 1.220405101776123e-05, 1.3195909559726715e-05, 1.41877681016922e-05, 1.5179626643657684e-05, 1.617148518562317e-05, 1.7163343727588654e-05, 1.8155202269554138e-05, 1.9147060811519623e-05, 2.0138919353485107e-05, 2.1130777895450592e-05, 2.2122636437416077e-05, 2.311449497938156e-05, 2.4106353521347046e-05, 2.509821206331253e-05, 2.6090070605278015e-05, 2.70819291472435e-05, 2.8073787689208984e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 7.0, 15.0, 19.0, 31.0, 44.0, 57.0, 96.0, 149.0, 246.0, 400.0, 669.0, 1231.0, 2260.0, 4333.0, 8595.0, 17218.0, 36464.0, 83355.0, 218101.0, 358578.0, 182393.0, 71234.0, 31776.0, 15192.0, 7555.0, 3814.0, 1957.0, 1122.0, 612.0, 372.0, 247.0, 139.0, 97.0, 60.0, 38.0, 22.0, 17.0, 10.0, 6.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06536865234375, -0.06335163116455078, -0.06133460998535156, -0.059317588806152344, -0.057300567626953125, -0.055283546447753906, -0.05326652526855469, -0.05124950408935547, -0.04923248291015625, -0.04721546173095703, -0.04519844055175781, -0.043181419372558594, -0.041164398193359375, -0.039147377014160156, -0.03713035583496094, -0.03511333465576172, -0.0330963134765625, -0.03107929229736328, -0.029062271118164062, -0.027045249938964844, -0.025028228759765625, -0.023011207580566406, -0.020994186401367188, -0.01897716522216797, -0.01696014404296875, -0.014943122863769531, -0.012926101684570312, -0.010909080505371094, -0.008892059326171875, -0.006875038146972656, -0.0048580169677734375, -0.0028409957885742188, -0.000823974609375, 0.0011930465698242188, 0.0032100677490234375, 0.005227088928222656, 0.007244110107421875, 0.009261131286621094, 0.011278152465820312, 0.013295173645019531, 0.01531219482421875, 0.01732921600341797, 0.019346237182617188, 0.021363258361816406, 0.023380279541015625, 0.025397300720214844, 0.027414321899414062, 0.02943134307861328, 0.0314483642578125, 0.03346538543701172, 0.03548240661621094, 0.037499427795410156, 0.039516448974609375, 0.041533470153808594, 0.04355049133300781, 0.04556751251220703, 0.04758453369140625, 0.04960155487060547, 0.05161857604980469, 0.053635597229003906, 0.055652618408203125, 0.057669639587402344, 0.05968666076660156, 0.06170368194580078, 0.063720703125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 10.0, 6.0, 10.0, 12.0, 18.0, 20.0, 28.0, 28.0, 31.0, 50.0, 63.0, 80.0, 75.0, 81.0, 84.0, 91.0, 50.0, 43.0, 35.0, 27.0, 19.0, 17.0, 16.0, 15.0, 9.0, 11.0, 9.0, 9.0, 4.0, 3.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0], "bins": [-0.07879638671875, -0.07663297653198242, -0.07446956634521484, -0.07230615615844727, -0.07014274597167969, -0.06797933578491211, -0.06581592559814453, -0.06365251541137695, -0.061489105224609375, -0.0593256950378418, -0.05716228485107422, -0.05499887466430664, -0.05283546447753906, -0.050672054290771484, -0.048508644104003906, -0.04634523391723633, -0.04418182373046875, -0.04201841354370117, -0.039855003356933594, -0.037691593170166016, -0.03552818298339844, -0.03336477279663086, -0.03120136260986328, -0.029037952423095703, -0.026874542236328125, -0.024711132049560547, -0.02254772186279297, -0.02038431167602539, -0.018220901489257812, -0.016057491302490234, -0.013894081115722656, -0.011730670928955078, -0.0095672607421875, -0.007403850555419922, -0.005240440368652344, -0.0030770301818847656, -0.0009136199951171875, 0.0012497901916503906, 0.0034132003784179688, 0.005576610565185547, 0.007740020751953125, 0.009903430938720703, 0.012066841125488281, 0.01423025131225586, 0.016393661499023438, 0.018557071685791016, 0.020720481872558594, 0.022883892059326172, 0.02504730224609375, 0.027210712432861328, 0.029374122619628906, 0.031537532806396484, 0.03370094299316406, 0.03586435317993164, 0.03802776336669922, 0.0401911735534668, 0.042354583740234375, 0.04451799392700195, 0.04668140411376953, 0.04884481430053711, 0.05100822448730469, 0.053171634674072266, 0.055335044860839844, 0.05749845504760742, 0.059661865234375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 10.0, 16.0, 60.0, 147.0, 229.0, 225.0, 174.0, 81.0, 35.0, 13.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8842415809631348, -2.815929889678955, -2.7476184368133545, -2.679306745529175, -2.610995292663574, -2.5426836013793945, -2.474371910095215, -2.4060604572296143, -2.3377487659454346, -2.269437074661255, -2.2011256217956543, -2.1328139305114746, -2.064502477645874, -1.9961907863616943, -1.9278792142868042, -1.859567642211914, -1.791256070137024, -1.7229444980621338, -1.6546329259872437, -1.5863213539123535, -1.5180096626281738, -1.4496980905532837, -1.3813865184783936, -1.3130749464035034, -1.2447633743286133, -1.1764518022537231, -1.108140230178833, -1.0398285388946533, -0.9715169668197632, -0.903205394744873, -0.8348938226699829, -0.7665822505950928, -0.6982705593109131, -0.629958987236023, -0.561647355556488, -0.4933357834815979, -0.4250241816043854, -0.35671257972717285, -0.2884010076522827, -0.2200894057750702, -0.15177780389785767, -0.08346620947122574, -0.015154615044593811, 0.05315697193145752, 0.12146857380867004, 0.18978017568588257, 0.2580917477607727, 0.32640334963798523, 0.39471495151519775, 0.4630265533924103, 0.5313381552696228, 0.5996497273445129, 0.6679613590240479, 0.736272931098938, 0.8045845031738281, 0.8728960752487183, 0.9412077069282532, 1.009519338607788, 1.0778309106826782, 1.1461424827575684, 1.2144540548324585, 1.2827656269073486, 1.3510773181915283, 1.4193888902664185, 1.4877004623413086]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 5.0, 2.0, 5.0, 0.0, 11.0, 7.0, 17.0, 13.0, 15.0, 18.0, 29.0, 32.0, 29.0, 33.0, 26.0, 35.0, 33.0, 35.0, 34.0, 48.0, 35.0, 42.0, 39.0, 39.0, 41.0, 40.0, 33.0, 38.0, 34.0, 31.0, 29.0, 24.0, 14.0, 19.0, 18.0, 23.0, 12.0, 11.0, 4.0, 12.0, 8.0, 8.0, 5.0, 6.0, 2.0, 6.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.6708263754844666, -0.6509302854537964, -0.6310341954231262, -0.611138105392456, -0.5912420749664307, -0.5713459849357605, -0.5514498949050903, -0.5315538048744202, -0.51165771484375, -0.49176162481307983, -0.47186556458473206, -0.4519694745540619, -0.4320733845233917, -0.41217732429504395, -0.3922812342643738, -0.3723851442337036, -0.35248908400535583, -0.33259299397468567, -0.3126969337463379, -0.2928008437156677, -0.27290475368499756, -0.2530086636543274, -0.23311260342597961, -0.21321651339530945, -0.19332043826580048, -0.1734243631362915, -0.15352827310562134, -0.13363219797611237, -0.1137361153960228, -0.09384003281593323, -0.07394395768642426, -0.05404786765575409, -0.03415179252624512, -0.014255711808800697, 0.0056403689086437225, 0.025536447763442993, 0.04543253034353256, 0.06532861292362213, 0.0852246880531311, 0.10512077808380127, 0.12501685321331024, 0.1449129283428192, 0.16480901837348938, 0.18470509350299835, 0.20460116863250732, 0.2244972586631775, 0.24439333379268646, 0.2642894387245178, 0.2841854989528656, 0.30408158898353577, 0.32397764921188354, 0.3438737392425537, 0.3637698292732239, 0.38366591930389404, 0.4035619795322418, 0.423458069562912, 0.44335412979125977, 0.46325021982192993, 0.4831462800502777, 0.5030423402786255, 0.5229384303092957, 0.5428345203399658, 0.562730610370636, 0.5826267004013062, 0.6025227904319763]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 17.0, 19.0, 21.0, 39.0, 51.0, 86.0, 117.0, 221.0, 353.0, 544.0, 973.0, 1591.0, 2685.0, 4714.0, 8137.0, 14462.0, 25656.0, 45262.0, 81662.0, 150925.0, 289897.0, 599405.0, 1077684.0, 929627.0, 464698.0, 227254.0, 119435.0, 64946.0, 36337.0, 20274.0, 11202.0, 6635.0, 3828.0, 2194.0, 1281.0, 806.0, 464.0, 294.0, 161.0, 118.0, 70.0, 51.0, 40.0, 18.0, 11.0, 6.0, 2.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.066162109375, -0.06394290924072266, -0.06172370910644531, -0.05950450897216797, -0.057285308837890625, -0.05506610870361328, -0.05284690856933594, -0.050627708435058594, -0.04840850830078125, -0.046189308166503906, -0.04397010803222656, -0.04175090789794922, -0.039531707763671875, -0.03731250762939453, -0.03509330749511719, -0.032874107360839844, -0.0306549072265625, -0.028435707092285156, -0.026216506958007812, -0.02399730682373047, -0.021778106689453125, -0.01955890655517578, -0.017339706420898438, -0.015120506286621094, -0.01290130615234375, -0.010682106018066406, -0.008462905883789062, -0.006243705749511719, -0.004024505615234375, -0.0018053054809570312, 0.0004138946533203125, 0.0026330947875976562, 0.004852294921875, 0.007071495056152344, 0.009290695190429688, 0.011509895324707031, 0.013729095458984375, 0.01594829559326172, 0.018167495727539062, 0.020386695861816406, 0.02260589599609375, 0.024825096130371094, 0.027044296264648438, 0.02926349639892578, 0.031482696533203125, 0.03370189666748047, 0.03592109680175781, 0.038140296936035156, 0.0403594970703125, 0.042578697204589844, 0.04479789733886719, 0.04701709747314453, 0.049236297607421875, 0.05145549774169922, 0.05367469787597656, 0.055893898010253906, 0.05811309814453125, 0.060332298278808594, 0.06255149841308594, 0.06477069854736328, 0.06698989868164062, 0.06920909881591797, 0.07142829895019531, 0.07364749908447266, 0.07586669921875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 11.0, 4.0, 7.0, 13.0, 10.0, 12.0, 15.0, 26.0, 28.0, 21.0, 34.0, 24.0, 24.0, 33.0, 37.0, 42.0, 44.0, 38.0, 33.0, 36.0, 43.0, 42.0, 32.0, 37.0, 38.0, 41.0, 23.0, 39.0, 28.0, 35.0, 15.0, 19.0, 20.0, 15.0, 10.0, 11.0, 14.0, 10.0, 8.0, 10.0, 5.0, 7.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0701904296875, -0.06787872314453125, -0.0655670166015625, -0.06325531005859375, -0.060943603515625, -0.05863189697265625, -0.0563201904296875, -0.05400848388671875, -0.05169677734375, -0.04938507080078125, -0.0470733642578125, -0.04476165771484375, -0.042449951171875, -0.04013824462890625, -0.0378265380859375, -0.03551483154296875, -0.033203125, -0.03089141845703125, -0.0285797119140625, -0.02626800537109375, -0.023956298828125, -0.02164459228515625, -0.0193328857421875, -0.01702117919921875, -0.01470947265625, -0.01239776611328125, -0.0100860595703125, -0.00777435302734375, -0.005462646484375, -0.00315093994140625, -0.0008392333984375, 0.00147247314453125, 0.0037841796875, 0.00609588623046875, 0.0084075927734375, 0.01071929931640625, 0.013031005859375, 0.01534271240234375, 0.0176544189453125, 0.01996612548828125, 0.02227783203125, 0.02458953857421875, 0.0269012451171875, 0.02921295166015625, 0.031524658203125, 0.03383636474609375, 0.0361480712890625, 0.03845977783203125, 0.040771484375, 0.04308319091796875, 0.0453948974609375, 0.04770660400390625, 0.050018310546875, 0.05233001708984375, 0.0546417236328125, 0.05695343017578125, 0.05926513671875, 0.06157684326171875, 0.0638885498046875, 0.06620025634765625, 0.068511962890625, 0.07082366943359375, 0.0731353759765625, 0.07544708251953125, 0.0777587890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 14.0, 29.0, 39.0, 74.0, 125.0, 257.0, 489.0, 994.0, 2397.0, 7577.0, 34346.0, 189735.0, 1437499.0, 2175971.0, 280615.0, 48357.0, 10415.0, 3066.0, 1156.0, 509.0, 277.0, 149.0, 65.0, 54.0, 27.0, 13.0, 10.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.295166015625, -0.2869911193847656, -0.27881622314453125, -0.2706413269042969, -0.2624664306640625, -0.2542915344238281, -0.24611663818359375, -0.23794174194335938, -0.229766845703125, -0.22159194946289062, -0.21341705322265625, -0.20524215698242188, -0.1970672607421875, -0.18889236450195312, -0.18071746826171875, -0.17254257202148438, -0.16436767578125, -0.15619277954101562, -0.14801788330078125, -0.13984298706054688, -0.1316680908203125, -0.12349319458007812, -0.11531829833984375, -0.10714340209960938, -0.098968505859375, -0.09079360961914062, -0.08261871337890625, -0.07444381713867188, -0.0662689208984375, -0.058094024658203125, -0.04991912841796875, -0.041744232177734375, -0.0335693359375, -0.025394439697265625, -0.01721954345703125, -0.009044647216796875, -0.0008697509765625, 0.007305145263671875, 0.01548004150390625, 0.023654937744140625, 0.031829833984375, 0.040004730224609375, 0.04817962646484375, 0.056354522705078125, 0.0645294189453125, 0.07270431518554688, 0.08087921142578125, 0.08905410766601562, 0.09722900390625, 0.10540390014648438, 0.11357879638671875, 0.12175369262695312, 0.1299285888671875, 0.13810348510742188, 0.14627838134765625, 0.15445327758789062, 0.162628173828125, 0.17080307006835938, 0.17897796630859375, 0.18715286254882812, 0.1953277587890625, 0.20350265502929688, 0.21167755126953125, 0.21985244750976562, 0.22802734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 9.0, 2.0, 5.0, 10.0, 10.0, 20.0, 14.0, 22.0, 46.0, 58.0, 55.0, 89.0, 132.0, 185.0, 237.0, 343.0, 493.0, 613.0, 501.0, 353.0, 240.0, 179.0, 107.0, 98.0, 53.0, 53.0, 45.0, 18.0, 14.0, 17.0, 12.0, 14.0, 16.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193359375, -0.187408447265625, -0.18145751953125, -0.175506591796875, -0.1695556640625, -0.163604736328125, -0.15765380859375, -0.151702880859375, -0.145751953125, -0.139801025390625, -0.13385009765625, -0.127899169921875, -0.1219482421875, -0.115997314453125, -0.11004638671875, -0.104095458984375, -0.09814453125, -0.092193603515625, -0.08624267578125, -0.080291748046875, -0.0743408203125, -0.068389892578125, -0.06243896484375, -0.056488037109375, -0.050537109375, -0.044586181640625, -0.03863525390625, -0.032684326171875, -0.0267333984375, -0.020782470703125, -0.01483154296875, -0.008880615234375, -0.0029296875, 0.003021240234375, 0.00897216796875, 0.014923095703125, 0.0208740234375, 0.026824951171875, 0.03277587890625, 0.038726806640625, 0.044677734375, 0.050628662109375, 0.05657958984375, 0.062530517578125, 0.0684814453125, 0.074432373046875, 0.08038330078125, 0.086334228515625, 0.09228515625, 0.098236083984375, 0.10418701171875, 0.110137939453125, 0.1160888671875, 0.122039794921875, 0.12799072265625, 0.133941650390625, 0.139892578125, 0.145843505859375, 0.15179443359375, 0.157745361328125, 0.1636962890625, 0.169647216796875, 0.17559814453125, 0.181549072265625, 0.1875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 12.0, 13.0, 23.0, 31.0, 58.0, 78.0, 106.0, 135.0, 121.0, 126.0, 108.0, 62.0, 47.0, 27.0, 23.0, 11.0, 6.0, 1.0, 6.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.3622791767120361, -1.3215593099594116, -1.280839443206787, -1.2401195764541626, -1.199399709701538, -1.1586799621582031, -1.1179600954055786, -1.077240228652954, -1.0365203619003296, -0.9958004951477051, -0.9550806283950806, -0.9143608212471008, -0.8736409544944763, -0.8329210877418518, -0.7922012805938721, -0.7514814138412476, -0.710761547088623, -0.6700416803359985, -0.629321813583374, -0.5886020064353943, -0.5478821396827698, -0.5071622729301453, -0.46644243597984314, -0.425722599029541, -0.3850027322769165, -0.344282865524292, -0.30356302857398987, -0.26284319162368774, -0.22212332487106323, -0.18140347301959991, -0.1406836211681366, -0.09996378421783447, -0.05924391746520996, -0.018524065613746643, 0.022195786237716675, 0.06291563808917999, 0.10363548994064331, 0.14435534179210663, 0.18507519364356995, 0.22579503059387207, 0.2665148973464966, 0.3072347640991211, 0.3479546010494232, 0.38867443799972534, 0.42939430475234985, 0.47011417150497437, 0.5108339786529541, 0.5515538454055786, 0.5922737121582031, 0.6329935789108276, 0.6737134456634521, 0.7144332528114319, 0.7551531195640564, 0.7958729863166809, 0.8365927934646606, 0.8773126602172852, 0.9180325269699097, 0.9587523937225342, 0.9994722604751587, 1.0401921272277832, 1.0809118747711182, 1.1216317415237427, 1.1623516082763672, 1.2030714750289917, 1.2437913417816162]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 4.0, 8.0, 18.0, 14.0, 15.0, 29.0, 26.0, 25.0, 19.0, 42.0, 21.0, 35.0, 44.0, 35.0, 53.0, 42.0, 35.0, 48.0, 37.0, 49.0, 54.0, 41.0, 40.0, 45.0, 30.0, 35.0, 17.0, 23.0, 21.0, 20.0, 11.0, 10.0, 10.0, 6.0, 12.0, 6.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5831884145736694, -0.5626325607299805, -0.5420767664909363, -0.5215209126472473, -0.5009650588035583, -0.4804092347621918, -0.4598534107208252, -0.43929755687713623, -0.41874173283576965, -0.3981859087944031, -0.3776300549507141, -0.35707423090934753, -0.33651840686798096, -0.315962553024292, -0.2954067289829254, -0.27485090494155884, -0.2542950510978699, -0.2337392121553421, -0.21318337321281433, -0.19262754917144775, -0.17207171022891998, -0.1515158712863922, -0.13096004724502563, -0.11040420830249786, -0.08984836935997009, -0.06929253041744232, -0.04873669892549515, -0.028180863708257675, -0.007625028491020203, 0.012930810451507568, 0.03348664194345474, 0.054042473435401917, 0.07459837198257446, 0.09515421092510223, 0.11571004241704941, 0.13626587390899658, 0.15682171285152435, 0.17737755179405212, 0.1979333758354187, 0.21848921477794647, 0.23904505372047424, 0.2596008777618408, 0.2801567316055298, 0.30071255564689636, 0.32126837968826294, 0.3418242335319519, 0.3623800575733185, 0.38293588161468506, 0.403491735458374, 0.4240475594997406, 0.44460341334342957, 0.46515923738479614, 0.4857150912284851, 0.5062708854675293, 0.5268267393112183, 0.5473825931549072, 0.5679384469985962, 0.5884943008422852, 0.6090500950813293, 0.6296059489250183, 0.6501618027687073, 0.6707175970077515, 0.6912734508514404, 0.7118293046951294, 0.7323850989341736]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 8.0, 6.0, 17.0, 23.0, 31.0, 53.0, 73.0, 106.0, 159.0, 208.0, 310.0, 437.0, 654.0, 943.0, 1438.0, 2169.0, 3124.0, 4574.0, 6698.0, 9968.0, 14806.0, 22622.0, 37099.0, 68335.0, 139091.0, 241110.0, 221279.0, 118838.0, 59051.0, 32938.0, 20491.0, 13439.0, 9067.0, 6222.0, 4126.0, 2884.0, 1985.0, 1299.0, 924.0, 626.0, 435.0, 293.0, 197.0, 124.0, 87.0, 62.0, 46.0, 26.0, 17.0, 14.0, 15.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11529541015625, -0.11178970336914062, -0.10828399658203125, -0.10477828979492188, -0.1012725830078125, -0.09776687622070312, -0.09426116943359375, -0.09075546264648438, -0.087249755859375, -0.08374404907226562, -0.08023834228515625, -0.07673263549804688, -0.0732269287109375, -0.06972122192382812, -0.06621551513671875, -0.06270980834960938, -0.0592041015625, -0.055698394775390625, -0.05219268798828125, -0.048686981201171875, -0.0451812744140625, -0.041675567626953125, -0.03816986083984375, -0.034664154052734375, -0.031158447265625, -0.027652740478515625, -0.02414703369140625, -0.020641326904296875, -0.0171356201171875, -0.013629913330078125, -0.01012420654296875, -0.006618499755859375, -0.00311279296875, 0.000392913818359375, 0.00389862060546875, 0.007404327392578125, 0.0109100341796875, 0.014415740966796875, 0.01792144775390625, 0.021427154541015625, 0.024932861328125, 0.028438568115234375, 0.03194427490234375, 0.035449981689453125, 0.0389556884765625, 0.042461395263671875, 0.04596710205078125, 0.049472808837890625, 0.052978515625, 0.056484222412109375, 0.05998992919921875, 0.06349563598632812, 0.0670013427734375, 0.07050704956054688, 0.07401275634765625, 0.07751846313476562, 0.081024169921875, 0.08452987670898438, 0.08803558349609375, 0.09154129028320312, 0.0950469970703125, 0.09855270385742188, 0.10205841064453125, 0.10556411743164062, 0.10906982421875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 10.0, 8.0, 9.0, 4.0, 19.0, 21.0, 21.0, 29.0, 30.0, 23.0, 24.0, 40.0, 33.0, 38.0, 41.0, 35.0, 45.0, 45.0, 63.0, 39.0, 45.0, 42.0, 47.0, 45.0, 41.0, 33.0, 29.0, 26.0, 23.0, 15.0, 11.0, 11.0, 11.0, 7.0, 4.0, 6.0, 8.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.069091796875, -0.06643199920654297, -0.06377220153808594, -0.061112403869628906, -0.058452606201171875, -0.055792808532714844, -0.05313301086425781, -0.05047321319580078, -0.04781341552734375, -0.04515361785888672, -0.04249382019042969, -0.039834022521972656, -0.037174224853515625, -0.034514427185058594, -0.03185462951660156, -0.02919483184814453, -0.0265350341796875, -0.02387523651123047, -0.021215438842773438, -0.018555641174316406, -0.015895843505859375, -0.013236045837402344, -0.010576248168945312, -0.007916450500488281, -0.00525665283203125, -0.0025968551635742188, 6.29425048828125e-05, 0.0027227401733398438, 0.005382537841796875, 0.008042335510253906, 0.010702133178710938, 0.013361930847167969, 0.016021728515625, 0.01868152618408203, 0.021341323852539062, 0.024001121520996094, 0.026660919189453125, 0.029320716857910156, 0.03198051452636719, 0.03464031219482422, 0.03730010986328125, 0.03995990753173828, 0.04261970520019531, 0.045279502868652344, 0.047939300537109375, 0.050599098205566406, 0.05325889587402344, 0.05591869354248047, 0.0585784912109375, 0.06123828887939453, 0.06389808654785156, 0.0665578842163086, 0.06921768188476562, 0.07187747955322266, 0.07453727722167969, 0.07719707489013672, 0.07985687255859375, 0.08251667022705078, 0.08517646789550781, 0.08783626556396484, 0.09049606323242188, 0.0931558609008789, 0.09581565856933594, 0.09847545623779297, 0.10113525390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 1.0, 11.0, 11.0, 11.0, 23.0, 26.0, 45.0, 66.0, 69.0, 107.0, 197.0, 282.0, 440.0, 833.0, 1681.0, 3450.0, 7884.0, 17668.0, 42228.0, 124905.0, 439753.0, 281300.0, 75320.0, 28709.0, 12533.0, 5463.0, 2523.0, 1271.0, 667.0, 385.0, 225.0, 161.0, 95.0, 61.0, 39.0, 27.0, 25.0, 15.0, 14.0, 7.0, 3.0, 2.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.223388671875, -0.21657562255859375, -0.2097625732421875, -0.20294952392578125, -0.196136474609375, -0.18932342529296875, -0.1825103759765625, -0.17569732666015625, -0.16888427734375, -0.16207122802734375, -0.1552581787109375, -0.14844512939453125, -0.141632080078125, -0.13481903076171875, -0.1280059814453125, -0.12119293212890625, -0.1143798828125, -0.10756683349609375, -0.1007537841796875, -0.09394073486328125, -0.087127685546875, -0.08031463623046875, -0.0735015869140625, -0.06668853759765625, -0.05987548828125, -0.05306243896484375, -0.0462493896484375, -0.03943634033203125, -0.032623291015625, -0.02581024169921875, -0.0189971923828125, -0.01218414306640625, -0.00537109375, 0.00144195556640625, 0.0082550048828125, 0.01506805419921875, 0.021881103515625, 0.02869415283203125, 0.0355072021484375, 0.04232025146484375, 0.04913330078125, 0.05594635009765625, 0.0627593994140625, 0.06957244873046875, 0.076385498046875, 0.08319854736328125, 0.0900115966796875, 0.09682464599609375, 0.1036376953125, 0.11045074462890625, 0.1172637939453125, 0.12407684326171875, 0.130889892578125, 0.13770294189453125, 0.1445159912109375, 0.15132904052734375, 0.15814208984375, 0.16495513916015625, 0.1717681884765625, 0.17858123779296875, 0.185394287109375, 0.19220733642578125, 0.1990203857421875, 0.20583343505859375, 0.212646484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 4.0, 8.0, 12.0, 12.0, 6.0, 18.0, 20.0, 23.0, 15.0, 40.0, 32.0, 30.0, 37.0, 30.0, 52.0, 48.0, 52.0, 57.0, 53.0, 54.0, 58.0, 41.0, 44.0, 29.0, 38.0, 34.0, 34.0, 24.0, 16.0, 7.0, 12.0, 12.0, 11.0, 11.0, 6.0, 5.0, 5.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2666015625, -0.2583045959472656, -0.25000762939453125, -0.24171066284179688, -0.2334136962890625, -0.22511672973632812, -0.21681976318359375, -0.20852279663085938, -0.200225830078125, -0.19192886352539062, -0.18363189697265625, -0.17533493041992188, -0.1670379638671875, -0.15874099731445312, -0.15044403076171875, -0.14214706420898438, -0.13385009765625, -0.12555313110351562, -0.11725616455078125, -0.10895919799804688, -0.1006622314453125, -0.09236526489257812, -0.08406829833984375, -0.07577133178710938, -0.067474365234375, -0.059177398681640625, -0.05088043212890625, -0.042583465576171875, -0.0342864990234375, -0.025989532470703125, -0.01769256591796875, -0.009395599365234375, -0.0010986328125, 0.007198333740234375, 0.01549530029296875, 0.023792266845703125, 0.0320892333984375, 0.040386199951171875, 0.04868316650390625, 0.056980133056640625, 0.065277099609375, 0.07357406616210938, 0.08187103271484375, 0.09016799926757812, 0.0984649658203125, 0.10676193237304688, 0.11505889892578125, 0.12335586547851562, 0.13165283203125, 0.13994979858398438, 0.14824676513671875, 0.15654373168945312, 0.1648406982421875, 0.17313766479492188, 0.18143463134765625, 0.18973159790039062, 0.198028564453125, 0.20632553100585938, 0.21462249755859375, 0.22291946411132812, 0.2312164306640625, 0.23951339721679688, 0.24781036376953125, 0.2561073303222656, 0.264404296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 14.0, 13.0, 16.0, 32.0, 43.0, 78.0, 141.0, 305.0, 711.0, 1771.0, 4801.0, 12391.0, 34482.0, 115677.0, 507921.0, 272716.0, 62886.0, 21379.0, 8032.0, 3046.0, 1109.0, 480.0, 235.0, 111.0, 57.0, 34.0, 23.0, 17.0, 17.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1375732421875, -0.1337270736694336, -0.1298809051513672, -0.12603473663330078, -0.12218856811523438, -0.11834239959716797, -0.11449623107910156, -0.11065006256103516, -0.10680389404296875, -0.10295772552490234, -0.09911155700683594, -0.09526538848876953, -0.09141921997070312, -0.08757305145263672, -0.08372688293457031, -0.0798807144165039, -0.0760345458984375, -0.0721883773803711, -0.06834220886230469, -0.06449604034423828, -0.060649871826171875, -0.05680370330810547, -0.05295753479003906, -0.049111366271972656, -0.04526519775390625, -0.041419029235839844, -0.03757286071777344, -0.03372669219970703, -0.029880523681640625, -0.02603435516357422, -0.022188186645507812, -0.018342018127441406, -0.014495849609375, -0.010649681091308594, -0.0068035125732421875, -0.0029573440551757812, 0.000888824462890625, 0.004734992980957031, 0.008581161499023438, 0.012427330017089844, 0.01627349853515625, 0.020119667053222656, 0.023965835571289062, 0.02781200408935547, 0.031658172607421875, 0.03550434112548828, 0.03935050964355469, 0.043196678161621094, 0.0470428466796875, 0.050889015197753906, 0.05473518371582031, 0.05858135223388672, 0.062427520751953125, 0.06627368927001953, 0.07011985778808594, 0.07396602630615234, 0.07781219482421875, 0.08165836334228516, 0.08550453186035156, 0.08935070037841797, 0.09319686889648438, 0.09704303741455078, 0.10088920593261719, 0.1047353744506836, 0.10858154296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 5.0, 12.0, 10.0, 8.0, 15.0, 13.0, 22.0, 41.0, 52.0, 97.0, 110.0, 129.0, 114.0, 99.0, 77.0, 49.0, 30.0, 34.0, 22.0, 15.0, 7.0, 6.0, 5.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.855062484741211e-05, -2.7528032660484314e-05, -2.650544047355652e-05, -2.5482848286628723e-05, -2.4460256099700928e-05, -2.3437663912773132e-05, -2.2415071725845337e-05, -2.139247953891754e-05, -2.0369887351989746e-05, -1.934729516506195e-05, -1.8324702978134155e-05, -1.730211079120636e-05, -1.6279518604278564e-05, -1.5256926417350769e-05, -1.4234334230422974e-05, -1.3211742043495178e-05, -1.2189149856567383e-05, -1.1166557669639587e-05, -1.0143965482711792e-05, -9.121373295783997e-06, -8.098781108856201e-06, -7.076188921928406e-06, -6.05359673500061e-06, -5.031004548072815e-06, -4.0084123611450195e-06, -2.985820174217224e-06, -1.9632279872894287e-06, -9.406358003616333e-07, 8.195638656616211e-08, 1.1045485734939575e-06, 2.127140760421753e-06, 3.1497329473495483e-06, 4.172325134277344e-06, 5.194917321205139e-06, 6.2175095081329346e-06, 7.24010169506073e-06, 8.262693881988525e-06, 9.28528606891632e-06, 1.0307878255844116e-05, 1.1330470442771912e-05, 1.2353062629699707e-05, 1.3375654816627502e-05, 1.4398247003555298e-05, 1.5420839190483093e-05, 1.644343137741089e-05, 1.7466023564338684e-05, 1.848861575126648e-05, 1.9511207938194275e-05, 2.053380012512207e-05, 2.1556392312049866e-05, 2.257898449897766e-05, 2.3601576685905457e-05, 2.4624168872833252e-05, 2.5646761059761047e-05, 2.6669353246688843e-05, 2.7691945433616638e-05, 2.8714537620544434e-05, 2.973712980747223e-05, 3.0759721994400024e-05, 3.178231418132782e-05, 3.2804906368255615e-05, 3.382749855518341e-05, 3.4850090742111206e-05, 3.5872682929039e-05, 3.68952751159668e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 8.0, 29.0, 27.0, 44.0, 76.0, 86.0, 175.0, 339.0, 601.0, 1398.0, 3048.0, 7333.0, 17776.0, 45452.0, 134253.0, 375192.0, 304112.0, 98619.0, 35414.0, 14177.0, 5614.0, 2454.0, 1076.0, 538.0, 283.0, 166.0, 96.0, 63.0, 33.0, 23.0, 16.0, 13.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0869140625, -0.08434772491455078, -0.08178138732910156, -0.07921504974365234, -0.07664871215820312, -0.0740823745727539, -0.07151603698730469, -0.06894969940185547, -0.06638336181640625, -0.06381702423095703, -0.06125068664550781, -0.058684349060058594, -0.056118011474609375, -0.053551673889160156, -0.05098533630371094, -0.04841899871826172, -0.0458526611328125, -0.04328632354736328, -0.04071998596191406, -0.038153648376464844, -0.035587310791015625, -0.033020973205566406, -0.030454635620117188, -0.02788829803466797, -0.02532196044921875, -0.02275562286376953, -0.020189285278320312, -0.017622947692871094, -0.015056610107421875, -0.012490272521972656, -0.009923934936523438, -0.007357597351074219, -0.004791259765625, -0.0022249221801757812, 0.0003414154052734375, 0.0029077529907226562, 0.005474090576171875, 0.008040428161621094, 0.010606765747070312, 0.013173103332519531, 0.01573944091796875, 0.01830577850341797, 0.020872116088867188, 0.023438453674316406, 0.026004791259765625, 0.028571128845214844, 0.031137466430664062, 0.03370380401611328, 0.0362701416015625, 0.03883647918701172, 0.04140281677246094, 0.043969154357910156, 0.046535491943359375, 0.049101829528808594, 0.05166816711425781, 0.05423450469970703, 0.05680084228515625, 0.05936717987060547, 0.06193351745605469, 0.0644998550415039, 0.06706619262695312, 0.06963253021240234, 0.07219886779785156, 0.07476520538330078, 0.07733154296875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 4.0, 8.0, 7.0, 5.0, 6.0, 14.0, 16.0, 20.0, 25.0, 15.0, 27.0, 30.0, 44.0, 39.0, 44.0, 70.0, 72.0, 75.0, 71.0, 61.0, 57.0, 50.0, 39.0, 44.0, 27.0, 24.0, 17.0, 21.0, 17.0, 5.0, 12.0, 5.0, 8.0, 5.0, 7.0, 3.0, 5.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.08160400390625, -0.07944250106811523, -0.07728099822998047, -0.0751194953918457, -0.07295799255371094, -0.07079648971557617, -0.0686349868774414, -0.06647348403930664, -0.06431198120117188, -0.06215047836303711, -0.059988975524902344, -0.05782747268676758, -0.05566596984863281, -0.05350446701049805, -0.05134296417236328, -0.049181461334228516, -0.04701995849609375, -0.044858455657958984, -0.04269695281982422, -0.04053544998168945, -0.03837394714355469, -0.03621244430541992, -0.034050941467285156, -0.03188943862915039, -0.029727935791015625, -0.02756643295288086, -0.025404930114746094, -0.023243427276611328, -0.021081924438476562, -0.018920421600341797, -0.01675891876220703, -0.014597415924072266, -0.0124359130859375, -0.010274410247802734, -0.008112907409667969, -0.005951404571533203, -0.0037899017333984375, -0.0016283988952636719, 0.0005331039428710938, 0.0026946067810058594, 0.004856109619140625, 0.007017612457275391, 0.009179115295410156, 0.011340618133544922, 0.013502120971679688, 0.015663623809814453, 0.01782512664794922, 0.019986629486083984, 0.02214813232421875, 0.024309635162353516, 0.02647113800048828, 0.028632640838623047, 0.030794143676757812, 0.03295564651489258, 0.035117149353027344, 0.03727865219116211, 0.039440155029296875, 0.04160165786743164, 0.043763160705566406, 0.04592466354370117, 0.04808616638183594, 0.0502476692199707, 0.05240917205810547, 0.054570674896240234, 0.056732177734375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 23.0, 38.0, 70.0, 95.0, 131.0, 140.0, 158.0, 137.0, 85.0, 51.0, 28.0, 18.0, 9.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6272348165512085, -0.5839220285415649, -0.5406093001365662, -0.497296541929245, -0.45398378372192383, -0.41067102551460266, -0.3673582673072815, -0.3240455090999603, -0.28073275089263916, -0.237419992685318, -0.19410723447799683, -0.15079447627067566, -0.10748171806335449, -0.06416895985603333, -0.020856201648712158, 0.02245655655860901, 0.06576931476593018, 0.10908207297325134, 0.1523948311805725, 0.19570758938789368, 0.23902034759521484, 0.282333105802536, 0.3256458640098572, 0.36895862221717834, 0.4122713804244995, 0.4555841386318207, 0.49889689683914185, 0.5422096252441406, 0.5855224132537842, 0.6288352012634277, 0.6721479296684265, 0.7154606580734253, 0.7587733268737793, 0.8020861148834229, 0.8453988432884216, 0.8887115716934204, 0.932024359703064, 0.9753371477127075, 1.0186498165130615, 1.061962604522705, 1.1052753925323486, 1.1485881805419922, 1.1919009685516357, 1.2352136373519897, 1.2785264253616333, 1.3218392133712769, 1.3651518821716309, 1.4084646701812744, 1.451777458190918, 1.4950902462005615, 1.538403034210205, 1.581715703010559, 1.6250284910202026, 1.6683412790298462, 1.7116539478302002, 1.7549667358398438, 1.7982795238494873, 1.8415923118591309, 1.8849050998687744, 1.9282177686691284, 1.971530556678772, 2.014843225479126, 2.0581560134887695, 2.101468801498413, 2.1447815895080566]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 13.0, 13.0, 19.0, 17.0, 17.0, 26.0, 14.0, 15.0, 24.0, 25.0, 28.0, 42.0, 26.0, 38.0, 31.0, 36.0, 39.0, 50.0, 31.0, 37.0, 44.0, 40.0, 41.0, 30.0, 21.0, 41.0, 17.0, 19.0, 21.0, 19.0, 19.0, 20.0, 16.0, 18.0, 12.0, 9.0, 6.0, 10.0, 8.0, 4.0, 8.0, 6.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.601394534111023, -0.5831962823867798, -0.5649980306625366, -0.5467997789382935, -0.5286015272140503, -0.5104032754898071, -0.49220502376556396, -0.4740067720413208, -0.45580852031707764, -0.4376102685928345, -0.4194120168685913, -0.40121376514434814, -0.383015513420105, -0.3648172616958618, -0.34661900997161865, -0.3284207582473755, -0.3102225065231323, -0.29202425479888916, -0.273826003074646, -0.25562775135040283, -0.23742949962615967, -0.2192312479019165, -0.20103299617767334, -0.18283474445343018, -0.164636492729187, -0.14643824100494385, -0.12823998928070068, -0.11004173755645752, -0.09184348583221436, -0.07364523410797119, -0.05544698238372803, -0.03724873065948486, -0.0190504789352417, -0.0008522272109985352, 0.01734602451324463, 0.03554427623748779, 0.05374252796173096, 0.07194077968597412, 0.09013903141021729, 0.10833728313446045, 0.1265355348587036, 0.14473378658294678, 0.16293203830718994, 0.1811302900314331, 0.19932854175567627, 0.21752679347991943, 0.2357250452041626, 0.25392329692840576, 0.2721215486526489, 0.2903198003768921, 0.30851805210113525, 0.3267163038253784, 0.3449145555496216, 0.36311280727386475, 0.3813110589981079, 0.3995093107223511, 0.41770756244659424, 0.4359058141708374, 0.45410406589508057, 0.47230231761932373, 0.4905005693435669, 0.5086988210678101, 0.5268970727920532, 0.5450953245162964, 0.5632935762405396]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 4.0, 9.0, 7.0, 15.0, 20.0, 24.0, 46.0, 70.0, 106.0, 177.0, 283.0, 484.0, 869.0, 1493.0, 2764.0, 5185.0, 10233.0, 20401.0, 41217.0, 83963.0, 179620.0, 425289.0, 1039763.0, 1293773.0, 616520.0, 248250.0, 113158.0, 54474.0, 27264.0, 13654.0, 6995.0, 3593.0, 1930.0, 1113.0, 584.0, 353.0, 231.0, 147.0, 76.0, 48.0, 33.0, 13.0, 9.0, 15.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07550048828125, -0.07291507720947266, -0.07032966613769531, -0.06774425506591797, -0.06515884399414062, -0.06257343292236328, -0.05998802185058594, -0.057402610778808594, -0.05481719970703125, -0.052231788635253906, -0.04964637756347656, -0.04706096649169922, -0.044475555419921875, -0.04189014434814453, -0.03930473327636719, -0.036719322204589844, -0.0341339111328125, -0.031548500061035156, -0.028963088989257812, -0.02637767791748047, -0.023792266845703125, -0.02120685577392578, -0.018621444702148438, -0.016036033630371094, -0.01345062255859375, -0.010865211486816406, -0.008279800415039062, -0.005694389343261719, -0.003108978271484375, -0.0005235671997070312, 0.0020618438720703125, 0.004647254943847656, 0.007232666015625, 0.009818077087402344, 0.012403488159179688, 0.014988899230957031, 0.017574310302734375, 0.02015972137451172, 0.022745132446289062, 0.025330543518066406, 0.02791595458984375, 0.030501365661621094, 0.03308677673339844, 0.03567218780517578, 0.038257598876953125, 0.04084300994873047, 0.04342842102050781, 0.046013832092285156, 0.0485992431640625, 0.051184654235839844, 0.05377006530761719, 0.05635547637939453, 0.058940887451171875, 0.06152629852294922, 0.06411170959472656, 0.0666971206665039, 0.06928253173828125, 0.0718679428100586, 0.07445335388183594, 0.07703876495361328, 0.07962417602539062, 0.08220958709716797, 0.08479499816894531, 0.08738040924072266, 0.0899658203125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 4.0, 7.0, 11.0, 16.0, 18.0, 13.0, 27.0, 25.0, 28.0, 32.0, 35.0, 35.0, 47.0, 30.0, 35.0, 45.0, 35.0, 33.0, 49.0, 42.0, 47.0, 42.0, 43.0, 42.0, 29.0, 29.0, 38.0, 23.0, 25.0, 26.0, 19.0, 18.0, 15.0, 9.0, 5.0, 8.0, 2.0, 4.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0765380859375, -0.07406234741210938, -0.07158660888671875, -0.06911087036132812, -0.0666351318359375, -0.06415939331054688, -0.06168365478515625, -0.059207916259765625, -0.056732177734375, -0.054256439208984375, -0.05178070068359375, -0.049304962158203125, -0.0468292236328125, -0.044353485107421875, -0.04187774658203125, -0.039402008056640625, -0.03692626953125, -0.034450531005859375, -0.03197479248046875, -0.029499053955078125, -0.0270233154296875, -0.024547576904296875, -0.02207183837890625, -0.019596099853515625, -0.017120361328125, -0.014644622802734375, -0.01216888427734375, -0.009693145751953125, -0.0072174072265625, -0.004741668701171875, -0.00226593017578125, 0.000209808349609375, 0.002685546875, 0.005161285400390625, 0.00763702392578125, 0.010112762451171875, 0.0125885009765625, 0.015064239501953125, 0.01753997802734375, 0.020015716552734375, 0.022491455078125, 0.024967193603515625, 0.02744293212890625, 0.029918670654296875, 0.0323944091796875, 0.034870147705078125, 0.03734588623046875, 0.039821624755859375, 0.04229736328125, 0.044773101806640625, 0.04724884033203125, 0.049724578857421875, 0.0522003173828125, 0.054676055908203125, 0.05715179443359375, 0.059627532958984375, 0.062103271484375, 0.06457901000976562, 0.06705474853515625, 0.06953048706054688, 0.0720062255859375, 0.07448196411132812, 0.07695770263671875, 0.07943344116210938, 0.0819091796875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 5.0, 9.0, 11.0, 19.0, 39.0, 59.0, 127.0, 204.0, 400.0, 907.0, 2022.0, 5788.0, 19940.0, 91047.0, 545608.0, 2790082.0, 606289.0, 100207.0, 21559.0, 6020.0, 2216.0, 888.0, 390.0, 196.0, 107.0, 67.0, 38.0, 20.0, 5.0, 9.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2177734375, -0.20986175537109375, -0.2019500732421875, -0.19403839111328125, -0.186126708984375, -0.17821502685546875, -0.1703033447265625, -0.16239166259765625, -0.15447998046875, -0.14656829833984375, -0.1386566162109375, -0.13074493408203125, -0.122833251953125, -0.11492156982421875, -0.1070098876953125, -0.09909820556640625, -0.0911865234375, -0.08327484130859375, -0.0753631591796875, -0.06745147705078125, -0.059539794921875, -0.05162811279296875, -0.0437164306640625, -0.03580474853515625, -0.02789306640625, -0.01998138427734375, -0.0120697021484375, -0.00415802001953125, 0.003753662109375, 0.01166534423828125, 0.0195770263671875, 0.02748870849609375, 0.035400390625, 0.04331207275390625, 0.0512237548828125, 0.05913543701171875, 0.067047119140625, 0.07495880126953125, 0.0828704833984375, 0.09078216552734375, 0.09869384765625, 0.10660552978515625, 0.1145172119140625, 0.12242889404296875, 0.130340576171875, 0.13825225830078125, 0.1461639404296875, 0.15407562255859375, 0.1619873046875, 0.16989898681640625, 0.1778106689453125, 0.18572235107421875, 0.193634033203125, 0.20154571533203125, 0.2094573974609375, 0.21736907958984375, 0.22528076171875, 0.23319244384765625, 0.2411041259765625, 0.24901580810546875, 0.256927490234375, 0.26483917236328125, 0.2727508544921875, 0.28066253662109375, 0.28857421875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 8.0, 10.0, 19.0, 28.0, 37.0, 37.0, 70.0, 95.0, 107.0, 188.0, 282.0, 445.0, 644.0, 667.0, 481.0, 301.0, 201.0, 136.0, 87.0, 67.0, 46.0, 29.0, 24.0, 12.0, 19.0, 8.0, 13.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2274169921875, -0.2207317352294922, -0.21404647827148438, -0.20736122131347656, -0.20067596435546875, -0.19399070739746094, -0.18730545043945312, -0.1806201934814453, -0.1739349365234375, -0.1672496795654297, -0.16056442260742188, -0.15387916564941406, -0.14719390869140625, -0.14050865173339844, -0.13382339477539062, -0.1271381378173828, -0.120452880859375, -0.11376762390136719, -0.10708236694335938, -0.10039710998535156, -0.09371185302734375, -0.08702659606933594, -0.08034133911132812, -0.07365608215332031, -0.0669708251953125, -0.06028556823730469, -0.053600311279296875, -0.04691505432128906, -0.04022979736328125, -0.03354454040527344, -0.026859283447265625, -0.020174026489257812, -0.01348876953125, -0.0068035125732421875, -0.000118255615234375, 0.0065670013427734375, 0.01325225830078125, 0.019937515258789062, 0.026622772216796875, 0.03330802917480469, 0.0399932861328125, 0.04667854309082031, 0.053363800048828125, 0.06004905700683594, 0.06673431396484375, 0.07341957092285156, 0.08010482788085938, 0.08679008483886719, 0.093475341796875, 0.10016059875488281, 0.10684585571289062, 0.11353111267089844, 0.12021636962890625, 0.12690162658691406, 0.13358688354492188, 0.1402721405029297, 0.1469573974609375, 0.1536426544189453, 0.16032791137695312, 0.16701316833496094, 0.17369842529296875, 0.18038368225097656, 0.18706893920898438, 0.1937541961669922, 0.200439453125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 11.0, 27.0, 50.0, 78.0, 140.0, 191.0, 190.0, 150.0, 85.0, 33.0, 18.0, 10.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.662413239479065, -1.595971941947937, -1.529530644416809, -1.4630893468856812, -1.3966481685638428, -1.3302068710327148, -1.263765573501587, -1.197324275970459, -1.130882978439331, -1.0644416809082031, -0.9980003833770752, -0.931559145450592, -0.8651178479194641, -0.7986765503883362, -0.732235312461853, -0.6657940149307251, -0.5993527173995972, -0.5329114198684692, -0.4664701521396637, -0.40002888441085815, -0.3335875868797302, -0.2671462893486023, -0.20070502161979675, -0.1342637538909912, -0.06782245635986328, -0.0013811737298965454, 0.06506010890007019, 0.13150139153003693, 0.19794267416000366, 0.2643839716911316, 0.33082523941993713, 0.3972665071487427, 0.46370792388916016, 0.5301492214202881, 0.596590518951416, 0.6630317568778992, 0.7294730544090271, 0.795914351940155, 0.8623555898666382, 0.9287968873977661, 0.995238184928894, 1.061679482460022, 1.12812077999115, 1.1945620775222778, 1.2610032558441162, 1.3274445533752441, 1.393885850906372, 1.4603271484375, 1.526768445968628, 1.5932097434997559, 1.6596510410308838, 1.7260923385620117, 1.7925336360931396, 1.8589749336242676, 1.925416111946106, 1.9918574094772339, 2.0582985877990723, 2.1247398853302, 2.191181182861328, 2.257622480392456, 2.324063777923584, 2.390505075454712, 2.45694637298584, 2.5233874320983887, 2.5898289680480957]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 7.0, 4.0, 10.0, 11.0, 20.0, 26.0, 17.0, 31.0, 28.0, 29.0, 38.0, 40.0, 30.0, 31.0, 44.0, 50.0, 52.0, 48.0, 47.0, 59.0, 42.0, 49.0, 45.0, 38.0, 31.0, 46.0, 20.0, 24.0, 16.0, 15.0, 13.0, 8.0, 9.0, 8.0, 8.0, 1.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5951695442199707, -0.5733194947242737, -0.5514693856239319, -0.5296193361282349, -0.5077692270278931, -0.48591917753219604, -0.46406909823417664, -0.4422190189361572, -0.4203689396381378, -0.3985188603401184, -0.376668781042099, -0.3548187017440796, -0.33296865224838257, -0.31111854314804077, -0.28926849365234375, -0.26741841435432434, -0.24556833505630493, -0.22371825575828552, -0.2018681764602661, -0.1800181120634079, -0.1581680327653885, -0.13631795346736908, -0.11446788907051086, -0.09261780977249146, -0.07076773047447205, -0.048917654901742935, -0.027067579329013824, -0.005217507481575012, 0.016632571816444397, 0.038482651114463806, 0.06033271551132202, 0.08218279480934143, 0.10403293371200562, 0.12588301301002502, 0.14773309230804443, 0.16958315670490265, 0.19143323600292206, 0.21328331530094147, 0.23513337969779968, 0.2569834589958191, 0.2788335382938385, 0.3006836175918579, 0.3225336968898773, 0.34438377618789673, 0.36623382568359375, 0.38808393478393555, 0.40993398427963257, 0.431784063577652, 0.4536341428756714, 0.4754842221736908, 0.4973343014717102, 0.5191843509674072, 0.541034460067749, 0.562884509563446, 0.5847345590591431, 0.6065846681594849, 0.6284347772598267, 0.6502848267555237, 0.6721349358558655, 0.6939849853515625, 0.7158350944519043, 0.7376851439476013, 0.7595351934432983, 0.7813853025436401, 0.8032353520393372]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 7.0, 7.0, 5.0, 7.0, 11.0, 18.0, 25.0, 37.0, 73.0, 121.0, 175.0, 250.0, 430.0, 688.0, 1227.0, 1960.0, 3259.0, 5814.0, 10488.0, 21312.0, 44655.0, 92519.0, 167657.0, 227131.0, 207393.0, 130768.0, 66468.0, 31560.0, 15445.0, 8133.0, 4459.0, 2528.0, 1502.0, 939.0, 572.0, 324.0, 219.0, 135.0, 94.0, 47.0, 27.0, 26.0, 15.0, 14.0, 9.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1112060546875, -0.10791301727294922, -0.10461997985839844, -0.10132694244384766, -0.09803390502929688, -0.0947408676147461, -0.09144783020019531, -0.08815479278564453, -0.08486175537109375, -0.08156871795654297, -0.07827568054199219, -0.0749826431274414, -0.07168960571289062, -0.06839656829833984, -0.06510353088378906, -0.06181049346923828, -0.0585174560546875, -0.05522441864013672, -0.05193138122558594, -0.048638343811035156, -0.045345306396484375, -0.042052268981933594, -0.03875923156738281, -0.03546619415283203, -0.03217315673828125, -0.02888011932373047, -0.025587081909179688, -0.022294044494628906, -0.019001007080078125, -0.015707969665527344, -0.012414932250976562, -0.009121894836425781, -0.005828857421875, -0.0025358200073242188, 0.0007572174072265625, 0.004050254821777344, 0.007343292236328125, 0.010636329650878906, 0.013929367065429688, 0.01722240447998047, 0.02051544189453125, 0.02380847930908203, 0.027101516723632812, 0.030394554138183594, 0.033687591552734375, 0.036980628967285156, 0.04027366638183594, 0.04356670379638672, 0.0468597412109375, 0.05015277862548828, 0.05344581604003906, 0.056738853454589844, 0.060031890869140625, 0.0633249282836914, 0.06661796569824219, 0.06991100311279297, 0.07320404052734375, 0.07649707794189453, 0.07979011535644531, 0.0830831527709961, 0.08637619018554688, 0.08966922760009766, 0.09296226501464844, 0.09625530242919922, 0.09954833984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 3.0, 5.0, 4.0, 13.0, 9.0, 10.0, 12.0, 12.0, 17.0, 14.0, 33.0, 24.0, 32.0, 28.0, 32.0, 31.0, 18.0, 44.0, 46.0, 39.0, 44.0, 46.0, 34.0, 36.0, 33.0, 37.0, 32.0, 38.0, 43.0, 34.0, 25.0, 17.0, 23.0, 24.0, 15.0, 20.0, 12.0, 6.0, 10.0, 10.0, 5.0, 8.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06787109375, -0.06564903259277344, -0.06342697143554688, -0.06120491027832031, -0.05898284912109375, -0.05676078796386719, -0.054538726806640625, -0.05231666564941406, -0.0500946044921875, -0.04787254333496094, -0.045650482177734375, -0.04342842102050781, -0.04120635986328125, -0.03898429870605469, -0.036762237548828125, -0.03454017639160156, -0.032318115234375, -0.030096054077148438, -0.027873992919921875, -0.025651931762695312, -0.02342987060546875, -0.021207809448242188, -0.018985748291015625, -0.016763687133789062, -0.0145416259765625, -0.012319564819335938, -0.010097503662109375, -0.007875442504882812, -0.00565338134765625, -0.0034313201904296875, -0.001209259033203125, 0.0010128021240234375, 0.00323486328125, 0.0054569244384765625, 0.007678985595703125, 0.009901046752929688, 0.01212310791015625, 0.014345169067382812, 0.016567230224609375, 0.018789291381835938, 0.0210113525390625, 0.023233413696289062, 0.025455474853515625, 0.027677536010742188, 0.02989959716796875, 0.03212165832519531, 0.034343719482421875, 0.03656578063964844, 0.038787841796875, 0.04100990295410156, 0.043231964111328125, 0.04545402526855469, 0.04767608642578125, 0.04989814758300781, 0.052120208740234375, 0.05434226989746094, 0.0565643310546875, 0.05878639221191406, 0.061008453369140625, 0.06323051452636719, 0.06545257568359375, 0.06767463684082031, 0.06989669799804688, 0.07211875915527344, 0.0743408203125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0, 9.0, 12.0, 24.0, 18.0, 40.0, 50.0, 85.0, 133.0, 216.0, 367.0, 703.0, 1377.0, 2859.0, 6094.0, 14481.0, 41193.0, 135266.0, 327971.0, 322142.0, 129718.0, 40116.0, 13980.0, 5972.0, 2732.0, 1297.0, 685.0, 375.0, 203.0, 145.0, 86.0, 58.0, 36.0, 23.0, 18.0, 17.0, 10.0, 5.0, 12.0, 5.0, 5.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.1641845703125, -0.15935325622558594, -0.15452194213867188, -0.1496906280517578, -0.14485931396484375, -0.1400279998779297, -0.13519668579101562, -0.13036537170410156, -0.1255340576171875, -0.12070274353027344, -0.11587142944335938, -0.11104011535644531, -0.10620880126953125, -0.10137748718261719, -0.09654617309570312, -0.09171485900878906, -0.086883544921875, -0.08205223083496094, -0.07722091674804688, -0.07238960266113281, -0.06755828857421875, -0.06272697448730469, -0.057895660400390625, -0.05306434631347656, -0.0482330322265625, -0.04340171813964844, -0.038570404052734375, -0.03373908996582031, -0.02890777587890625, -0.024076461791992188, -0.019245147705078125, -0.014413833618164062, -0.00958251953125, -0.0047512054443359375, 8.0108642578125e-05, 0.0049114227294921875, 0.00974273681640625, 0.014574050903320312, 0.019405364990234375, 0.024236679077148438, 0.0290679931640625, 0.03389930725097656, 0.038730621337890625, 0.04356193542480469, 0.04839324951171875, 0.05322456359863281, 0.058055877685546875, 0.06288719177246094, 0.067718505859375, 0.07254981994628906, 0.07738113403320312, 0.08221244812011719, 0.08704376220703125, 0.09187507629394531, 0.09670639038085938, 0.10153770446777344, 0.1063690185546875, 0.11120033264160156, 0.11603164672851562, 0.12086296081542969, 0.12569427490234375, 0.1305255889892578, 0.13535690307617188, 0.14018821716308594, 0.14501953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 4.0, 6.0, 5.0, 9.0, 14.0, 8.0, 17.0, 9.0, 29.0, 20.0, 25.0, 26.0, 31.0, 31.0, 51.0, 44.0, 45.0, 53.0, 42.0, 44.0, 43.0, 65.0, 39.0, 37.0, 44.0, 47.0, 32.0, 31.0, 22.0, 17.0, 25.0, 12.0, 16.0, 12.0, 6.0, 12.0, 4.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.2509765625, -0.24390411376953125, -0.2368316650390625, -0.22975921630859375, -0.222686767578125, -0.21561431884765625, -0.2085418701171875, -0.20146942138671875, -0.19439697265625, -0.18732452392578125, -0.1802520751953125, -0.17317962646484375, -0.166107177734375, -0.15903472900390625, -0.1519622802734375, -0.14488983154296875, -0.1378173828125, -0.13074493408203125, -0.1236724853515625, -0.11660003662109375, -0.109527587890625, -0.10245513916015625, -0.0953826904296875, -0.08831024169921875, -0.08123779296875, -0.07416534423828125, -0.0670928955078125, -0.06002044677734375, -0.052947998046875, -0.04587554931640625, -0.0388031005859375, -0.03173065185546875, -0.024658203125, -0.01758575439453125, -0.0105133056640625, -0.00344085693359375, 0.003631591796875, 0.01070404052734375, 0.0177764892578125, 0.02484893798828125, 0.03192138671875, 0.03899383544921875, 0.0460662841796875, 0.05313873291015625, 0.060211181640625, 0.06728363037109375, 0.0743560791015625, 0.08142852783203125, 0.0885009765625, 0.09557342529296875, 0.1026458740234375, 0.10971832275390625, 0.116790771484375, 0.12386322021484375, 0.1309356689453125, 0.13800811767578125, 0.14508056640625, 0.15215301513671875, 0.1592254638671875, 0.16629791259765625, 0.173370361328125, 0.18044281005859375, 0.1875152587890625, 0.19458770751953125, 0.20166015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 7.0, 14.0, 13.0, 19.0, 31.0, 40.0, 61.0, 85.0, 161.0, 220.0, 459.0, 785.0, 1494.0, 2862.0, 6034.0, 13171.0, 30251.0, 75059.0, 188081.0, 314490.0, 238962.0, 103414.0, 40266.0, 17064.0, 7779.0, 3674.0, 1831.0, 916.0, 493.0, 314.0, 159.0, 111.0, 72.0, 49.0, 30.0, 30.0, 10.0, 9.0, 12.0, 4.0, 5.0, 2.0, 4.0, 5.0, 4.0, 1.0, 2.0], "bins": [-0.08203125, -0.07979393005371094, -0.07755661010742188, -0.07531929016113281, -0.07308197021484375, -0.07084465026855469, -0.06860733032226562, -0.06637001037597656, -0.0641326904296875, -0.06189537048339844, -0.059658050537109375, -0.05742073059082031, -0.05518341064453125, -0.05294609069824219, -0.050708770751953125, -0.04847145080566406, -0.046234130859375, -0.04399681091308594, -0.041759490966796875, -0.03952217102050781, -0.03728485107421875, -0.03504753112792969, -0.032810211181640625, -0.030572891235351562, -0.0283355712890625, -0.026098251342773438, -0.023860931396484375, -0.021623611450195312, -0.01938629150390625, -0.017148971557617188, -0.014911651611328125, -0.012674331665039062, -0.01043701171875, -0.008199691772460938, -0.005962371826171875, -0.0037250518798828125, -0.00148773193359375, 0.0007495880126953125, 0.002986907958984375, 0.0052242279052734375, 0.0074615478515625, 0.009698867797851562, 0.011936187744140625, 0.014173507690429688, 0.01641082763671875, 0.018648147583007812, 0.020885467529296875, 0.023122787475585938, 0.025360107421875, 0.027597427368164062, 0.029834747314453125, 0.03207206726074219, 0.03430938720703125, 0.03654670715332031, 0.038784027099609375, 0.04102134704589844, 0.0432586669921875, 0.04549598693847656, 0.047733306884765625, 0.04997062683105469, 0.05220794677734375, 0.05444526672363281, 0.056682586669921875, 0.05891990661621094, 0.0611572265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 4.0, 4.0, 5.0, 7.0, 8.0, 9.0, 19.0, 19.0, 30.0, 36.0, 37.0, 43.0, 60.0, 65.0, 67.0, 84.0, 89.0, 74.0, 84.0, 49.0, 34.0, 43.0, 33.0, 22.0, 16.0, 14.0, 9.0, 13.0, 7.0, 3.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0503997802734375e-05, -1.9861385226249695e-05, -1.9218772649765015e-05, -1.8576160073280334e-05, -1.7933547496795654e-05, -1.7290934920310974e-05, -1.6648322343826294e-05, -1.6005709767341614e-05, -1.5363097190856934e-05, -1.4720484614372253e-05, -1.4077872037887573e-05, -1.3435259461402893e-05, -1.2792646884918213e-05, -1.2150034308433533e-05, -1.1507421731948853e-05, -1.0864809155464172e-05, -1.0222196578979492e-05, -9.579584002494812e-06, -8.936971426010132e-06, -8.294358849525452e-06, -7.651746273040771e-06, -7.009133696556091e-06, -6.366521120071411e-06, -5.723908543586731e-06, -5.081295967102051e-06, -4.438683390617371e-06, -3.7960708141326904e-06, -3.1534582376480103e-06, -2.51084566116333e-06, -1.86823308467865e-06, -1.2256205081939697e-06, -5.830079317092896e-07, 5.960464477539063e-08, 7.022172212600708e-07, 1.344829797744751e-06, 1.987442374229431e-06, 2.6300549507141113e-06, 3.2726675271987915e-06, 3.915280103683472e-06, 4.557892680168152e-06, 5.200505256652832e-06, 5.843117833137512e-06, 6.485730409622192e-06, 7.1283429861068726e-06, 7.770955562591553e-06, 8.413568139076233e-06, 9.056180715560913e-06, 9.698793292045593e-06, 1.0341405868530273e-05, 1.0984018445014954e-05, 1.1626631021499634e-05, 1.2269243597984314e-05, 1.2911856174468994e-05, 1.3554468750953674e-05, 1.4197081327438354e-05, 1.4839693903923035e-05, 1.5482306480407715e-05, 1.6124919056892395e-05, 1.6767531633377075e-05, 1.7410144209861755e-05, 1.8052756786346436e-05, 1.8695369362831116e-05, 1.9337981939315796e-05, 1.9980594515800476e-05, 2.0623207092285156e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 8.0, 16.0, 25.0, 43.0, 43.0, 78.0, 130.0, 246.0, 362.0, 621.0, 1061.0, 1890.0, 3867.0, 8947.0, 24042.0, 69908.0, 197243.0, 347102.0, 245971.0, 93906.0, 31754.0, 11323.0, 4647.0, 2238.0, 1199.0, 737.0, 408.0, 273.0, 154.0, 120.0, 83.0, 26.0, 35.0, 20.0, 6.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0810546875, -0.0786447525024414, -0.07623481750488281, -0.07382488250732422, -0.07141494750976562, -0.06900501251220703, -0.06659507751464844, -0.06418514251708984, -0.06177520751953125, -0.059365272521972656, -0.05695533752441406, -0.05454540252685547, -0.052135467529296875, -0.04972553253173828, -0.04731559753417969, -0.044905662536621094, -0.0424957275390625, -0.040085792541503906, -0.03767585754394531, -0.03526592254638672, -0.032855987548828125, -0.03044605255126953, -0.028036117553710938, -0.025626182556152344, -0.02321624755859375, -0.020806312561035156, -0.018396377563476562, -0.01598644256591797, -0.013576507568359375, -0.011166572570800781, -0.008756637573242188, -0.006346702575683594, -0.003936767578125, -0.0015268325805664062, 0.0008831024169921875, 0.0032930374145507812, 0.005702972412109375, 0.008112907409667969, 0.010522842407226562, 0.012932777404785156, 0.01534271240234375, 0.017752647399902344, 0.020162582397460938, 0.02257251739501953, 0.024982452392578125, 0.02739238739013672, 0.029802322387695312, 0.032212257385253906, 0.0346221923828125, 0.037032127380371094, 0.03944206237792969, 0.04185199737548828, 0.044261932373046875, 0.04667186737060547, 0.04908180236816406, 0.051491737365722656, 0.05390167236328125, 0.056311607360839844, 0.05872154235839844, 0.06113147735595703, 0.06354141235351562, 0.06595134735107422, 0.06836128234863281, 0.0707712173461914, 0.07318115234375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 5.0, 3.0, 3.0, 5.0, 3.0, 7.0, 19.0, 14.0, 16.0, 31.0, 47.0, 50.0, 53.0, 61.0, 67.0, 67.0, 76.0, 102.0, 79.0, 57.0, 47.0, 42.0, 39.0, 22.0, 21.0, 24.0, 10.0, 10.0, 7.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09716796875, -0.09461498260498047, -0.09206199645996094, -0.0895090103149414, -0.08695602416992188, -0.08440303802490234, -0.08185005187988281, -0.07929706573486328, -0.07674407958984375, -0.07419109344482422, -0.07163810729980469, -0.06908512115478516, -0.06653213500976562, -0.0639791488647461, -0.06142616271972656, -0.05887317657470703, -0.0563201904296875, -0.05376720428466797, -0.05121421813964844, -0.048661231994628906, -0.046108245849609375, -0.043555259704589844, -0.04100227355957031, -0.03844928741455078, -0.03589630126953125, -0.03334331512451172, -0.030790328979492188, -0.028237342834472656, -0.025684356689453125, -0.023131370544433594, -0.020578384399414062, -0.01802539825439453, -0.015472412109375, -0.012919425964355469, -0.010366439819335938, -0.007813453674316406, -0.005260467529296875, -0.0027074813842773438, -0.0001544952392578125, 0.0023984909057617188, 0.00495147705078125, 0.007504463195800781, 0.010057449340820312, 0.012610435485839844, 0.015163421630859375, 0.017716407775878906, 0.020269393920898438, 0.02282238006591797, 0.0253753662109375, 0.02792835235595703, 0.030481338500976562, 0.033034324645996094, 0.035587310791015625, 0.038140296936035156, 0.04069328308105469, 0.04324626922607422, 0.04579925537109375, 0.04835224151611328, 0.05090522766113281, 0.053458213806152344, 0.056011199951171875, 0.058564186096191406, 0.06111717224121094, 0.06367015838623047, 0.06622314453125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 12.0, 28.0, 56.0, 85.0, 112.0, 150.0, 148.0, 138.0, 110.0, 54.0, 38.0, 30.0, 10.0, 5.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8192116618156433, -0.7836429476737976, -0.7480742931365967, -0.712505578994751, -0.6769368648529053, -0.6413681507110596, -0.6057994365692139, -0.5702307820320129, -0.5346620678901672, -0.49909335374832153, -0.4635246694087982, -0.4279559850692749, -0.3923872709274292, -0.3568185567855835, -0.3212498724460602, -0.28568118810653687, -0.25011247396469116, -0.21454377472400665, -0.17897507548332214, -0.14340637624263763, -0.10783767700195312, -0.07226897776126862, -0.036700278520584106, -0.0011315792798995972, 0.03443711996078491, 0.07000581920146942, 0.10557451844215393, 0.14114321768283844, 0.17671191692352295, 0.21228061616420746, 0.24784931540489197, 0.2834179997444153, 0.3189866542816162, 0.3545553684234619, 0.39012405276298523, 0.42569273710250854, 0.46126145124435425, 0.49683016538619995, 0.5323988199234009, 0.5679675340652466, 0.6035362482070923, 0.639104962348938, 0.6746736764907837, 0.7102423310279846, 0.7458110451698303, 0.781379759311676, 0.816948413848877, 0.8525171279907227, 0.8880858421325684, 0.9236545562744141, 0.9592232704162598, 0.9947919249534607, 1.0303606986999512, 1.0659292936325073, 1.101498007774353, 1.1370667219161987, 1.1726354360580444, 1.2082041501998901, 1.2437728643417358, 1.2793415784835815, 1.3149101734161377, 1.3504788875579834, 1.386047601699829, 1.4216163158416748, 1.4571850299835205]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 6.0, 5.0, 9.0, 6.0, 10.0, 7.0, 20.0, 14.0, 15.0, 18.0, 19.0, 17.0, 27.0, 28.0, 35.0, 25.0, 30.0, 37.0, 33.0, 22.0, 46.0, 46.0, 45.0, 37.0, 50.0, 50.0, 35.0, 13.0, 27.0, 24.0, 29.0, 26.0, 28.0, 24.0, 18.0, 18.0, 22.0, 19.0, 9.0, 16.0, 3.0, 11.0, 4.0, 4.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5323914885520935, -0.5159826278686523, -0.49957382678985596, -0.4831649959087372, -0.4667561650276184, -0.45034730434417725, -0.43393847346305847, -0.4175296425819397, -0.4011208117008209, -0.38471198081970215, -0.3683031499385834, -0.3518943190574646, -0.33548545837402344, -0.31907665729522705, -0.3026677966117859, -0.2862589657306671, -0.26985013484954834, -0.25344130396842957, -0.2370324730873108, -0.22062362730503082, -0.20421479642391205, -0.18780596554279327, -0.1713971197605133, -0.15498828887939453, -0.13857945799827576, -0.12217062711715698, -0.10576178878545761, -0.08935295045375824, -0.07294411957263947, -0.05653528869152069, -0.04012645035982132, -0.023717612028121948, -0.007308781147003174, 0.009100053459405899, 0.025508888065814972, 0.041917722672224045, 0.05832655727863312, 0.07473538815975189, 0.09114422649145126, 0.10755306482315063, 0.12396189570426941, 0.14037072658538818, 0.15677955746650696, 0.17318840324878693, 0.1895972341299057, 0.20600606501102448, 0.22241491079330444, 0.23882374167442322, 0.255232572555542, 0.27164140343666077, 0.28805023431777954, 0.3044590651988983, 0.3208678960800171, 0.33727675676345825, 0.353685587644577, 0.3700944185256958, 0.3865032494068146, 0.40291208028793335, 0.4193209111690521, 0.4357297420501709, 0.45213860273361206, 0.46854740381240845, 0.4849562644958496, 0.501365065574646, 0.5177739262580872]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 13.0, 22.0, 41.0, 51.0, 67.0, 110.0, 152.0, 258.0, 469.0, 836.0, 1549.0, 2814.0, 5567.0, 11532.0, 25050.0, 58132.0, 145463.0, 414945.0, 1244025.0, 1446575.0, 527308.0, 181957.0, 70666.0, 29904.0, 13346.0, 6321.0, 3115.0, 1679.0, 907.0, 532.0, 332.0, 178.0, 133.0, 71.0, 52.0, 34.0, 21.0, 14.0, 13.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09552001953125, -0.09244918823242188, -0.08937835693359375, -0.08630752563476562, -0.0832366943359375, -0.08016586303710938, -0.07709503173828125, -0.07402420043945312, -0.070953369140625, -0.06788253784179688, -0.06481170654296875, -0.061740875244140625, -0.0586700439453125, -0.055599212646484375, -0.05252838134765625, -0.049457550048828125, -0.04638671875, -0.043315887451171875, -0.04024505615234375, -0.037174224853515625, -0.0341033935546875, -0.031032562255859375, -0.02796173095703125, -0.024890899658203125, -0.021820068359375, -0.018749237060546875, -0.01567840576171875, -0.012607574462890625, -0.0095367431640625, -0.006465911865234375, -0.00339508056640625, -0.000324249267578125, 0.00274658203125, 0.005817413330078125, 0.00888824462890625, 0.011959075927734375, 0.0150299072265625, 0.018100738525390625, 0.02117156982421875, 0.024242401123046875, 0.027313232421875, 0.030384063720703125, 0.03345489501953125, 0.036525726318359375, 0.0395965576171875, 0.042667388916015625, 0.04573822021484375, 0.048809051513671875, 0.0518798828125, 0.054950714111328125, 0.05802154541015625, 0.061092376708984375, 0.0641632080078125, 0.06723403930664062, 0.07030487060546875, 0.07337570190429688, 0.076446533203125, 0.07951736450195312, 0.08258819580078125, 0.08565902709960938, 0.0887298583984375, 0.09180068969726562, 0.09487152099609375, 0.09794235229492188, 0.10101318359375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 7.0, 10.0, 13.0, 10.0, 14.0, 9.0, 17.0, 21.0, 22.0, 24.0, 23.0, 25.0, 25.0, 28.0, 24.0, 32.0, 43.0, 36.0, 40.0, 30.0, 43.0, 39.0, 38.0, 37.0, 50.0, 29.0, 40.0, 37.0, 36.0, 34.0, 30.0, 22.0, 21.0, 13.0, 10.0, 8.0, 7.0, 11.0, 9.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.081787109375, -0.07947158813476562, -0.07715606689453125, -0.07484054565429688, -0.0725250244140625, -0.07020950317382812, -0.06789398193359375, -0.06557846069335938, -0.063262939453125, -0.060947418212890625, -0.05863189697265625, -0.056316375732421875, -0.0540008544921875, -0.051685333251953125, -0.04936981201171875, -0.047054290771484375, -0.04473876953125, -0.042423248291015625, -0.04010772705078125, -0.037792205810546875, -0.0354766845703125, -0.033161163330078125, -0.03084564208984375, -0.028530120849609375, -0.026214599609375, -0.023899078369140625, -0.02158355712890625, -0.019268035888671875, -0.0169525146484375, -0.014636993408203125, -0.01232147216796875, -0.010005950927734375, -0.0076904296875, -0.005374908447265625, -0.00305938720703125, -0.000743865966796875, 0.0015716552734375, 0.003887176513671875, 0.00620269775390625, 0.008518218994140625, 0.010833740234375, 0.013149261474609375, 0.01546478271484375, 0.017780303955078125, 0.0200958251953125, 0.022411346435546875, 0.02472686767578125, 0.027042388916015625, 0.02935791015625, 0.031673431396484375, 0.03398895263671875, 0.036304473876953125, 0.0386199951171875, 0.040935516357421875, 0.04325103759765625, 0.045566558837890625, 0.047882080078125, 0.050197601318359375, 0.05251312255859375, 0.054828643798828125, 0.0571441650390625, 0.059459686279296875, 0.06177520751953125, 0.06409072875976562, 0.06640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 8.0, 8.0, 18.0, 28.0, 66.0, 108.0, 177.0, 296.0, 627.0, 1349.0, 3351.0, 10051.0, 38705.0, 197231.0, 1635151.0, 2011492.0, 233471.0, 44488.0, 11024.0, 3690.0, 1429.0, 670.0, 368.0, 197.0, 114.0, 58.0, 57.0, 19.0, 15.0, 6.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20361328125, -0.19635391235351562, -0.18909454345703125, -0.18183517456054688, -0.1745758056640625, -0.16731643676757812, -0.16005706787109375, -0.15279769897460938, -0.145538330078125, -0.13827896118164062, -0.13101959228515625, -0.12376022338867188, -0.1165008544921875, -0.10924148559570312, -0.10198211669921875, -0.09472274780273438, -0.08746337890625, -0.08020401000976562, -0.07294464111328125, -0.06568527221679688, -0.0584259033203125, -0.051166534423828125, -0.04390716552734375, -0.036647796630859375, -0.029388427734375, -0.022129058837890625, -0.01486968994140625, -0.007610321044921875, -0.0003509521484375, 0.006908416748046875, 0.01416778564453125, 0.021427154541015625, 0.0286865234375, 0.035945892333984375, 0.04320526123046875, 0.050464630126953125, 0.0577239990234375, 0.06498336791992188, 0.07224273681640625, 0.07950210571289062, 0.086761474609375, 0.09402084350585938, 0.10128021240234375, 0.10853958129882812, 0.1157989501953125, 0.12305831909179688, 0.13031768798828125, 0.13757705688476562, 0.14483642578125, 0.15209579467773438, 0.15935516357421875, 0.16661453247070312, 0.1738739013671875, 0.18113327026367188, 0.18839263916015625, 0.19565200805664062, 0.202911376953125, 0.21017074584960938, 0.21743011474609375, 0.22468948364257812, 0.2319488525390625, 0.23920822143554688, 0.24646759033203125, 0.2537269592285156, 0.260986328125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 14.0, 20.0, 27.0, 31.0, 50.0, 61.0, 92.0, 135.0, 204.0, 299.0, 441.0, 674.0, 715.0, 444.0, 283.0, 168.0, 125.0, 86.0, 57.0, 39.0, 23.0, 26.0, 20.0, 9.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1990966796875, -0.1930675506591797, -0.18703842163085938, -0.18100929260253906, -0.17498016357421875, -0.16895103454589844, -0.16292190551757812, -0.1568927764892578, -0.1508636474609375, -0.1448345184326172, -0.13880538940429688, -0.13277626037597656, -0.12674713134765625, -0.12071800231933594, -0.11468887329101562, -0.10865974426269531, -0.102630615234375, -0.09660148620605469, -0.09057235717773438, -0.08454322814941406, -0.07851409912109375, -0.07248497009277344, -0.06645584106445312, -0.06042671203613281, -0.0543975830078125, -0.04836845397949219, -0.042339324951171875, -0.03631019592285156, -0.03028106689453125, -0.024251937866210938, -0.018222808837890625, -0.012193679809570312, -0.00616455078125, -0.0001354217529296875, 0.005893707275390625, 0.011922836303710938, 0.01795196533203125, 0.023981094360351562, 0.030010223388671875, 0.03603935241699219, 0.0420684814453125, 0.04809761047363281, 0.054126739501953125, 0.06015586853027344, 0.06618499755859375, 0.07221412658691406, 0.07824325561523438, 0.08427238464355469, 0.090301513671875, 0.09633064270019531, 0.10235977172851562, 0.10838890075683594, 0.11441802978515625, 0.12044715881347656, 0.12647628784179688, 0.1325054168701172, 0.1385345458984375, 0.1445636749267578, 0.15059280395507812, 0.15662193298339844, 0.16265106201171875, 0.16868019104003906, 0.17470932006835938, 0.1807384490966797, 0.186767578125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 9.0, 5.0, 16.0, 23.0, 36.0, 56.0, 61.0, 106.0, 96.0, 126.0, 114.0, 118.0, 85.0, 53.0, 41.0, 21.0, 16.0, 8.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4235928058624268, -1.389700174331665, -1.3558074235916138, -1.3219146728515625, -1.2880220413208008, -1.254129409790039, -1.2202366590499878, -1.1863439083099365, -1.1524512767791748, -1.118558645248413, -1.0846658945083618, -1.0507731437683105, -1.0168805122375488, -0.9829878211021423, -0.9490951299667358, -0.9152024388313293, -0.8813097476959229, -0.8474170565605164, -0.8135243654251099, -0.7796316742897034, -0.7457389831542969, -0.7118462920188904, -0.6779536008834839, -0.6440609097480774, -0.6101682186126709, -0.5762755274772644, -0.5423828363418579, -0.5084901452064514, -0.4745974540710449, -0.4407047629356384, -0.40681207180023193, -0.37291938066482544, -0.33902662992477417, -0.3051339387893677, -0.2712412476539612, -0.2373485565185547, -0.2034558653831482, -0.1695631742477417, -0.1356704831123352, -0.10177779197692871, -0.06788510084152222, -0.03399240970611572, -9.971857070922852e-05, 0.033792972564697266, 0.06768566370010376, 0.10157835483551025, 0.13547104597091675, 0.16936373710632324, 0.20325642824172974, 0.23714911937713623, 0.2710418105125427, 0.3049345016479492, 0.3388271927833557, 0.3727198839187622, 0.4066125750541687, 0.4405052661895752, 0.4743979573249817, 0.5082906484603882, 0.5421833395957947, 0.5760760307312012, 0.6099687218666077, 0.6438614130020142, 0.6777541041374207, 0.7116467952728271, 0.7455394864082336]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 7.0, 8.0, 9.0, 10.0, 9.0, 12.0, 13.0, 17.0, 36.0, 19.0, 27.0, 30.0, 40.0, 46.0, 33.0, 41.0, 32.0, 50.0, 47.0, 32.0, 36.0, 40.0, 34.0, 39.0, 28.0, 38.0, 38.0, 32.0, 24.0, 22.0, 24.0, 20.0, 12.0, 20.0, 8.0, 19.0, 12.0, 5.0, 5.0, 4.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4695877432823181, -0.4540618658065796, -0.43853598833084106, -0.42301008105278015, -0.4074842035770416, -0.3919583261013031, -0.3764324486255646, -0.36090654134750366, -0.34538066387176514, -0.3298547863960266, -0.3143289089202881, -0.2988030016422272, -0.28327712416648865, -0.2677512466907501, -0.2522253692150116, -0.23669947683811188, -0.22117359936237335, -0.20564772188663483, -0.1901218295097351, -0.17459595203399658, -0.15907005965709686, -0.14354418218135834, -0.12801828980445862, -0.11249241232872009, -0.09696652740240097, -0.08144064247608185, -0.06591475754976273, -0.0503888763487339, -0.03486299142241478, -0.019337110221385956, -0.0038112252950668335, 0.011714659631252289, 0.02724054455757141, 0.04276642948389053, 0.058292314410209656, 0.07381819188594818, 0.0893440842628479, 0.10486996173858643, 0.12039584666490555, 0.13592173159122467, 0.1514476239681244, 0.16697350144386292, 0.18249939382076263, 0.19802527129650116, 0.21355116367340088, 0.2290770411491394, 0.24460291862487793, 0.26012879610061646, 0.275654673576355, 0.2911805510520935, 0.30670642852783203, 0.32223233580589294, 0.33775821328163147, 0.35328409075737, 0.3688099682331085, 0.38433587551116943, 0.39986175298690796, 0.4153876304626465, 0.430913507938385, 0.4464394152164459, 0.46196529269218445, 0.477491170167923, 0.4930170476436615, 0.5085429549217224, 0.5240688323974609]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 11.0, 5.0, 18.0, 18.0, 31.0, 51.0, 65.0, 116.0, 135.0, 237.0, 334.0, 593.0, 891.0, 1317.0, 2216.0, 3509.0, 5736.0, 9697.0, 17526.0, 39819.0, 108661.0, 264821.0, 321201.0, 159908.0, 57591.0, 23600.0, 11884.0, 6979.0, 4305.0, 2696.0, 1642.0, 1005.0, 676.0, 465.0, 270.0, 188.0, 111.0, 83.0, 44.0, 36.0, 18.0, 10.0, 15.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.144775390625, -0.13998031616210938, -0.13518524169921875, -0.13039016723632812, -0.1255950927734375, -0.12080001831054688, -0.11600494384765625, -0.11120986938476562, -0.106414794921875, -0.10161972045898438, -0.09682464599609375, -0.09202957153320312, -0.0872344970703125, -0.08243942260742188, -0.07764434814453125, -0.07284927368164062, -0.06805419921875, -0.06325912475585938, -0.05846405029296875, -0.053668975830078125, -0.0488739013671875, -0.044078826904296875, -0.03928375244140625, -0.034488677978515625, -0.029693603515625, -0.024898529052734375, -0.02010345458984375, -0.015308380126953125, -0.0105133056640625, -0.005718231201171875, -0.00092315673828125, 0.003871917724609375, 0.0086669921875, 0.013462066650390625, 0.01825714111328125, 0.023052215576171875, 0.0278472900390625, 0.032642364501953125, 0.03743743896484375, 0.042232513427734375, 0.047027587890625, 0.051822662353515625, 0.05661773681640625, 0.061412811279296875, 0.0662078857421875, 0.07100296020507812, 0.07579803466796875, 0.08059310913085938, 0.08538818359375, 0.09018325805664062, 0.09497833251953125, 0.09977340698242188, 0.1045684814453125, 0.10936355590820312, 0.11415863037109375, 0.11895370483398438, 0.123748779296875, 0.12854385375976562, 0.13333892822265625, 0.13813400268554688, 0.1429290771484375, 0.14772415161132812, 0.15251922607421875, 0.15731430053710938, 0.162109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 5.0, 6.0, 5.0, 6.0, 8.0, 9.0, 12.0, 14.0, 21.0, 22.0, 18.0, 30.0, 30.0, 22.0, 26.0, 27.0, 37.0, 37.0, 33.0, 38.0, 38.0, 42.0, 49.0, 38.0, 36.0, 40.0, 36.0, 40.0, 37.0, 30.0, 20.0, 35.0, 18.0, 18.0, 21.0, 23.0, 9.0, 14.0, 8.0, 17.0, 11.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.07379150390625, -0.07142257690429688, -0.06905364990234375, -0.06668472290039062, -0.0643157958984375, -0.061946868896484375, -0.05957794189453125, -0.057209014892578125, -0.054840087890625, -0.052471160888671875, -0.05010223388671875, -0.047733306884765625, -0.0453643798828125, -0.042995452880859375, -0.04062652587890625, -0.038257598876953125, -0.035888671875, -0.033519744873046875, -0.03115081787109375, -0.028781890869140625, -0.0264129638671875, -0.024044036865234375, -0.02167510986328125, -0.019306182861328125, -0.016937255859375, -0.014568328857421875, -0.01219940185546875, -0.009830474853515625, -0.0074615478515625, -0.005092620849609375, -0.00272369384765625, -0.000354766845703125, 0.00201416015625, 0.004383087158203125, 0.00675201416015625, 0.009120941162109375, 0.0114898681640625, 0.013858795166015625, 0.01622772216796875, 0.018596649169921875, 0.020965576171875, 0.023334503173828125, 0.02570343017578125, 0.028072357177734375, 0.0304412841796875, 0.032810211181640625, 0.03517913818359375, 0.037548065185546875, 0.0399169921875, 0.042285919189453125, 0.04465484619140625, 0.047023773193359375, 0.0493927001953125, 0.051761627197265625, 0.05413055419921875, 0.056499481201171875, 0.058868408203125, 0.061237335205078125, 0.06360626220703125, 0.06597518920898438, 0.0683441162109375, 0.07071304321289062, 0.07308197021484375, 0.07545089721679688, 0.07781982421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 8.0, 16.0, 13.0, 21.0, 33.0, 64.0, 106.0, 177.0, 229.0, 434.0, 750.0, 1463.0, 2494.0, 4940.0, 9965.0, 23509.0, 80909.0, 326941.0, 417963.0, 121382.0, 31736.0, 12510.0, 5996.0, 3105.0, 1633.0, 863.0, 533.0, 300.0, 158.0, 105.0, 65.0, 47.0, 26.0, 17.0, 14.0, 7.0, 4.0, 9.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.179931640625, -0.17330169677734375, -0.1666717529296875, -0.16004180908203125, -0.153411865234375, -0.14678192138671875, -0.1401519775390625, -0.13352203369140625, -0.12689208984375, -0.12026214599609375, -0.1136322021484375, -0.10700225830078125, -0.100372314453125, -0.09374237060546875, -0.0871124267578125, -0.08048248291015625, -0.0738525390625, -0.06722259521484375, -0.0605926513671875, -0.05396270751953125, -0.047332763671875, -0.04070281982421875, -0.0340728759765625, -0.02744293212890625, -0.02081298828125, -0.01418304443359375, -0.0075531005859375, -0.00092315673828125, 0.005706787109375, 0.01233673095703125, 0.0189666748046875, 0.02559661865234375, 0.0322265625, 0.03885650634765625, 0.0454864501953125, 0.05211639404296875, 0.058746337890625, 0.06537628173828125, 0.0720062255859375, 0.07863616943359375, 0.08526611328125, 0.09189605712890625, 0.0985260009765625, 0.10515594482421875, 0.111785888671875, 0.11841583251953125, 0.1250457763671875, 0.13167572021484375, 0.1383056640625, 0.14493560791015625, 0.1515655517578125, 0.15819549560546875, 0.164825439453125, 0.17145538330078125, 0.1780853271484375, 0.18471527099609375, 0.19134521484375, 0.19797515869140625, 0.2046051025390625, 0.21123504638671875, 0.217864990234375, 0.22449493408203125, 0.2311248779296875, 0.23775482177734375, 0.244384765625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 9.0, 6.0, 7.0, 5.0, 17.0, 14.0, 15.0, 20.0, 16.0, 26.0, 26.0, 36.0, 38.0, 41.0, 27.0, 33.0, 38.0, 52.0, 50.0, 41.0, 39.0, 52.0, 44.0, 41.0, 35.0, 29.0, 39.0, 33.0, 25.0, 14.0, 21.0, 15.0, 21.0, 15.0, 11.0, 10.0, 8.0, 10.0, 5.0, 6.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.308349609375, -0.30007362365722656, -0.2917976379394531, -0.2835216522216797, -0.27524566650390625, -0.2669696807861328, -0.2586936950683594, -0.25041770935058594, -0.2421417236328125, -0.23386573791503906, -0.22558975219726562, -0.2173137664794922, -0.20903778076171875, -0.2007617950439453, -0.19248580932617188, -0.18420982360839844, -0.175933837890625, -0.16765785217285156, -0.15938186645507812, -0.1511058807373047, -0.14282989501953125, -0.1345539093017578, -0.12627792358398438, -0.11800193786621094, -0.1097259521484375, -0.10144996643066406, -0.09317398071289062, -0.08489799499511719, -0.07662200927734375, -0.06834602355957031, -0.060070037841796875, -0.05179405212402344, -0.04351806640625, -0.03524208068847656, -0.026966094970703125, -0.018690109252929688, -0.01041412353515625, -0.0021381378173828125, 0.006137847900390625, 0.014413833618164062, 0.0226898193359375, 0.030965805053710938, 0.039241790771484375, 0.04751777648925781, 0.05579376220703125, 0.06406974792480469, 0.07234573364257812, 0.08062171936035156, 0.088897705078125, 0.09717369079589844, 0.10544967651367188, 0.11372566223144531, 0.12200164794921875, 0.1302776336669922, 0.13855361938476562, 0.14682960510253906, 0.1551055908203125, 0.16338157653808594, 0.17165756225585938, 0.1799335479736328, 0.18820953369140625, 0.1964855194091797, 0.20476150512695312, 0.21303749084472656, 0.2213134765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 8.0, 18.0, 22.0, 35.0, 57.0, 58.0, 107.0, 151.0, 226.0, 347.0, 461.0, 817.0, 1183.0, 1841.0, 2967.0, 5095.0, 8998.0, 17299.0, 37479.0, 94431.0, 243744.0, 340736.0, 170154.0, 64452.0, 26855.0, 12887.0, 7062.0, 4112.0, 2469.0, 1589.0, 986.0, 588.0, 412.0, 303.0, 180.0, 118.0, 110.0, 69.0, 47.0, 21.0, 23.0, 13.0, 5.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0614013671875, -0.05937480926513672, -0.05734825134277344, -0.055321693420410156, -0.053295135498046875, -0.051268577575683594, -0.04924201965332031, -0.04721546173095703, -0.04518890380859375, -0.04316234588623047, -0.04113578796386719, -0.039109230041503906, -0.037082672119140625, -0.035056114196777344, -0.03302955627441406, -0.03100299835205078, -0.0289764404296875, -0.02694988250732422, -0.024923324584960938, -0.022896766662597656, -0.020870208740234375, -0.018843650817871094, -0.016817092895507812, -0.014790534973144531, -0.01276397705078125, -0.010737419128417969, -0.008710861206054688, -0.006684303283691406, -0.004657745361328125, -0.0026311874389648438, -0.0006046295166015625, 0.0014219284057617188, 0.003448486328125, 0.005475044250488281, 0.0075016021728515625, 0.009528160095214844, 0.011554718017578125, 0.013581275939941406, 0.015607833862304688, 0.01763439178466797, 0.01966094970703125, 0.02168750762939453, 0.023714065551757812, 0.025740623474121094, 0.027767181396484375, 0.029793739318847656, 0.03182029724121094, 0.03384685516357422, 0.0358734130859375, 0.03789997100830078, 0.03992652893066406, 0.041953086853027344, 0.043979644775390625, 0.046006202697753906, 0.04803276062011719, 0.05005931854248047, 0.05208587646484375, 0.05411243438720703, 0.05613899230957031, 0.058165550231933594, 0.060192108154296875, 0.062218666076660156, 0.06424522399902344, 0.06627178192138672, 0.06829833984375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 13.0, 12.0, 16.0, 32.0, 57.0, 74.0, 95.0, 130.0, 132.0, 125.0, 89.0, 60.0, 43.0, 30.0, 24.0, 9.0, 10.0, 8.0, 3.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9921531677246094e-05, -2.893805503845215e-05, -2.7954578399658203e-05, -2.6971101760864258e-05, -2.5987625122070312e-05, -2.5004148483276367e-05, -2.4020671844482422e-05, -2.3037195205688477e-05, -2.205371856689453e-05, -2.1070241928100586e-05, -2.008676528930664e-05, -1.9103288650512695e-05, -1.811981201171875e-05, -1.7136335372924805e-05, -1.615285873413086e-05, -1.5169382095336914e-05, -1.4185905456542969e-05, -1.3202428817749023e-05, -1.2218952178955078e-05, -1.1235475540161133e-05, -1.0251998901367188e-05, -9.268522262573242e-06, -8.285045623779297e-06, -7.3015689849853516e-06, -6.318092346191406e-06, -5.334615707397461e-06, -4.351139068603516e-06, -3.3676624298095703e-06, -2.384185791015625e-06, -1.4007091522216797e-06, -4.172325134277344e-07, 5.662441253662109e-07, 1.5497207641601562e-06, 2.5331974029541016e-06, 3.516674041748047e-06, 4.500150680541992e-06, 5.4836273193359375e-06, 6.467103958129883e-06, 7.450580596923828e-06, 8.434057235717773e-06, 9.417533874511719e-06, 1.0401010513305664e-05, 1.138448715209961e-05, 1.2367963790893555e-05, 1.33514404296875e-05, 1.4334917068481445e-05, 1.531839370727539e-05, 1.6301870346069336e-05, 1.728534698486328e-05, 1.8268823623657227e-05, 1.9252300262451172e-05, 2.0235776901245117e-05, 2.1219253540039062e-05, 2.2202730178833008e-05, 2.3186206817626953e-05, 2.41696834564209e-05, 2.5153160095214844e-05, 2.613663673400879e-05, 2.7120113372802734e-05, 2.810359001159668e-05, 2.9087066650390625e-05, 3.007054328918457e-05, 3.1054019927978516e-05, 3.203749656677246e-05, 3.3020973205566406e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 10.0, 13.0, 18.0, 26.0, 52.0, 93.0, 180.0, 330.0, 667.0, 1305.0, 2922.0, 6633.0, 15822.0, 40134.0, 112929.0, 290604.0, 340738.0, 148567.0, 52209.0, 20306.0, 8210.0, 3613.0, 1597.0, 756.0, 383.0, 202.0, 99.0, 66.0, 30.0, 23.0, 7.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0804443359375, -0.0781545639038086, -0.07586479187011719, -0.07357501983642578, -0.07128524780273438, -0.06899547576904297, -0.06670570373535156, -0.06441593170166016, -0.06212615966796875, -0.059836387634277344, -0.05754661560058594, -0.05525684356689453, -0.052967071533203125, -0.05067729949951172, -0.04838752746582031, -0.046097755432128906, -0.0438079833984375, -0.041518211364746094, -0.03922843933105469, -0.03693866729736328, -0.034648895263671875, -0.03235912322998047, -0.030069351196289062, -0.027779579162597656, -0.02548980712890625, -0.023200035095214844, -0.020910263061523438, -0.01862049102783203, -0.016330718994140625, -0.014040946960449219, -0.011751174926757812, -0.009461402893066406, -0.007171630859375, -0.004881858825683594, -0.0025920867919921875, -0.00030231475830078125, 0.001987457275390625, 0.004277229309082031, 0.0065670013427734375, 0.008856773376464844, 0.01114654541015625, 0.013436317443847656, 0.015726089477539062, 0.01801586151123047, 0.020305633544921875, 0.02259540557861328, 0.024885177612304688, 0.027174949645996094, 0.0294647216796875, 0.031754493713378906, 0.03404426574707031, 0.03633403778076172, 0.038623809814453125, 0.04091358184814453, 0.04320335388183594, 0.045493125915527344, 0.04778289794921875, 0.050072669982910156, 0.05236244201660156, 0.05465221405029297, 0.056941986083984375, 0.05923175811767578, 0.06152153015136719, 0.0638113021850586, 0.06610107421875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 3.0, 9.0, 8.0, 10.0, 17.0, 28.0, 22.0, 30.0, 38.0, 35.0, 62.0, 63.0, 64.0, 64.0, 86.0, 66.0, 62.0, 52.0, 49.0, 43.0, 29.0, 25.0, 22.0, 14.0, 19.0, 14.0, 6.0, 10.0, 6.0, 10.0, 4.0, 5.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0638427734375, -0.06171894073486328, -0.05959510803222656, -0.057471275329589844, -0.055347442626953125, -0.053223609924316406, -0.05109977722167969, -0.04897594451904297, -0.04685211181640625, -0.04472827911376953, -0.04260444641113281, -0.040480613708496094, -0.038356781005859375, -0.036232948303222656, -0.03410911560058594, -0.03198528289794922, -0.0298614501953125, -0.02773761749267578, -0.025613784790039062, -0.023489952087402344, -0.021366119384765625, -0.019242286682128906, -0.017118453979492188, -0.014994621276855469, -0.01287078857421875, -0.010746955871582031, -0.008623123168945312, -0.006499290466308594, -0.004375457763671875, -0.0022516250610351562, -0.0001277923583984375, 0.0019960403442382812, 0.004119873046875, 0.006243705749511719, 0.008367538452148438, 0.010491371154785156, 0.012615203857421875, 0.014739036560058594, 0.016862869262695312, 0.01898670196533203, 0.02111053466796875, 0.02323436737060547, 0.025358200073242188, 0.027482032775878906, 0.029605865478515625, 0.031729698181152344, 0.03385353088378906, 0.03597736358642578, 0.0381011962890625, 0.04022502899169922, 0.04234886169433594, 0.044472694396972656, 0.046596527099609375, 0.048720359802246094, 0.05084419250488281, 0.05296802520751953, 0.05509185791015625, 0.05721569061279297, 0.05933952331542969, 0.061463356018066406, 0.06358718872070312, 0.06571102142333984, 0.06783485412597656, 0.06995868682861328, 0.07208251953125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 4.0, 8.0, 9.0, 17.0, 28.0, 53.0, 68.0, 95.0, 145.0, 129.0, 118.0, 106.0, 74.0, 65.0, 31.0, 19.0, 8.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.213486671447754, -1.178208351135254, -1.142930030822754, -1.1076518297195435, -1.0723735094070435, -1.0370951890945435, -1.001816987991333, -0.966538667678833, -0.931260347366333, -0.895982027053833, -0.8607037663459778, -0.8254255056381226, -0.7901471853256226, -0.7548688650131226, -0.7195906043052673, -0.6843123435974121, -0.6490340232849121, -0.6137557029724121, -0.5784774422645569, -0.5431991815567017, -0.5079208612442017, -0.47264257073402405, -0.43736428022384644, -0.4020859897136688, -0.3668076992034912, -0.3315294086933136, -0.296251118183136, -0.2609728276729584, -0.22569453716278076, -0.19041624665260315, -0.15513795614242554, -0.11985966563224792, -0.08458149433135986, -0.04930320382118225, -0.014024913311004639, 0.021253377199172974, 0.056531667709350586, 0.0918099582195282, 0.1270882487297058, 0.16236653923988342, 0.19764482975006104, 0.23292312026023865, 0.26820141077041626, 0.30347970128059387, 0.3387579917907715, 0.3740362823009491, 0.4093145728111267, 0.4445928633213043, 0.47987115383148193, 0.5151494741439819, 0.5504277348518372, 0.5857059955596924, 0.6209843158721924, 0.6562626361846924, 0.6915408968925476, 0.7268191576004028, 0.7620974779129028, 0.7973757982254028, 0.8326540589332581, 0.8679323196411133, 0.9032106399536133, 0.9384889602661133, 0.9737672209739685, 1.0090454816818237, 1.0443238019943237]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 12.0, 7.0, 10.0, 10.0, 10.0, 16.0, 17.0, 23.0, 20.0, 21.0, 23.0, 42.0, 35.0, 29.0, 45.0, 38.0, 35.0, 45.0, 44.0, 47.0, 38.0, 38.0, 35.0, 42.0, 37.0, 34.0, 29.0, 32.0, 20.0, 32.0, 19.0, 16.0, 15.0, 10.0, 16.0, 8.0, 11.0, 10.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376426815986633, -0.6176867485046387, -0.597730815410614, -0.5777749419212341, -0.5578190088272095, -0.5378630757331848, -0.5179071426391602, -0.4979512393474579, -0.4779953360557556, -0.45803940296173096, -0.4380834996700287, -0.41812756657600403, -0.39817166328430176, -0.3782157301902771, -0.35825979709625244, -0.33830389380455017, -0.3183479607105255, -0.29839202761650085, -0.2784361243247986, -0.2584801912307739, -0.23852428793907166, -0.218568354845047, -0.19861243665218353, -0.17865651845932007, -0.1587006002664566, -0.13874468207359314, -0.11878876388072968, -0.09883283823728561, -0.07887692004442215, -0.058921001851558685, -0.038965076208114624, -0.01900915801525116, 0.0009467601776123047, 0.02090268023312092, 0.04085860028862953, 0.060814522206783295, 0.08077044039964676, 0.10072635859251022, 0.12068228423595428, 0.14063820242881775, 0.1605941206216812, 0.18055003881454468, 0.20050595700740814, 0.2204618752002716, 0.24041780829429626, 0.26037371158599854, 0.2803296446800232, 0.30028557777404785, 0.3202414810657501, 0.3401974141597748, 0.36015331745147705, 0.3801092505455017, 0.400065153837204, 0.42002108693122864, 0.4399769902229309, 0.45993292331695557, 0.4798888564109802, 0.4998447895050049, 0.5198007225990295, 0.5397565960884094, 0.5597125291824341, 0.5796684622764587, 0.5996243953704834, 0.6195802688598633, 0.6395362019538879]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 16.0, 23.0, 34.0, 58.0, 80.0, 138.0, 178.0, 281.0, 416.0, 654.0, 1022.0, 1769.0, 2961.0, 4971.0, 8912.0, 17376.0, 34812.0, 72749.0, 161235.0, 363760.0, 795997.0, 1212475.0, 818184.0, 378772.0, 166260.0, 75055.0, 35639.0, 18054.0, 9462.0, 5009.0, 3022.0, 1711.0, 1078.0, 722.0, 468.0, 270.0, 202.0, 140.0, 94.0, 57.0, 47.0, 39.0, 16.0, 16.0, 12.0, 15.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07061767578125, -0.06814193725585938, -0.06566619873046875, -0.06319046020507812, -0.0607147216796875, -0.058238983154296875, -0.05576324462890625, -0.053287506103515625, -0.050811767578125, -0.048336029052734375, -0.04586029052734375, -0.043384552001953125, -0.0409088134765625, -0.038433074951171875, -0.03595733642578125, -0.033481597900390625, -0.031005859375, -0.028530120849609375, -0.02605438232421875, -0.023578643798828125, -0.0211029052734375, -0.018627166748046875, -0.01615142822265625, -0.013675689697265625, -0.011199951171875, -0.008724212646484375, -0.00624847412109375, -0.003772735595703125, -0.0012969970703125, 0.001178741455078125, 0.00365447998046875, 0.006130218505859375, 0.00860595703125, 0.011081695556640625, 0.01355743408203125, 0.016033172607421875, 0.0185089111328125, 0.020984649658203125, 0.02346038818359375, 0.025936126708984375, 0.028411865234375, 0.030887603759765625, 0.03336334228515625, 0.035839080810546875, 0.0383148193359375, 0.040790557861328125, 0.04326629638671875, 0.045742034912109375, 0.0482177734375, 0.050693511962890625, 0.05316925048828125, 0.055644989013671875, 0.0581207275390625, 0.060596466064453125, 0.06307220458984375, 0.06554794311523438, 0.068023681640625, 0.07049942016601562, 0.07297515869140625, 0.07545089721679688, 0.0779266357421875, 0.08040237426757812, 0.08287811279296875, 0.08535385131835938, 0.08782958984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 12.0, 4.0, 7.0, 17.0, 14.0, 11.0, 20.0, 20.0, 12.0, 27.0, 28.0, 28.0, 37.0, 35.0, 36.0, 29.0, 38.0, 46.0, 53.0, 53.0, 51.0, 44.0, 47.0, 44.0, 42.0, 37.0, 32.0, 32.0, 25.0, 22.0, 7.0, 22.0, 13.0, 11.0, 6.0, 4.0, 6.0, 11.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0911865234375, -0.08851146697998047, -0.08583641052246094, -0.0831613540649414, -0.08048629760742188, -0.07781124114990234, -0.07513618469238281, -0.07246112823486328, -0.06978607177734375, -0.06711101531982422, -0.06443595886230469, -0.061760902404785156, -0.059085845947265625, -0.056410789489746094, -0.05373573303222656, -0.05106067657470703, -0.0483856201171875, -0.04571056365966797, -0.04303550720214844, -0.040360450744628906, -0.037685394287109375, -0.035010337829589844, -0.03233528137207031, -0.02966022491455078, -0.02698516845703125, -0.02431011199951172, -0.021635055541992188, -0.018959999084472656, -0.016284942626953125, -0.013609886169433594, -0.010934829711914062, -0.008259773254394531, -0.005584716796875, -0.0029096603393554688, -0.0002346038818359375, 0.0024404525756835938, 0.005115509033203125, 0.007790565490722656, 0.010465621948242188, 0.013140678405761719, 0.01581573486328125, 0.01849079132080078, 0.021165847778320312, 0.023840904235839844, 0.026515960693359375, 0.029191017150878906, 0.03186607360839844, 0.03454113006591797, 0.0372161865234375, 0.03989124298095703, 0.04256629943847656, 0.045241355895996094, 0.047916412353515625, 0.050591468811035156, 0.05326652526855469, 0.05594158172607422, 0.05861663818359375, 0.06129169464111328, 0.06396675109863281, 0.06664180755615234, 0.06931686401367188, 0.0719919204711914, 0.07466697692871094, 0.07734203338623047, 0.08001708984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 10.0, 8.0, 23.0, 42.0, 40.0, 84.0, 150.0, 241.0, 418.0, 821.0, 1615.0, 3940.0, 11727.0, 48585.0, 312366.0, 2620844.0, 1038891.0, 119545.0, 23126.0, 6661.0, 2583.0, 1149.0, 591.0, 334.0, 170.0, 107.0, 84.0, 41.0, 24.0, 20.0, 17.0, 10.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2471923828125, -0.23888587951660156, -0.23057937622070312, -0.2222728729248047, -0.21396636962890625, -0.2056598663330078, -0.19735336303710938, -0.18904685974121094, -0.1807403564453125, -0.17243385314941406, -0.16412734985351562, -0.1558208465576172, -0.14751434326171875, -0.1392078399658203, -0.13090133666992188, -0.12259483337402344, -0.114288330078125, -0.10598182678222656, -0.09767532348632812, -0.08936882019042969, -0.08106231689453125, -0.07275581359863281, -0.06444931030273438, -0.05614280700683594, -0.0478363037109375, -0.03952980041503906, -0.031223297119140625, -0.022916793823242188, -0.01461029052734375, -0.0063037872314453125, 0.002002716064453125, 0.010309219360351562, 0.01861572265625, 0.026922225952148438, 0.035228729248046875, 0.04353523254394531, 0.05184173583984375, 0.06014823913574219, 0.06845474243164062, 0.07676124572753906, 0.0850677490234375, 0.09337425231933594, 0.10168075561523438, 0.10998725891113281, 0.11829376220703125, 0.1266002655029297, 0.13490676879882812, 0.14321327209472656, 0.151519775390625, 0.15982627868652344, 0.16813278198242188, 0.1764392852783203, 0.18474578857421875, 0.1930522918701172, 0.20135879516601562, 0.20966529846191406, 0.2179718017578125, 0.22627830505371094, 0.23458480834960938, 0.2428913116455078, 0.25119781494140625, 0.2595043182373047, 0.2678108215332031, 0.27611732482910156, 0.284423828125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 6.0, 16.0, 10.0, 27.0, 30.0, 59.0, 76.0, 119.0, 153.0, 242.0, 362.0, 520.0, 673.0, 582.0, 388.0, 257.0, 180.0, 108.0, 92.0, 50.0, 34.0, 16.0, 24.0, 11.0, 9.0, 7.0, 2.0, 4.0, 8.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2181396484375, -0.211456298828125, -0.20477294921875, -0.198089599609375, -0.19140625, -0.184722900390625, -0.17803955078125, -0.171356201171875, -0.1646728515625, -0.157989501953125, -0.15130615234375, -0.144622802734375, -0.137939453125, -0.131256103515625, -0.12457275390625, -0.117889404296875, -0.1112060546875, -0.104522705078125, -0.09783935546875, -0.091156005859375, -0.08447265625, -0.077789306640625, -0.07110595703125, -0.064422607421875, -0.0577392578125, -0.051055908203125, -0.04437255859375, -0.037689208984375, -0.031005859375, -0.024322509765625, -0.01763916015625, -0.010955810546875, -0.0042724609375, 0.002410888671875, 0.00909423828125, 0.015777587890625, 0.0224609375, 0.029144287109375, 0.03582763671875, 0.042510986328125, 0.0491943359375, 0.055877685546875, 0.06256103515625, 0.069244384765625, 0.075927734375, 0.082611083984375, 0.08929443359375, 0.095977783203125, 0.1026611328125, 0.109344482421875, 0.11602783203125, 0.122711181640625, 0.12939453125, 0.136077880859375, 0.14276123046875, 0.149444580078125, 0.1561279296875, 0.162811279296875, 0.16949462890625, 0.176177978515625, 0.182861328125, 0.189544677734375, 0.19622802734375, 0.202911376953125, 0.2095947265625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 1.0, 0.0, 6.0, 7.0, 13.0, 12.0, 36.0, 56.0, 97.0, 123.0, 160.0, 145.0, 125.0, 87.0, 65.0, 33.0, 14.0, 17.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0444986820220947, -1.9980562925338745, -1.9516139030456543, -1.9051713943481445, -1.8587290048599243, -1.812286615371704, -1.7658442258834839, -1.7194018363952637, -1.6729594469070435, -1.6265170574188232, -1.580074667930603, -1.5336322784423828, -1.487189769744873, -1.4407473802566528, -1.3943049907684326, -1.3478626012802124, -1.3014202117919922, -1.254977822303772, -1.2085354328155518, -1.162092924118042, -1.1156505346298218, -1.0692081451416016, -1.0227657556533813, -0.9763233661651611, -0.9298808574676514, -0.8834384679794312, -0.8369960188865662, -0.790553629398346, -0.7441112399101257, -0.6976687908172607, -0.6512264013290405, -0.6047840118408203, -0.5583415627479553, -0.5118991732597351, -0.4654567539691925, -0.4190143346786499, -0.3725719451904297, -0.3261295258998871, -0.2796871066093445, -0.23324471712112427, -0.18680229783058167, -0.14035989344120026, -0.09391748160123825, -0.047475069761276245, -0.0010326653718948364, 0.04540973901748657, 0.09185215830802917, 0.1382945477962494, 0.184736967086792, 0.2311793714761734, 0.2776217758655548, 0.3240641951560974, 0.3705065846443176, 0.41694900393486023, 0.46339142322540283, 0.509833812713623, 0.5562762022018433, 0.6027185916900635, 0.6491610407829285, 0.6956034302711487, 0.7420458197593689, 0.7884882688522339, 0.8349306583404541, 0.8813730478286743, 0.9278154969215393]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 5.0, 6.0, 9.0, 6.0, 8.0, 7.0, 10.0, 9.0, 14.0, 13.0, 15.0, 24.0, 17.0, 19.0, 26.0, 27.0, 25.0, 35.0, 38.0, 38.0, 48.0, 32.0, 39.0, 44.0, 36.0, 45.0, 33.0, 33.0, 35.0, 31.0, 39.0, 32.0, 25.0, 21.0, 19.0, 12.0, 20.0, 16.0, 9.0, 19.0, 17.0, 10.0, 7.0, 12.0, 5.0, 7.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.4810076355934143, -0.46562087535858154, -0.4502341151237488, -0.434847354888916, -0.41946059465408325, -0.4040738344192505, -0.38868704438209534, -0.3733002841472626, -0.3579135239124298, -0.34252676367759705, -0.3271400034427643, -0.3117532432079315, -0.29636645317077637, -0.2809796929359436, -0.26559293270111084, -0.2502061724662781, -0.2348194122314453, -0.21943265199661255, -0.20404589176177979, -0.18865911662578583, -0.17327235639095306, -0.1578855961561203, -0.14249882102012634, -0.12711206078529358, -0.11172530055046082, -0.09633854031562805, -0.08095177263021469, -0.06556500494480133, -0.05017824470996857, -0.0347914844751358, -0.019404716789722443, -0.004017949104309082, 0.011368811130523682, 0.026755575090646744, 0.042142339050769806, 0.05752910301089287, 0.07291586697101593, 0.0883026272058487, 0.10368939489126205, 0.11907616257667542, 0.13446292281150818, 0.14984968304634094, 0.1652364432811737, 0.18062321841716766, 0.19600997865200043, 0.2113967388868332, 0.22678351402282715, 0.2421702742576599, 0.2575570344924927, 0.27294379472732544, 0.2883305549621582, 0.30371731519699097, 0.31910407543182373, 0.3344908356666565, 0.34987762570381165, 0.3652643859386444, 0.3806511461734772, 0.39603790640830994, 0.4114246666431427, 0.42681142687797546, 0.4421982169151306, 0.4575849771499634, 0.47297173738479614, 0.4883584976196289, 0.5037452578544617]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 1.0, 6.0, 9.0, 22.0, 20.0, 34.0, 57.0, 62.0, 102.0, 178.0, 232.0, 335.0, 487.0, 741.0, 1028.0, 1529.0, 2317.0, 3467.0, 5102.0, 7797.0, 12574.0, 23318.0, 51381.0, 118766.0, 223242.0, 260245.0, 173383.0, 80717.0, 34861.0, 17419.0, 9887.0, 6203.0, 4127.0, 2877.0, 1942.0, 1303.0, 942.0, 583.0, 415.0, 262.0, 184.0, 137.0, 83.0, 69.0, 35.0, 35.0, 20.0, 10.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1307373046875, -0.1261119842529297, -0.12148666381835938, -0.11686134338378906, -0.11223602294921875, -0.10761070251464844, -0.10298538208007812, -0.09836006164550781, -0.0937347412109375, -0.08910942077636719, -0.08448410034179688, -0.07985877990722656, -0.07523345947265625, -0.07060813903808594, -0.06598281860351562, -0.06135749816894531, -0.056732177734375, -0.05210685729980469, -0.047481536865234375, -0.04285621643066406, -0.03823089599609375, -0.03360557556152344, -0.028980255126953125, -0.024354934692382812, -0.0197296142578125, -0.015104293823242188, -0.010478973388671875, -0.0058536529541015625, -0.00122833251953125, 0.0033969879150390625, 0.008022308349609375, 0.012647628784179688, 0.01727294921875, 0.021898269653320312, 0.026523590087890625, 0.031148910522460938, 0.03577423095703125, 0.04039955139160156, 0.045024871826171875, 0.04965019226074219, 0.0542755126953125, 0.05890083312988281, 0.06352615356445312, 0.06815147399902344, 0.07277679443359375, 0.07740211486816406, 0.08202743530273438, 0.08665275573730469, 0.091278076171875, 0.09590339660644531, 0.10052871704101562, 0.10515403747558594, 0.10977935791015625, 0.11440467834472656, 0.11902999877929688, 0.12365531921386719, 0.1282806396484375, 0.1329059600830078, 0.13753128051757812, 0.14215660095214844, 0.14678192138671875, 0.15140724182128906, 0.15603256225585938, 0.1606578826904297, 0.165283203125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 14.0, 10.0, 13.0, 23.0, 14.0, 25.0, 19.0, 27.0, 30.0, 24.0, 34.0, 37.0, 42.0, 36.0, 38.0, 42.0, 44.0, 34.0, 43.0, 49.0, 40.0, 48.0, 32.0, 37.0, 36.0, 37.0, 33.0, 23.0, 29.0, 12.0, 10.0, 14.0, 8.0, 7.0, 10.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.11639404296875, -0.1134042739868164, -0.11041450500488281, -0.10742473602294922, -0.10443496704101562, -0.10144519805908203, -0.09845542907714844, -0.09546566009521484, -0.09247589111328125, -0.08948612213134766, -0.08649635314941406, -0.08350658416748047, -0.08051681518554688, -0.07752704620361328, -0.07453727722167969, -0.0715475082397461, -0.0685577392578125, -0.0655679702758789, -0.06257820129394531, -0.05958843231201172, -0.056598663330078125, -0.05360889434814453, -0.05061912536621094, -0.047629356384277344, -0.04463958740234375, -0.041649818420410156, -0.03866004943847656, -0.03567028045654297, -0.032680511474609375, -0.02969074249267578, -0.026700973510742188, -0.023711204528808594, -0.020721435546875, -0.017731666564941406, -0.014741897583007812, -0.011752128601074219, -0.008762359619140625, -0.005772590637207031, -0.0027828216552734375, 0.00020694732666015625, 0.00319671630859375, 0.006186485290527344, 0.009176254272460938, 0.012166023254394531, 0.015155792236328125, 0.01814556121826172, 0.021135330200195312, 0.024125099182128906, 0.0271148681640625, 0.030104637145996094, 0.03309440612792969, 0.03608417510986328, 0.039073944091796875, 0.04206371307373047, 0.04505348205566406, 0.048043251037597656, 0.05103302001953125, 0.054022789001464844, 0.05701255798339844, 0.06000232696533203, 0.06299209594726562, 0.06598186492919922, 0.06897163391113281, 0.0719614028930664, 0.074951171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 11.0, 11.0, 23.0, 37.0, 64.0, 108.0, 203.0, 435.0, 912.0, 2214.0, 5132.0, 12881.0, 37343.0, 169599.0, 525596.0, 222187.0, 45880.0, 15278.0, 6076.0, 2484.0, 1065.0, 500.0, 242.0, 107.0, 68.0, 36.0, 24.0, 15.0, 8.0, 4.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.374755859375, -0.36528778076171875, -0.3558197021484375, -0.34635162353515625, -0.336883544921875, -0.32741546630859375, -0.3179473876953125, -0.30847930908203125, -0.29901123046875, -0.28954315185546875, -0.2800750732421875, -0.27060699462890625, -0.261138916015625, -0.25167083740234375, -0.2422027587890625, -0.23273468017578125, -0.2232666015625, -0.21379852294921875, -0.2043304443359375, -0.19486236572265625, -0.185394287109375, -0.17592620849609375, -0.1664581298828125, -0.15699005126953125, -0.14752197265625, -0.13805389404296875, -0.1285858154296875, -0.11911773681640625, -0.109649658203125, -0.10018157958984375, -0.0907135009765625, -0.08124542236328125, -0.07177734375, -0.06230926513671875, -0.0528411865234375, -0.04337310791015625, -0.033905029296875, -0.02443695068359375, -0.0149688720703125, -0.00550079345703125, 0.00396728515625, 0.01343536376953125, 0.0229034423828125, 0.03237152099609375, 0.041839599609375, 0.05130767822265625, 0.0607757568359375, 0.07024383544921875, 0.0797119140625, 0.08917999267578125, 0.0986480712890625, 0.10811614990234375, 0.117584228515625, 0.12705230712890625, 0.1365203857421875, 0.14598846435546875, 0.15545654296875, 0.16492462158203125, 0.1743927001953125, 0.18386077880859375, 0.193328857421875, 0.20279693603515625, 0.2122650146484375, 0.22173309326171875, 0.231201171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 8.0, 9.0, 15.0, 10.0, 12.0, 18.0, 19.0, 20.0, 27.0, 36.0, 32.0, 53.0, 48.0, 51.0, 67.0, 43.0, 58.0, 51.0, 54.0, 46.0, 39.0, 25.0, 35.0, 33.0, 29.0, 32.0, 20.0, 18.0, 20.0, 16.0, 10.0, 8.0, 7.0, 8.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.327880859375, -0.31758880615234375, -0.3072967529296875, -0.29700469970703125, -0.286712646484375, -0.27642059326171875, -0.2661285400390625, -0.25583648681640625, -0.24554443359375, -0.23525238037109375, -0.2249603271484375, -0.21466827392578125, -0.204376220703125, -0.19408416748046875, -0.1837921142578125, -0.17350006103515625, -0.1632080078125, -0.15291595458984375, -0.1426239013671875, -0.13233184814453125, -0.122039794921875, -0.11174774169921875, -0.1014556884765625, -0.09116363525390625, -0.08087158203125, -0.07057952880859375, -0.0602874755859375, -0.04999542236328125, -0.039703369140625, -0.02941131591796875, -0.0191192626953125, -0.00882720947265625, 0.00146484375, 0.01175689697265625, 0.0220489501953125, 0.03234100341796875, 0.042633056640625, 0.05292510986328125, 0.0632171630859375, 0.07350921630859375, 0.08380126953125, 0.09409332275390625, 0.1043853759765625, 0.11467742919921875, 0.124969482421875, 0.13526153564453125, 0.1455535888671875, 0.15584564208984375, 0.1661376953125, 0.17642974853515625, 0.1867218017578125, 0.19701385498046875, 0.207305908203125, 0.21759796142578125, 0.2278900146484375, 0.23818206787109375, 0.24847412109375, 0.25876617431640625, 0.2690582275390625, 0.27935028076171875, 0.289642333984375, 0.29993438720703125, 0.3102264404296875, 0.32051849365234375, 0.330810546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 21.0, 29.0, 45.0, 94.0, 126.0, 231.0, 401.0, 736.0, 1346.0, 2486.0, 4461.0, 8680.0, 16961.0, 36191.0, 88717.0, 219649.0, 327593.0, 197866.0, 78319.0, 32276.0, 15221.0, 7797.0, 4222.0, 2183.0, 1219.0, 698.0, 414.0, 221.0, 134.0, 81.0, 64.0, 26.0, 19.0, 9.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07550048828125, -0.0732421875, -0.07098388671875, -0.0687255859375, -0.06646728515625, -0.064208984375, -0.06195068359375, -0.0596923828125, -0.05743408203125, -0.05517578125, -0.05291748046875, -0.0506591796875, -0.04840087890625, -0.046142578125, -0.04388427734375, -0.0416259765625, -0.03936767578125, -0.037109375, -0.03485107421875, -0.0325927734375, -0.03033447265625, -0.028076171875, -0.02581787109375, -0.0235595703125, -0.02130126953125, -0.01904296875, -0.01678466796875, -0.0145263671875, -0.01226806640625, -0.010009765625, -0.00775146484375, -0.0054931640625, -0.00323486328125, -0.0009765625, 0.00128173828125, 0.0035400390625, 0.00579833984375, 0.008056640625, 0.01031494140625, 0.0125732421875, 0.01483154296875, 0.01708984375, 0.01934814453125, 0.0216064453125, 0.02386474609375, 0.026123046875, 0.02838134765625, 0.0306396484375, 0.03289794921875, 0.03515625, 0.03741455078125, 0.0396728515625, 0.04193115234375, 0.044189453125, 0.04644775390625, 0.0487060546875, 0.05096435546875, 0.05322265625, 0.05548095703125, 0.0577392578125, 0.05999755859375, 0.062255859375, 0.06451416015625, 0.0667724609375, 0.06903076171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 6.0, 11.0, 16.0, 17.0, 12.0, 19.0, 37.0, 49.0, 62.0, 80.0, 97.0, 109.0, 106.0, 86.0, 87.0, 52.0, 28.0, 18.0, 30.0, 21.0, 9.0, 6.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.771615982055664e-05, -2.6747584342956543e-05, -2.5779008865356445e-05, -2.4810433387756348e-05, -2.384185791015625e-05, -2.2873282432556152e-05, -2.1904706954956055e-05, -2.0936131477355957e-05, -1.996755599975586e-05, -1.8998980522155762e-05, -1.8030405044555664e-05, -1.7061829566955566e-05, -1.609325408935547e-05, -1.5124678611755371e-05, -1.4156103134155273e-05, -1.3187527656555176e-05, -1.2218952178955078e-05, -1.125037670135498e-05, -1.0281801223754883e-05, -9.313225746154785e-06, -8.344650268554688e-06, -7.37607479095459e-06, -6.407499313354492e-06, -5.4389238357543945e-06, -4.470348358154297e-06, -3.5017728805541992e-06, -2.5331974029541016e-06, -1.564621925354004e-06, -5.960464477539062e-07, 3.725290298461914e-07, 1.341104507446289e-06, 2.3096799850463867e-06, 3.2782554626464844e-06, 4.246830940246582e-06, 5.21540641784668e-06, 6.183981895446777e-06, 7.152557373046875e-06, 8.121132850646973e-06, 9.08970832824707e-06, 1.0058283805847168e-05, 1.1026859283447266e-05, 1.1995434761047363e-05, 1.2964010238647461e-05, 1.3932585716247559e-05, 1.4901161193847656e-05, 1.5869736671447754e-05, 1.683831214904785e-05, 1.780688762664795e-05, 1.8775463104248047e-05, 1.9744038581848145e-05, 2.0712614059448242e-05, 2.168118953704834e-05, 2.2649765014648438e-05, 2.3618340492248535e-05, 2.4586915969848633e-05, 2.555549144744873e-05, 2.6524066925048828e-05, 2.7492642402648926e-05, 2.8461217880249023e-05, 2.942979335784912e-05, 3.039836883544922e-05, 3.1366944313049316e-05, 3.2335519790649414e-05, 3.330409526824951e-05, 3.427267074584961e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 1.0, 4.0, 16.0, 11.0, 23.0, 23.0, 46.0, 72.0, 106.0, 183.0, 293.0, 459.0, 852.0, 1558.0, 2869.0, 5640.0, 11152.0, 22688.0, 46818.0, 96577.0, 182797.0, 249812.0, 204327.0, 113350.0, 55195.0, 26475.0, 13118.0, 6680.0, 3270.0, 1784.0, 934.0, 576.0, 307.0, 195.0, 129.0, 81.0, 44.0, 27.0, 19.0, 17.0, 11.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.05682373046875, -0.05508136749267578, -0.05333900451660156, -0.051596641540527344, -0.049854278564453125, -0.048111915588378906, -0.04636955261230469, -0.04462718963623047, -0.04288482666015625, -0.04114246368408203, -0.03940010070800781, -0.037657737731933594, -0.035915374755859375, -0.034173011779785156, -0.03243064880371094, -0.03068828582763672, -0.0289459228515625, -0.02720355987548828, -0.025461196899414062, -0.023718833923339844, -0.021976470947265625, -0.020234107971191406, -0.018491744995117188, -0.01674938201904297, -0.01500701904296875, -0.013264656066894531, -0.011522293090820312, -0.009779930114746094, -0.008037567138671875, -0.006295204162597656, -0.0045528411865234375, -0.0028104782104492188, -0.001068115234375, 0.0006742477416992188, 0.0024166107177734375, 0.004158973693847656, 0.005901336669921875, 0.007643699645996094, 0.009386062622070312, 0.011128425598144531, 0.01287078857421875, 0.014613151550292969, 0.016355514526367188, 0.018097877502441406, 0.019840240478515625, 0.021582603454589844, 0.023324966430664062, 0.02506732940673828, 0.0268096923828125, 0.02855205535888672, 0.030294418334960938, 0.032036781311035156, 0.033779144287109375, 0.035521507263183594, 0.03726387023925781, 0.03900623321533203, 0.04074859619140625, 0.04249095916748047, 0.04423332214355469, 0.045975685119628906, 0.047718048095703125, 0.049460411071777344, 0.05120277404785156, 0.05294513702392578, 0.0546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 7.0, 8.0, 9.0, 7.0, 13.0, 14.0, 15.0, 27.0, 20.0, 32.0, 34.0, 30.0, 45.0, 46.0, 56.0, 50.0, 53.0, 53.0, 43.0, 50.0, 52.0, 57.0, 40.0, 46.0, 33.0, 23.0, 24.0, 18.0, 15.0, 14.0, 16.0, 5.0, 8.0, 6.0, 2.0, 2.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.055999755859375, -0.05411195755004883, -0.052224159240722656, -0.050336360931396484, -0.04844856262207031, -0.04656076431274414, -0.04467296600341797, -0.0427851676940918, -0.040897369384765625, -0.03900957107543945, -0.03712177276611328, -0.03523397445678711, -0.03334617614746094, -0.031458377838134766, -0.029570579528808594, -0.027682781219482422, -0.02579498291015625, -0.023907184600830078, -0.022019386291503906, -0.020131587982177734, -0.018243789672851562, -0.01635599136352539, -0.014468193054199219, -0.012580394744873047, -0.010692596435546875, -0.008804798126220703, -0.006916999816894531, -0.005029201507568359, -0.0031414031982421875, -0.0012536048889160156, 0.0006341934204101562, 0.002521991729736328, 0.0044097900390625, 0.006297588348388672, 0.008185386657714844, 0.010073184967041016, 0.011960983276367188, 0.01384878158569336, 0.01573657989501953, 0.017624378204345703, 0.019512176513671875, 0.021399974822998047, 0.02328777313232422, 0.02517557144165039, 0.027063369750976562, 0.028951168060302734, 0.030838966369628906, 0.03272676467895508, 0.03461456298828125, 0.03650236129760742, 0.038390159606933594, 0.040277957916259766, 0.04216575622558594, 0.04405355453491211, 0.04594135284423828, 0.04782915115356445, 0.049716949462890625, 0.0516047477722168, 0.05349254608154297, 0.05538034439086914, 0.05726814270019531, 0.059155941009521484, 0.061043739318847656, 0.06293153762817383, 0.0648193359375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 13.0, 19.0, 26.0, 42.0, 89.0, 94.0, 163.0, 180.0, 133.0, 93.0, 75.0, 37.0, 20.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0], "bins": [-2.639861583709717, -2.589292287826538, -2.5387229919433594, -2.4881536960601807, -2.437584400177002, -2.3870153427124023, -2.3364458084106445, -2.285876750946045, -2.235307455062866, -2.1847381591796875, -2.134168863296509, -2.08359956741333, -2.0330302715301514, -1.9824610948562622, -1.9318917989730835, -1.8813225030899048, -1.830753207206726, -1.7801839113235474, -1.7296146154403687, -1.6790454387664795, -1.6284761428833008, -1.577906847000122, -1.5273375511169434, -1.4767682552337646, -1.426198959350586, -1.3756296634674072, -1.3250603675842285, -1.2744910717010498, -1.2239218950271606, -1.173352599143982, -1.1227833032608032, -1.0722140073776245, -1.0216448307037354, -0.9710755348205566, -0.9205062985420227, -0.869937002658844, -0.8193677663803101, -0.7687984704971313, -0.7182291746139526, -0.6676598787307739, -0.61709064245224, -0.5665213465690613, -0.5159521102905273, -0.46538281440734863, -0.4148135483264923, -0.364244282245636, -0.3136749863624573, -0.26310572028160095, -0.21253645420074463, -0.1619671881198883, -0.11139790713787079, -0.06082862615585327, -0.010259360074996948, 0.040309906005859375, 0.09087920188903809, 0.1414484679698944, 0.19201773405075073, 0.24258700013160706, 0.2931562662124634, 0.3437255620956421, 0.3942948281764984, 0.44486409425735474, 0.49543339014053345, 0.5460026264190674, 0.5965719223022461]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 6.0, 8.0, 7.0, 10.0, 13.0, 8.0, 17.0, 21.0, 16.0, 23.0, 30.0, 27.0, 29.0, 36.0, 35.0, 50.0, 50.0, 44.0, 47.0, 47.0, 39.0, 37.0, 43.0, 40.0, 38.0, 37.0, 35.0, 35.0, 37.0, 25.0, 11.0, 23.0, 12.0, 12.0, 12.0, 6.0, 6.0, 12.0, 5.0, 5.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6483940482139587, -0.6258418560028076, -0.6032896637916565, -0.5807374715805054, -0.558185338973999, -0.5356331467628479, -0.5130809545516968, -0.49052876234054565, -0.4679765999317169, -0.4454244077205658, -0.42287224531173706, -0.40032005310058594, -0.3777678608894348, -0.3552156984806061, -0.33266350626945496, -0.3101113438606262, -0.2875591516494751, -0.265006959438324, -0.24245479702949524, -0.21990260481834412, -0.1973504275083542, -0.17479825019836426, -0.15224605798721313, -0.1296938806772232, -0.10714170336723328, -0.08458952605724335, -0.06203734129667282, -0.039485156536102295, -0.016932979226112366, 0.0056191980838775635, 0.028171390295028687, 0.050723567605018616, 0.07327568531036377, 0.0958278626203537, 0.11838004738092422, 0.14093223214149475, 0.16348440945148468, 0.1860365867614746, 0.20858877897262573, 0.23114095628261566, 0.2536931335926056, 0.2762453258037567, 0.29879748821258545, 0.3213496804237366, 0.3439018726348877, 0.36645403504371643, 0.38900622725486755, 0.4115583896636963, 0.4341105818748474, 0.45666277408599854, 0.47921493649482727, 0.5017671585083008, 0.5243192911148071, 0.5468714833259583, 0.5694236755371094, 0.5919758677482605, 0.6145280599594116, 0.6370802521705627, 0.6596324443817139, 0.6821845769882202, 0.7047367691993713, 0.7272889614105225, 0.7498411536216736, 0.7723933458328247, 0.794945478439331]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 10.0, 8.0, 11.0, 10.0, 30.0, 35.0, 49.0, 68.0, 110.0, 158.0, 220.0, 352.0, 501.0, 824.0, 1204.0, 1824.0, 3010.0, 5053.0, 8500.0, 14974.0, 28347.0, 57062.0, 122208.0, 277363.0, 611958.0, 1094886.0, 1004432.0, 519785.0, 231717.0, 103538.0, 48887.0, 24340.0, 13193.0, 7354.0, 4509.0, 2759.0, 1686.0, 1084.0, 751.0, 425.0, 325.0, 220.0, 145.0, 104.0, 84.0, 52.0, 40.0, 32.0, 20.0, 12.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 4.0], "bins": [-0.08782958984375, -0.08507537841796875, -0.0823211669921875, -0.07956695556640625, -0.076812744140625, -0.07405853271484375, -0.0713043212890625, -0.06855010986328125, -0.0657958984375, -0.06304168701171875, -0.0602874755859375, -0.05753326416015625, -0.054779052734375, -0.05202484130859375, -0.0492706298828125, -0.04651641845703125, -0.04376220703125, -0.04100799560546875, -0.0382537841796875, -0.03549957275390625, -0.032745361328125, -0.02999114990234375, -0.0272369384765625, -0.02448272705078125, -0.021728515625, -0.01897430419921875, -0.0162200927734375, -0.01346588134765625, -0.010711669921875, -0.00795745849609375, -0.0052032470703125, -0.00244903564453125, 0.00030517578125, 0.00305938720703125, 0.0058135986328125, 0.00856781005859375, 0.011322021484375, 0.01407623291015625, 0.0168304443359375, 0.01958465576171875, 0.0223388671875, 0.02509307861328125, 0.0278472900390625, 0.03060150146484375, 0.033355712890625, 0.03610992431640625, 0.0388641357421875, 0.04161834716796875, 0.04437255859375, 0.04712677001953125, 0.0498809814453125, 0.05263519287109375, 0.055389404296875, 0.05814361572265625, 0.0608978271484375, 0.06365203857421875, 0.06640625, 0.06916046142578125, 0.0719146728515625, 0.07466888427734375, 0.077423095703125, 0.08017730712890625, 0.0829315185546875, 0.08568572998046875, 0.08843994140625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 3.0, 4.0, 8.0, 10.0, 7.0, 10.0, 12.0, 10.0, 13.0, 23.0, 26.0, 15.0, 33.0, 31.0, 41.0, 39.0, 47.0, 44.0, 57.0, 45.0, 42.0, 45.0, 44.0, 45.0, 27.0, 35.0, 43.0, 32.0, 30.0, 30.0, 36.0, 31.0, 13.0, 21.0, 10.0, 12.0, 4.0, 3.0, 6.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08526611328125, -0.0822153091430664, -0.07916450500488281, -0.07611370086669922, -0.07306289672851562, -0.07001209259033203, -0.06696128845214844, -0.06391048431396484, -0.06085968017578125, -0.057808876037597656, -0.05475807189941406, -0.05170726776123047, -0.048656463623046875, -0.04560565948486328, -0.04255485534667969, -0.039504051208496094, -0.0364532470703125, -0.033402442932128906, -0.030351638793945312, -0.02730083465576172, -0.024250030517578125, -0.02119922637939453, -0.018148422241210938, -0.015097618103027344, -0.01204681396484375, -0.008996009826660156, -0.0059452056884765625, -0.0028944015502929688, 0.000156402587890625, 0.0032072067260742188, 0.0062580108642578125, 0.009308815002441406, 0.012359619140625, 0.015410423278808594, 0.018461227416992188, 0.02151203155517578, 0.024562835693359375, 0.02761363983154297, 0.030664443969726562, 0.033715248107910156, 0.03676605224609375, 0.039816856384277344, 0.04286766052246094, 0.04591846466064453, 0.048969268798828125, 0.05202007293701172, 0.05507087707519531, 0.058121681213378906, 0.0611724853515625, 0.0642232894897461, 0.06727409362792969, 0.07032489776611328, 0.07337570190429688, 0.07642650604248047, 0.07947731018066406, 0.08252811431884766, 0.08557891845703125, 0.08862972259521484, 0.09168052673339844, 0.09473133087158203, 0.09778213500976562, 0.10083293914794922, 0.10388374328613281, 0.1069345474243164, 0.1099853515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 11.0, 11.0, 16.0, 20.0, 28.0, 29.0, 45.0, 68.0, 113.0, 155.0, 209.0, 381.0, 625.0, 1248.0, 2502.0, 5996.0, 18091.0, 70454.0, 421495.0, 2643435.0, 866584.0, 120107.0, 27212.0, 8508.0, 3350.0, 1543.0, 770.0, 421.0, 281.0, 175.0, 129.0, 83.0, 58.0, 42.0, 18.0, 21.0, 14.0, 13.0, 5.0, 7.0, 4.0, 3.0, 0.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2548828125, -0.24683380126953125, -0.2387847900390625, -0.23073577880859375, -0.222686767578125, -0.21463775634765625, -0.2065887451171875, -0.19853973388671875, -0.19049072265625, -0.18244171142578125, -0.1743927001953125, -0.16634368896484375, -0.158294677734375, -0.15024566650390625, -0.1421966552734375, -0.13414764404296875, -0.1260986328125, -0.11804962158203125, -0.1100006103515625, -0.10195159912109375, -0.093902587890625, -0.08585357666015625, -0.0778045654296875, -0.06975555419921875, -0.06170654296875, -0.05365753173828125, -0.0456085205078125, -0.03755950927734375, -0.029510498046875, -0.02146148681640625, -0.0134124755859375, -0.00536346435546875, 0.002685546875, 0.01073455810546875, 0.0187835693359375, 0.02683258056640625, 0.034881591796875, 0.04293060302734375, 0.0509796142578125, 0.05902862548828125, 0.06707763671875, 0.07512664794921875, 0.0831756591796875, 0.09122467041015625, 0.099273681640625, 0.10732269287109375, 0.1153717041015625, 0.12342071533203125, 0.1314697265625, 0.13951873779296875, 0.1475677490234375, 0.15561676025390625, 0.163665771484375, 0.17171478271484375, 0.1797637939453125, 0.18781280517578125, 0.19586181640625, 0.20391082763671875, 0.2119598388671875, 0.22000885009765625, 0.228057861328125, 0.23610687255859375, 0.2441558837890625, 0.25220489501953125, 0.26025390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 6.0, 8.0, 8.0, 18.0, 28.0, 52.0, 62.0, 113.0, 213.0, 293.0, 508.0, 808.0, 769.0, 453.0, 290.0, 172.0, 91.0, 59.0, 41.0, 28.0, 23.0, 6.0, 4.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28759765625, -0.2785758972167969, -0.26955413818359375, -0.2605323791503906, -0.2515106201171875, -0.24248886108398438, -0.23346710205078125, -0.22444534301757812, -0.215423583984375, -0.20640182495117188, -0.19738006591796875, -0.18835830688476562, -0.1793365478515625, -0.17031478881835938, -0.16129302978515625, -0.15227127075195312, -0.14324951171875, -0.13422775268554688, -0.12520599365234375, -0.11618423461914062, -0.1071624755859375, -0.09814071655273438, -0.08911895751953125, -0.08009719848632812, -0.071075439453125, -0.062053680419921875, -0.05303192138671875, -0.044010162353515625, -0.0349884033203125, -0.025966644287109375, -0.01694488525390625, -0.007923126220703125, 0.0010986328125, 0.010120391845703125, 0.01914215087890625, 0.028163909912109375, 0.0371856689453125, 0.046207427978515625, 0.05522918701171875, 0.06425094604492188, 0.073272705078125, 0.08229446411132812, 0.09131622314453125, 0.10033798217773438, 0.1093597412109375, 0.11838150024414062, 0.12740325927734375, 0.13642501831054688, 0.14544677734375, 0.15446853637695312, 0.16349029541015625, 0.17251205444335938, 0.1815338134765625, 0.19055557250976562, 0.19957733154296875, 0.20859909057617188, 0.217620849609375, 0.22664260864257812, 0.23566436767578125, 0.24468612670898438, 0.2537078857421875, 0.2627296447753906, 0.27175140380859375, 0.2807731628417969, 0.289794921875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 27.0, 41.0, 102.0, 158.0, 207.0, 211.0, 121.0, 83.0, 25.0, 15.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.111668109893799, -3.0405683517456055, -2.969468355178833, -2.8983685970306396, -2.8272688388824463, -2.756168842315674, -2.6850690841674805, -2.613969326019287, -2.5428695678710938, -2.4717698097229004, -2.400669813156128, -2.3295700550079346, -2.258470296859741, -2.1873703002929688, -2.1162705421447754, -2.045170783996582, -1.9740707874298096, -1.9029709100723267, -1.8318711519241333, -1.7607712745666504, -1.689671516418457, -1.6185716390609741, -1.5474717617034912, -1.4763720035552979, -1.405272126197815, -1.334172248840332, -1.2630724906921387, -1.1919726133346558, -1.1208727359771729, -1.0497729778289795, -0.9786731004714966, -0.9075732827186584, -0.8364734649658203, -0.7653736472129822, -0.694273829460144, -0.6231739521026611, -0.552074134349823, -0.48097431659698486, -0.40987446904182434, -0.3387746214866638, -0.2676748037338257, -0.19657497107982635, -0.12547513842582703, -0.0543753057718277, 0.01672452688217163, 0.08782434463500977, 0.1589241921901703, 0.2300240397453308, 0.30112385749816895, 0.3722236752510071, 0.4433235228061676, 0.5144233703613281, 0.5855231881141663, 0.6566230058670044, 0.7277228832244873, 0.7988227009773254, 0.8699225187301636, 0.9410223364830017, 1.0121221542358398, 1.0832220315933228, 1.1543219089508057, 1.225421667098999, 1.296521544456482, 1.3676214218139648, 1.4387211799621582]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 11.0, 5.0, 13.0, 15.0, 14.0, 13.0, 18.0, 14.0, 16.0, 26.0, 22.0, 17.0, 34.0, 21.0, 30.0, 31.0, 45.0, 29.0, 39.0, 35.0, 30.0, 43.0, 28.0, 41.0, 36.0, 34.0, 31.0, 36.0, 19.0, 23.0, 24.0, 28.0, 20.0, 12.0, 23.0, 14.0, 12.0, 17.0, 11.0, 7.0, 11.0, 6.0, 9.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.46974408626556396, -0.45374083518981934, -0.4377375841140747, -0.4217343330383301, -0.40573111176490784, -0.3897278606891632, -0.3737246096134186, -0.35772135853767395, -0.3417181372642517, -0.3257148861885071, -0.30971163511276245, -0.2937083840370178, -0.2777051627635956, -0.26170191168785095, -0.24569866061210632, -0.2296954095363617, -0.21369215846061707, -0.19768890738487244, -0.181685671210289, -0.16568242013454437, -0.14967918395996094, -0.1336759328842163, -0.11767268180847168, -0.10166943818330765, -0.08566619455814362, -0.06966295093297958, -0.05365970358252525, -0.03765645623207092, -0.02165321260690689, -0.005649968981742859, 0.01035328209400177, 0.026356525719165802, 0.042359769344329834, 0.058363012969493866, 0.0743662565946579, 0.09036950767040253, 0.10637275129556656, 0.12237599492073059, 0.13837924599647522, 0.15438249707221985, 0.17038573324680328, 0.1863889843225479, 0.20239222049713135, 0.21839547157287598, 0.2343987226486206, 0.25040197372436523, 0.26640522480010986, 0.2824084460735321, 0.29841169714927673, 0.31441494822502136, 0.330418199300766, 0.34642142057418823, 0.36242467164993286, 0.3784279227256775, 0.3944311738014221, 0.41043442487716675, 0.4264376759529114, 0.442440927028656, 0.45844417810440063, 0.47444742918014526, 0.4904506504535675, 0.5064538717269897, 0.5224571228027344, 0.538460373878479, 0.5544636249542236]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 8.0, 11.0, 11.0, 23.0, 40.0, 51.0, 73.0, 100.0, 139.0, 213.0, 321.0, 444.0, 666.0, 1067.0, 1639.0, 2610.0, 4372.0, 7869.0, 15786.0, 36826.0, 92988.0, 208426.0, 293423.0, 212481.0, 95275.0, 37532.0, 16256.0, 8002.0, 4425.0, 2677.0, 1603.0, 1055.0, 685.0, 467.0, 308.0, 189.0, 151.0, 100.0, 63.0, 38.0, 48.0, 25.0, 19.0, 17.0, 8.0, 9.0, 1.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.15673828125, -0.15160179138183594, -0.14646530151367188, -0.1413288116455078, -0.13619232177734375, -0.1310558319091797, -0.12591934204101562, -0.12078285217285156, -0.1156463623046875, -0.11050987243652344, -0.10537338256835938, -0.10023689270019531, -0.09510040283203125, -0.08996391296386719, -0.08482742309570312, -0.07969093322753906, -0.074554443359375, -0.06941795349121094, -0.06428146362304688, -0.05914497375488281, -0.05400848388671875, -0.04887199401855469, -0.043735504150390625, -0.03859901428222656, -0.0334625244140625, -0.028326034545898438, -0.023189544677734375, -0.018053054809570312, -0.01291656494140625, -0.0077800750732421875, -0.002643585205078125, 0.0024929046630859375, 0.00762939453125, 0.012765884399414062, 0.017902374267578125, 0.023038864135742188, 0.02817535400390625, 0.03331184387207031, 0.038448333740234375, 0.04358482360839844, 0.0487213134765625, 0.05385780334472656, 0.058994293212890625, 0.06413078308105469, 0.06926727294921875, 0.07440376281738281, 0.07954025268554688, 0.08467674255371094, 0.089813232421875, 0.09494972229003906, 0.10008621215820312, 0.10522270202636719, 0.11035919189453125, 0.11549568176269531, 0.12063217163085938, 0.12576866149902344, 0.1309051513671875, 0.13604164123535156, 0.14117813110351562, 0.1463146209716797, 0.15145111083984375, 0.1565876007080078, 0.16172409057617188, 0.16686058044433594, 0.1719970703125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 10.0, 13.0, 12.0, 18.0, 15.0, 21.0, 23.0, 41.0, 26.0, 41.0, 36.0, 42.0, 38.0, 39.0, 49.0, 42.0, 48.0, 37.0, 51.0, 44.0, 32.0, 39.0, 29.0, 41.0, 28.0, 32.0, 28.0, 15.0, 20.0, 14.0, 12.0, 12.0, 5.0, 12.0, 8.0, 2.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.11407470703125, -0.11064624786376953, -0.10721778869628906, -0.1037893295288086, -0.10036087036132812, -0.09693241119384766, -0.09350395202636719, -0.09007549285888672, -0.08664703369140625, -0.08321857452392578, -0.07979011535644531, -0.07636165618896484, -0.07293319702148438, -0.0695047378540039, -0.06607627868652344, -0.06264781951904297, -0.0592193603515625, -0.05579090118408203, -0.05236244201660156, -0.048933982849121094, -0.045505523681640625, -0.042077064514160156, -0.03864860534667969, -0.03522014617919922, -0.03179168701171875, -0.02836322784423828, -0.024934768676757812, -0.021506309509277344, -0.018077850341796875, -0.014649391174316406, -0.011220932006835938, -0.007792472839355469, -0.004364013671875, -0.0009355545043945312, 0.0024929046630859375, 0.005921363830566406, 0.009349822998046875, 0.012778282165527344, 0.016206741333007812, 0.01963520050048828, 0.02306365966796875, 0.02649211883544922, 0.029920578002929688, 0.033349037170410156, 0.036777496337890625, 0.040205955505371094, 0.04363441467285156, 0.04706287384033203, 0.0504913330078125, 0.05391979217529297, 0.05734825134277344, 0.060776710510253906, 0.06420516967773438, 0.06763362884521484, 0.07106208801269531, 0.07449054718017578, 0.07791900634765625, 0.08134746551513672, 0.08477592468261719, 0.08820438385009766, 0.09163284301757812, 0.0950613021850586, 0.09848976135253906, 0.10191822052001953, 0.1053466796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 4.0, 11.0, 18.0, 27.0, 33.0, 52.0, 78.0, 111.0, 208.0, 334.0, 543.0, 846.0, 1446.0, 2387.0, 4281.0, 8031.0, 16381.0, 38506.0, 100168.0, 231187.0, 310205.0, 194018.0, 79263.0, 30981.0, 13502.0, 6740.0, 3758.0, 2118.0, 1280.0, 733.0, 465.0, 283.0, 185.0, 113.0, 79.0, 55.0, 40.0, 36.0, 15.0, 10.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.153564453125, -0.14867019653320312, -0.14377593994140625, -0.13888168334960938, -0.1339874267578125, -0.12909317016601562, -0.12419891357421875, -0.11930465698242188, -0.114410400390625, -0.10951614379882812, -0.10462188720703125, -0.09972763061523438, -0.0948333740234375, -0.08993911743164062, -0.08504486083984375, -0.08015060424804688, -0.07525634765625, -0.07036209106445312, -0.06546783447265625, -0.060573577880859375, -0.0556793212890625, -0.050785064697265625, -0.04589080810546875, -0.040996551513671875, -0.036102294921875, -0.031208038330078125, -0.02631378173828125, -0.021419525146484375, -0.0165252685546875, -0.011631011962890625, -0.00673675537109375, -0.001842498779296875, 0.0030517578125, 0.007946014404296875, 0.01284027099609375, 0.017734527587890625, 0.0226287841796875, 0.027523040771484375, 0.03241729736328125, 0.037311553955078125, 0.042205810546875, 0.047100067138671875, 0.05199432373046875, 0.056888580322265625, 0.0617828369140625, 0.06667709350585938, 0.07157135009765625, 0.07646560668945312, 0.08135986328125, 0.08625411987304688, 0.09114837646484375, 0.09604263305664062, 0.1009368896484375, 0.10583114624023438, 0.11072540283203125, 0.11561965942382812, 0.120513916015625, 0.12540817260742188, 0.13030242919921875, 0.13519668579101562, 0.1400909423828125, 0.14498519897460938, 0.14987945556640625, 0.15477371215820312, 0.15966796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 12.0, 6.0, 14.0, 9.0, 10.0, 9.0, 19.0, 17.0, 26.0, 30.0, 30.0, 26.0, 44.0, 53.0, 42.0, 36.0, 42.0, 58.0, 53.0, 44.0, 47.0, 57.0, 42.0, 40.0, 37.0, 28.0, 34.0, 29.0, 23.0, 18.0, 12.0, 11.0, 10.0, 10.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35791015625, -0.3475914001464844, -0.33727264404296875, -0.3269538879394531, -0.3166351318359375, -0.3063163757324219, -0.29599761962890625, -0.2856788635253906, -0.275360107421875, -0.2650413513183594, -0.25472259521484375, -0.24440383911132812, -0.2340850830078125, -0.22376632690429688, -0.21344757080078125, -0.20312881469726562, -0.19281005859375, -0.18249130249023438, -0.17217254638671875, -0.16185379028320312, -0.1515350341796875, -0.14121627807617188, -0.13089752197265625, -0.12057876586914062, -0.110260009765625, -0.09994125366210938, -0.08962249755859375, -0.07930374145507812, -0.0689849853515625, -0.058666229248046875, -0.04834747314453125, -0.038028717041015625, -0.0277099609375, -0.017391204833984375, -0.00707244873046875, 0.003246307373046875, 0.0135650634765625, 0.023883819580078125, 0.03420257568359375, 0.044521331787109375, 0.054840087890625, 0.06515884399414062, 0.07547760009765625, 0.08579635620117188, 0.0961151123046875, 0.10643386840820312, 0.11675262451171875, 0.12707138061523438, 0.13739013671875, 0.14770889282226562, 0.15802764892578125, 0.16834640502929688, 0.1786651611328125, 0.18898391723632812, 0.19930267333984375, 0.20962142944335938, 0.219940185546875, 0.23025894165039062, 0.24057769775390625, 0.2508964538574219, 0.2612152099609375, 0.2715339660644531, 0.28185272216796875, 0.2921714782714844, 0.302490234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 11.0, 19.0, 22.0, 38.0, 38.0, 55.0, 77.0, 150.0, 184.0, 286.0, 440.0, 621.0, 1010.0, 1533.0, 2452.0, 4015.0, 6662.0, 11651.0, 20901.0, 41454.0, 89196.0, 191764.0, 282715.0, 201720.0, 94941.0, 43991.0, 22169.0, 11911.0, 6783.0, 4353.0, 2595.0, 1638.0, 1043.0, 723.0, 413.0, 334.0, 211.0, 132.0, 101.0, 64.0, 45.0, 35.0, 27.0, 9.0, 10.0, 5.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.055877685546875, -0.05416059494018555, -0.052443504333496094, -0.05072641372680664, -0.04900932312011719, -0.047292232513427734, -0.04557514190673828, -0.04385805130004883, -0.042140960693359375, -0.04042387008666992, -0.03870677947998047, -0.036989688873291016, -0.03527259826660156, -0.03355550765991211, -0.031838417053222656, -0.030121326446533203, -0.02840423583984375, -0.026687145233154297, -0.024970054626464844, -0.02325296401977539, -0.021535873413085938, -0.019818782806396484, -0.01810169219970703, -0.016384601593017578, -0.014667510986328125, -0.012950420379638672, -0.011233329772949219, -0.009516239166259766, -0.0077991485595703125, -0.006082057952880859, -0.004364967346191406, -0.002647876739501953, -0.0009307861328125, 0.0007863044738769531, 0.0025033950805664062, 0.004220485687255859, 0.0059375762939453125, 0.007654666900634766, 0.009371757507324219, 0.011088848114013672, 0.012805938720703125, 0.014523029327392578, 0.01624011993408203, 0.017957210540771484, 0.019674301147460938, 0.02139139175415039, 0.023108482360839844, 0.024825572967529297, 0.02654266357421875, 0.028259754180908203, 0.029976844787597656, 0.03169393539428711, 0.03341102600097656, 0.035128116607666016, 0.03684520721435547, 0.03856229782104492, 0.040279388427734375, 0.04199647903442383, 0.04371356964111328, 0.045430660247802734, 0.04714775085449219, 0.04886484146118164, 0.050581932067871094, 0.05229902267456055, 0.05401611328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 9.0, 9.0, 17.0, 30.0, 51.0, 78.0, 101.0, 129.0, 147.0, 115.0, 90.0, 62.0, 48.0, 31.0, 17.0, 5.0, 9.0, 6.0, 8.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-5.2809715270996094e-05, -5.150213837623596e-05, -5.019456148147583e-05, -4.88869845867157e-05, -4.7579407691955566e-05, -4.6271830797195435e-05, -4.49642539024353e-05, -4.365667700767517e-05, -4.234910011291504e-05, -4.104152321815491e-05, -3.9733946323394775e-05, -3.8426369428634644e-05, -3.711879253387451e-05, -3.581121563911438e-05, -3.450363874435425e-05, -3.3196061849594116e-05, -3.1888484954833984e-05, -3.058090806007385e-05, -2.927333116531372e-05, -2.796575427055359e-05, -2.6658177375793457e-05, -2.5350600481033325e-05, -2.4043023586273193e-05, -2.273544669151306e-05, -2.142786979675293e-05, -2.0120292901992798e-05, -1.8812716007232666e-05, -1.7505139112472534e-05, -1.6197562217712402e-05, -1.488998532295227e-05, -1.3582408428192139e-05, -1.2274831533432007e-05, -1.0967254638671875e-05, -9.659677743911743e-06, -8.352100849151611e-06, -7.0445239543914795e-06, -5.736947059631348e-06, -4.429370164871216e-06, -3.121793270111084e-06, -1.8142163753509521e-06, -5.066394805908203e-07, 8.009374141693115e-07, 2.1085143089294434e-06, 3.416091203689575e-06, 4.723668098449707e-06, 6.031244993209839e-06, 7.338821887969971e-06, 8.646398782730103e-06, 9.953975677490234e-06, 1.1261552572250366e-05, 1.2569129467010498e-05, 1.387670636177063e-05, 1.5184283256530762e-05, 1.6491860151290894e-05, 1.7799437046051025e-05, 1.9107013940811157e-05, 2.041459083557129e-05, 2.172216773033142e-05, 2.3029744625091553e-05, 2.4337321519851685e-05, 2.5644898414611816e-05, 2.6952475309371948e-05, 2.826005220413208e-05, 2.9567629098892212e-05, 3.0875205993652344e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 0.0, 3.0, 8.0, 11.0, 6.0, 16.0, 22.0, 24.0, 52.0, 64.0, 118.0, 150.0, 202.0, 335.0, 550.0, 812.0, 1539.0, 2767.0, 4981.0, 9648.0, 19505.0, 42603.0, 100612.0, 221547.0, 299379.0, 190346.0, 82783.0, 35430.0, 16618.0, 8148.0, 4343.0, 2410.0, 1346.0, 821.0, 479.0, 264.0, 209.0, 130.0, 80.0, 60.0, 45.0, 24.0, 18.0, 15.0, 15.0, 4.0, 6.0, 4.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.06658935546875, -0.06465291976928711, -0.06271648406982422, -0.06078004837036133, -0.05884361267089844, -0.05690717697143555, -0.054970741271972656, -0.053034305572509766, -0.051097869873046875, -0.049161434173583984, -0.047224998474121094, -0.0452885627746582, -0.04335212707519531, -0.04141569137573242, -0.03947925567626953, -0.03754281997680664, -0.03560638427734375, -0.03366994857788086, -0.03173351287841797, -0.029797077178955078, -0.027860641479492188, -0.025924205780029297, -0.023987770080566406, -0.022051334381103516, -0.020114898681640625, -0.018178462982177734, -0.016242027282714844, -0.014305591583251953, -0.012369155883789062, -0.010432720184326172, -0.008496284484863281, -0.006559848785400391, -0.0046234130859375, -0.0026869773864746094, -0.0007505416870117188, 0.0011858940124511719, 0.0031223297119140625, 0.005058765411376953, 0.006995201110839844, 0.008931636810302734, 0.010868072509765625, 0.012804508209228516, 0.014740943908691406, 0.016677379608154297, 0.018613815307617188, 0.020550251007080078, 0.02248668670654297, 0.02442312240600586, 0.02635955810546875, 0.02829599380493164, 0.03023242950439453, 0.03216886520385742, 0.03410530090332031, 0.0360417366027832, 0.037978172302246094, 0.039914608001708984, 0.041851043701171875, 0.043787479400634766, 0.045723915100097656, 0.04766035079956055, 0.04959678649902344, 0.05153322219848633, 0.05346965789794922, 0.05540609359741211, 0.057342529296875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 9.0, 14.0, 12.0, 22.0, 29.0, 28.0, 35.0, 25.0, 47.0, 41.0, 58.0, 66.0, 77.0, 61.0, 76.0, 62.0, 69.0, 60.0, 46.0, 29.0, 24.0, 28.0, 14.0, 8.0, 9.0, 8.0, 8.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07232666015625, -0.06984901428222656, -0.06737136840820312, -0.06489372253417969, -0.06241607666015625, -0.05993843078613281, -0.057460784912109375, -0.05498313903808594, -0.0525054931640625, -0.05002784729003906, -0.047550201416015625, -0.04507255554199219, -0.04259490966796875, -0.04011726379394531, -0.037639617919921875, -0.03516197204589844, -0.032684326171875, -0.030206680297851562, -0.027729034423828125, -0.025251388549804688, -0.02277374267578125, -0.020296096801757812, -0.017818450927734375, -0.015340805053710938, -0.0128631591796875, -0.010385513305664062, -0.007907867431640625, -0.0054302215576171875, -0.00295257568359375, -0.0004749298095703125, 0.002002716064453125, 0.0044803619384765625, 0.0069580078125, 0.009435653686523438, 0.011913299560546875, 0.014390945434570312, 0.01686859130859375, 0.019346237182617188, 0.021823883056640625, 0.024301528930664062, 0.0267791748046875, 0.029256820678710938, 0.031734466552734375, 0.03421211242675781, 0.03668975830078125, 0.03916740417480469, 0.041645050048828125, 0.04412269592285156, 0.046600341796875, 0.04907798767089844, 0.051555633544921875, 0.05403327941894531, 0.05651092529296875, 0.05898857116699219, 0.061466217041015625, 0.06394386291503906, 0.0664215087890625, 0.06889915466308594, 0.07137680053710938, 0.07385444641113281, 0.07633209228515625, 0.07880973815917969, 0.08128738403320312, 0.08376502990722656, 0.08624267578125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 10.0, 15.0, 32.0, 67.0, 73.0, 108.0, 119.0, 150.0, 123.0, 103.0, 73.0, 42.0, 31.0, 19.0, 10.0, 7.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8345469236373901, -0.7884669899940491, -0.742387056350708, -0.6963070631027222, -0.6502271890640259, -0.60414719581604, -0.558067262172699, -0.5119873285293579, -0.46590739488601685, -0.4198274612426758, -0.3737475275993347, -0.32766756415367126, -0.2815876305103302, -0.23550769686698914, -0.18942773342132568, -0.14334779977798462, -0.09726786613464355, -0.05118792504072189, -0.005107983946800232, 0.040971964597702026, 0.08705189824104309, 0.13313183188438416, 0.1792117953300476, 0.22529172897338867, 0.27137166261672974, 0.3174515962600708, 0.36353152990341187, 0.4096114933490753, 0.4556914269924164, 0.5017713308334351, 0.5478513240814209, 0.593931257724762, 0.6400113105773926, 0.6860912442207336, 0.7321711778640747, 0.7782511711120605, 0.8243310451507568, 0.8704110383987427, 0.9164909720420837, 0.9625709056854248, 1.008650779724121, 1.054730772972107, 1.1008106470108032, 1.146890640258789, 1.1929705142974854, 1.2390505075454712, 1.285130500793457, 1.3312103748321533, 1.3772903680801392, 1.423370361328125, 1.4694502353668213, 1.5155302286148071, 1.5616101026535034, 1.6076900959014893, 1.6537699699401855, 1.6998499631881714, 1.7459299564361572, 1.792009949684143, 1.8380898237228394, 1.8841698169708252, 1.9302496910095215, 1.9763296842575073, 2.022409677505493, 2.0684895515441895, 2.1145694255828857]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 5.0, 6.0, 1.0, 4.0, 6.0, 5.0, 12.0, 9.0, 12.0, 9.0, 8.0, 13.0, 22.0, 18.0, 20.0, 21.0, 17.0, 27.0, 29.0, 28.0, 34.0, 45.0, 35.0, 41.0, 41.0, 46.0, 38.0, 41.0, 48.0, 34.0, 30.0, 34.0, 34.0, 30.0, 30.0, 37.0, 21.0, 25.0, 22.0, 10.0, 9.0, 8.0, 11.0, 4.0, 12.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6399747729301453, -0.6183943748474121, -0.5968139171600342, -0.575233519077301, -0.5536531209945679, -0.5320726633071899, -0.5104922652244568, -0.48891183733940125, -0.4673314094543457, -0.44575098156929016, -0.424170583486557, -0.40259015560150146, -0.3810097277164459, -0.3594292998313904, -0.3378489017486572, -0.3162684738636017, -0.29468807578086853, -0.273107647895813, -0.25152724981307983, -0.2299468219280243, -0.20836639404296875, -0.1867859810590744, -0.16520556807518005, -0.1436251401901245, -0.12204472720623016, -0.10046430677175522, -0.07888388633728027, -0.057303473353385925, -0.03572305291891098, -0.014142632484436035, 0.007437780499458313, 0.029018208384513855, 0.0505986213684082, 0.07217904180288315, 0.0937594622373581, 0.11533987522125244, 0.13692030310630798, 0.15850071609020233, 0.18008112907409668, 0.20166155695915222, 0.22324196994304657, 0.24482238292694092, 0.26640281081199646, 0.287983238697052, 0.30956363677978516, 0.3311440646648407, 0.35272449254989624, 0.3743048906326294, 0.39588531851768494, 0.4174657464027405, 0.43904614448547363, 0.4606265723705292, 0.4822070002555847, 0.5037873983383179, 0.5253678560256958, 0.546948254108429, 0.5685286521911621, 0.5901090502738953, 0.6116895079612732, 0.6332699060440063, 0.6548503041267395, 0.6764307618141174, 0.6980111598968506, 0.7195916175842285, 0.7411720156669617]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 11.0, 7.0, 14.0, 20.0, 35.0, 40.0, 66.0, 94.0, 138.0, 212.0, 328.0, 554.0, 914.0, 1537.0, 2724.0, 5116.0, 10483.0, 24154.0, 67621.0, 240049.0, 914862.0, 1824662.0, 791967.0, 207923.0, 59290.0, 21552.0, 9402.0, 4640.0, 2364.0, 1308.0, 820.0, 463.0, 321.0, 198.0, 134.0, 84.0, 60.0, 36.0, 25.0, 18.0, 15.0, 6.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13427734375, -0.12955665588378906, -0.12483596801757812, -0.12011528015136719, -0.11539459228515625, -0.11067390441894531, -0.10595321655273438, -0.10123252868652344, -0.0965118408203125, -0.09179115295410156, -0.08707046508789062, -0.08234977722167969, -0.07762908935546875, -0.07290840148925781, -0.06818771362304688, -0.06346702575683594, -0.058746337890625, -0.05402565002441406, -0.049304962158203125, -0.04458427429199219, -0.03986358642578125, -0.03514289855957031, -0.030422210693359375, -0.025701522827148438, -0.0209808349609375, -0.016260147094726562, -0.011539459228515625, -0.0068187713623046875, -0.00209808349609375, 0.0026226043701171875, 0.007343292236328125, 0.012063980102539062, 0.01678466796875, 0.021505355834960938, 0.026226043701171875, 0.030946731567382812, 0.03566741943359375, 0.04038810729980469, 0.045108795166015625, 0.04982948303222656, 0.0545501708984375, 0.05927085876464844, 0.06399154663085938, 0.06871223449707031, 0.07343292236328125, 0.07815361022949219, 0.08287429809570312, 0.08759498596191406, 0.092315673828125, 0.09703636169433594, 0.10175704956054688, 0.10647773742675781, 0.11119842529296875, 0.11591911315917969, 0.12063980102539062, 0.12536048889160156, 0.1300811767578125, 0.13480186462402344, 0.13952255249023438, 0.1442432403564453, 0.14896392822265625, 0.1536846160888672, 0.15840530395507812, 0.16312599182128906, 0.1678466796875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 9.0, 11.0, 19.0, 8.0, 15.0, 11.0, 26.0, 24.0, 25.0, 34.0, 28.0, 28.0, 43.0, 32.0, 31.0, 34.0, 39.0, 50.0, 28.0, 36.0, 44.0, 43.0, 43.0, 34.0, 37.0, 33.0, 32.0, 21.0, 27.0, 19.0, 10.0, 22.0, 16.0, 15.0, 13.0, 7.0, 6.0, 7.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09521484375, -0.0922555923461914, -0.08929634094238281, -0.08633708953857422, -0.08337783813476562, -0.08041858673095703, -0.07745933532714844, -0.07450008392333984, -0.07154083251953125, -0.06858158111572266, -0.06562232971191406, -0.06266307830810547, -0.059703826904296875, -0.05674457550048828, -0.05378532409667969, -0.050826072692871094, -0.0478668212890625, -0.044907569885253906, -0.04194831848144531, -0.03898906707763672, -0.036029815673828125, -0.03307056427001953, -0.030111312866210938, -0.027152061462402344, -0.02419281005859375, -0.021233558654785156, -0.018274307250976562, -0.015315055847167969, -0.012355804443359375, -0.009396553039550781, -0.0064373016357421875, -0.0034780502319335938, -0.000518798828125, 0.0024404525756835938, 0.0053997039794921875, 0.008358955383300781, 0.011318206787109375, 0.014277458190917969, 0.017236709594726562, 0.020195960998535156, 0.02315521240234375, 0.026114463806152344, 0.029073715209960938, 0.03203296661376953, 0.034992218017578125, 0.03795146942138672, 0.04091072082519531, 0.043869972229003906, 0.0468292236328125, 0.049788475036621094, 0.05274772644042969, 0.05570697784423828, 0.058666229248046875, 0.06162548065185547, 0.06458473205566406, 0.06754398345947266, 0.07050323486328125, 0.07346248626708984, 0.07642173767089844, 0.07938098907470703, 0.08234024047851562, 0.08529949188232422, 0.08825874328613281, 0.0912179946899414, 0.09417724609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 6.0, 0.0, 7.0, 2.0, 12.0, 14.0, 17.0, 25.0, 30.0, 52.0, 57.0, 74.0, 101.0, 152.0, 218.0, 332.0, 470.0, 719.0, 1187.0, 1825.0, 3153.0, 5974.0, 11895.0, 26458.0, 69777.0, 235859.0, 1157529.0, 2061672.0, 431866.0, 111506.0, 38481.0, 16388.0, 7781.0, 4170.0, 2339.0, 1398.0, 889.0, 575.0, 384.0, 241.0, 169.0, 127.0, 86.0, 77.0, 59.0, 37.0, 24.0, 18.0, 15.0, 16.0, 7.0, 10.0, 4.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.168212890625, -0.16282272338867188, -0.15743255615234375, -0.15204238891601562, -0.1466522216796875, -0.14126205444335938, -0.13587188720703125, -0.13048171997070312, -0.125091552734375, -0.11970138549804688, -0.11431121826171875, -0.10892105102539062, -0.1035308837890625, -0.09814071655273438, -0.09275054931640625, -0.08736038208007812, -0.08197021484375, -0.07658004760742188, -0.07118988037109375, -0.06579971313476562, -0.0604095458984375, -0.055019378662109375, -0.04962921142578125, -0.044239044189453125, -0.038848876953125, -0.033458709716796875, -0.02806854248046875, -0.022678375244140625, -0.0172882080078125, -0.011898040771484375, -0.00650787353515625, -0.001117706298828125, 0.0042724609375, 0.009662628173828125, 0.01505279541015625, 0.020442962646484375, 0.0258331298828125, 0.031223297119140625, 0.03661346435546875, 0.042003631591796875, 0.047393798828125, 0.052783966064453125, 0.05817413330078125, 0.06356430053710938, 0.0689544677734375, 0.07434463500976562, 0.07973480224609375, 0.08512496948242188, 0.09051513671875, 0.09590530395507812, 0.10129547119140625, 0.10668563842773438, 0.1120758056640625, 0.11746597290039062, 0.12285614013671875, 0.12824630737304688, 0.133636474609375, 0.13902664184570312, 0.14441680908203125, 0.14980697631835938, 0.1551971435546875, 0.16058731079101562, 0.16597747802734375, 0.17136764526367188, 0.1767578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 8.0, 12.0, 3.0, 12.0, 8.0, 19.0, 16.0, 31.0, 35.0, 47.0, 73.0, 93.0, 123.0, 164.0, 252.0, 337.0, 543.0, 651.0, 495.0, 363.0, 207.0, 173.0, 111.0, 74.0, 58.0, 52.0, 27.0, 22.0, 12.0, 14.0, 7.0, 8.0, 6.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1810302734375, -0.17464256286621094, -0.16825485229492188, -0.1618671417236328, -0.15547943115234375, -0.1490917205810547, -0.14270401000976562, -0.13631629943847656, -0.1299285888671875, -0.12354087829589844, -0.11715316772460938, -0.11076545715332031, -0.10437774658203125, -0.09799003601074219, -0.09160232543945312, -0.08521461486816406, -0.078826904296875, -0.07243919372558594, -0.06605148315429688, -0.05966377258300781, -0.05327606201171875, -0.04688835144042969, -0.040500640869140625, -0.03411293029785156, -0.0277252197265625, -0.021337509155273438, -0.014949798583984375, -0.008562088012695312, -0.00217437744140625, 0.0042133331298828125, 0.010601043701171875, 0.016988754272460938, 0.02337646484375, 0.029764175415039062, 0.036151885986328125, 0.04253959655761719, 0.04892730712890625, 0.05531501770019531, 0.061702728271484375, 0.06809043884277344, 0.0744781494140625, 0.08086585998535156, 0.08725357055664062, 0.09364128112792969, 0.10002899169921875, 0.10641670227050781, 0.11280441284179688, 0.11919212341308594, 0.125579833984375, 0.13196754455566406, 0.13835525512695312, 0.1447429656982422, 0.15113067626953125, 0.1575183868408203, 0.16390609741210938, 0.17029380798339844, 0.1766815185546875, 0.18306922912597656, 0.18945693969726562, 0.1958446502685547, 0.20223236083984375, 0.2086200714111328, 0.21500778198242188, 0.22139549255371094, 0.227783203125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 4.0, 10.0, 12.0, 21.0, 23.0, 49.0, 67.0, 105.0, 108.0, 118.0, 130.0, 104.0, 84.0, 61.0, 32.0, 33.0, 11.0, 7.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0017781257629395, -1.9552096128463745, -1.90864098072052, -1.862072467803955, -1.8155038356781006, -1.7689353227615356, -1.7223668098449707, -1.6757981777191162, -1.6292295455932617, -1.5826610326766968, -1.5360924005508423, -1.4895238876342773, -1.4429552555084229, -1.396386742591858, -1.349818229675293, -1.3032495975494385, -1.2566810846328735, -1.2101125717163086, -1.163543939590454, -1.1169754266738892, -1.0704067945480347, -1.0238382816314697, -0.97726970911026, -0.9307011365890503, -0.8841325640678406, -0.8375639915466309, -0.7909954190254211, -0.7444268465042114, -0.6978583335876465, -0.651289701461792, -0.604721188545227, -0.5581526160240173, -0.5115839242935181, -0.46501535177230835, -0.41844677925109863, -0.3718782365322113, -0.3253096640110016, -0.27874109148979187, -0.23217254877090454, -0.18560397624969482, -0.1390354037284851, -0.09246683865785599, -0.04589827358722687, 0.0006702840328216553, 0.04723885655403137, 0.09380742907524109, 0.14037597179412842, 0.18694454431533813, 0.23351311683654785, 0.28008168935775757, 0.3266502618789673, 0.3732188045978546, 0.41978737711906433, 0.46635594964027405, 0.5129244923591614, 0.5594930648803711, 0.6060616374015808, 0.6526302099227905, 0.6991987824440002, 0.74576735496521, 0.7923358678817749, 0.8389045000076294, 0.8854730129241943, 0.932041585445404, 0.9786101579666138]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 5.0, 10.0, 13.0, 1.0, 19.0, 20.0, 17.0, 16.0, 31.0, 26.0, 23.0, 28.0, 47.0, 48.0, 25.0, 54.0, 54.0, 58.0, 42.0, 44.0, 50.0, 53.0, 31.0, 35.0, 38.0, 37.0, 27.0, 28.0, 23.0, 22.0, 11.0, 9.0, 11.0, 6.0, 7.0, 3.0, 9.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.7122649550437927, -0.6911649107933044, -0.6700649261474609, -0.6489648818969727, -0.6278648376464844, -0.6067648530006409, -0.5856648087501526, -0.5645648241043091, -0.5434647798538208, -0.5223647356033325, -0.501264750957489, -0.48016470670700073, -0.45906469225883484, -0.43796467781066895, -0.41686463356018066, -0.39576461911201477, -0.3746645748615265, -0.3535645604133606, -0.3324645161628723, -0.3113645017147064, -0.2902644872665405, -0.26916444301605225, -0.24806442856788635, -0.22696441411972046, -0.20586438477039337, -0.18476435542106628, -0.1636643409729004, -0.1425643116235733, -0.12146428972482681, -0.10036426782608032, -0.07926423847675323, -0.05816422402858734, -0.037064194679260254, -0.015964170917868614, 0.0051358528435230255, 0.026235878467559814, 0.047335900366306305, 0.0684359222650528, 0.08953595161437988, 0.11063596606254578, 0.13173599541187286, 0.15283602476119995, 0.17393603920936584, 0.19503606855869293, 0.21613609790802002, 0.2372361123561859, 0.2583361268043518, 0.2794361710548401, 0.300536185503006, 0.3216361999511719, 0.34273624420166016, 0.36383625864982605, 0.38493627309799194, 0.4060363173484802, 0.4271363317966461, 0.448236346244812, 0.4693363904953003, 0.4904364049434662, 0.5115364193916321, 0.5326364636421204, 0.5537365078926086, 0.5748364925384521, 0.5959365367889404, 0.6170365810394287, 0.6381365656852722]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 11.0, 10.0, 24.0, 28.0, 37.0, 68.0, 100.0, 147.0, 290.0, 516.0, 895.0, 1654.0, 3606.0, 7611.0, 17217.0, 41435.0, 98245.0, 202637.0, 286987.0, 209409.0, 101650.0, 42702.0, 17991.0, 7752.0, 3597.0, 1752.0, 908.0, 497.0, 294.0, 175.0, 117.0, 57.0, 44.0, 25.0, 23.0, 15.0, 9.0, 7.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1348876953125, -0.13046836853027344, -0.12604904174804688, -0.12162971496582031, -0.11721038818359375, -0.11279106140136719, -0.10837173461914062, -0.10395240783691406, -0.0995330810546875, -0.09511375427246094, -0.09069442749023438, -0.08627510070800781, -0.08185577392578125, -0.07743644714355469, -0.07301712036132812, -0.06859779357910156, -0.064178466796875, -0.05975914001464844, -0.055339813232421875, -0.05092048645019531, -0.04650115966796875, -0.04208183288574219, -0.037662506103515625, -0.03324317932128906, -0.0288238525390625, -0.024404525756835938, -0.019985198974609375, -0.015565872192382812, -0.01114654541015625, -0.0067272186279296875, -0.002307891845703125, 0.0021114349365234375, 0.00653076171875, 0.010950088500976562, 0.015369415283203125, 0.019788742065429688, 0.02420806884765625, 0.028627395629882812, 0.033046722412109375, 0.03746604919433594, 0.0418853759765625, 0.04630470275878906, 0.050724029541015625, 0.05514335632324219, 0.05956268310546875, 0.06398200988769531, 0.06840133666992188, 0.07282066345214844, 0.077239990234375, 0.08165931701660156, 0.08607864379882812, 0.09049797058105469, 0.09491729736328125, 0.09933662414550781, 0.10375595092773438, 0.10817527770996094, 0.1125946044921875, 0.11701393127441406, 0.12143325805664062, 0.1258525848388672, 0.13027191162109375, 0.1346912384033203, 0.13911056518554688, 0.14352989196777344, 0.14794921875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 3.0, 5.0, 6.0, 6.0, 9.0, 16.0, 10.0, 17.0, 15.0, 32.0, 30.0, 33.0, 31.0, 42.0, 29.0, 31.0, 45.0, 39.0, 51.0, 44.0, 47.0, 52.0, 40.0, 39.0, 49.0, 40.0, 26.0, 31.0, 35.0, 16.0, 27.0, 11.0, 18.0, 10.0, 16.0, 16.0, 6.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10491943359375, -0.10126972198486328, -0.09762001037597656, -0.09397029876708984, -0.09032058715820312, -0.0866708755493164, -0.08302116394042969, -0.07937145233154297, -0.07572174072265625, -0.07207202911376953, -0.06842231750488281, -0.0647726058959961, -0.061122894287109375, -0.057473182678222656, -0.05382347106933594, -0.05017375946044922, -0.0465240478515625, -0.04287433624267578, -0.03922462463378906, -0.035574913024902344, -0.031925201416015625, -0.028275489807128906, -0.024625778198242188, -0.02097606658935547, -0.01732635498046875, -0.013676643371582031, -0.010026931762695312, -0.006377220153808594, -0.002727508544921875, 0.0009222030639648438, 0.0045719146728515625, 0.008221626281738281, 0.011871337890625, 0.015521049499511719, 0.019170761108398438, 0.022820472717285156, 0.026470184326171875, 0.030119895935058594, 0.03376960754394531, 0.03741931915283203, 0.04106903076171875, 0.04471874237060547, 0.04836845397949219, 0.052018165588378906, 0.055667877197265625, 0.059317588806152344, 0.06296730041503906, 0.06661701202392578, 0.0702667236328125, 0.07391643524169922, 0.07756614685058594, 0.08121585845947266, 0.08486557006835938, 0.0885152816772461, 0.09216499328613281, 0.09581470489501953, 0.09946441650390625, 0.10311412811279297, 0.10676383972167969, 0.1104135513305664, 0.11406326293945312, 0.11771297454833984, 0.12136268615722656, 0.12501239776611328, 0.128662109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 8.0, 25.0, 24.0, 42.0, 59.0, 110.0, 152.0, 237.0, 379.0, 686.0, 1127.0, 2047.0, 3829.0, 7533.0, 15084.0, 30591.0, 62301.0, 120900.0, 205762.0, 263726.0, 160844.0, 86641.0, 43366.0, 20908.0, 10257.0, 5391.0, 2902.0, 1487.0, 806.0, 487.0, 306.0, 194.0, 123.0, 74.0, 47.0, 38.0, 21.0, 11.0, 10.0, 1.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1173095703125, -0.11407279968261719, -0.11083602905273438, -0.10759925842285156, -0.10436248779296875, -0.10112571716308594, -0.09788894653320312, -0.09465217590332031, -0.0914154052734375, -0.08817863464355469, -0.08494186401367188, -0.08170509338378906, -0.07846832275390625, -0.07523155212402344, -0.07199478149414062, -0.06875801086425781, -0.065521240234375, -0.06228446960449219, -0.059047698974609375, -0.05581092834472656, -0.05257415771484375, -0.04933738708496094, -0.046100616455078125, -0.04286384582519531, -0.0396270751953125, -0.03639030456542969, -0.033153533935546875, -0.029916763305664062, -0.02667999267578125, -0.023443222045898438, -0.020206451416015625, -0.016969680786132812, -0.01373291015625, -0.010496139526367188, -0.007259368896484375, -0.0040225982666015625, -0.00078582763671875, 0.0024509429931640625, 0.005687713623046875, 0.008924484252929688, 0.0121612548828125, 0.015398025512695312, 0.018634796142578125, 0.021871566772460938, 0.02510833740234375, 0.028345108032226562, 0.031581878662109375, 0.03481864929199219, 0.038055419921875, 0.04129219055175781, 0.044528961181640625, 0.04776573181152344, 0.05100250244140625, 0.05423927307128906, 0.057476043701171875, 0.06071281433105469, 0.0639495849609375, 0.06718635559082031, 0.07042312622070312, 0.07365989685058594, 0.07689666748046875, 0.08013343811035156, 0.08337020874023438, 0.08660697937011719, 0.08984375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 8.0, 1.0, 5.0, 7.0, 16.0, 5.0, 6.0, 5.0, 11.0, 16.0, 26.0, 18.0, 16.0, 26.0, 26.0, 28.0, 22.0, 32.0, 30.0, 37.0, 34.0, 42.0, 54.0, 28.0, 37.0, 43.0, 48.0, 43.0, 26.0, 32.0, 27.0, 23.0, 29.0, 25.0, 31.0, 21.0, 15.0, 22.0, 8.0, 11.0, 9.0, 10.0, 9.0, 4.0, 10.0, 4.0, 4.0, 4.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.260498046875, -0.2522697448730469, -0.24404144287109375, -0.23581314086914062, -0.2275848388671875, -0.21935653686523438, -0.21112823486328125, -0.20289993286132812, -0.194671630859375, -0.18644332885742188, -0.17821502685546875, -0.16998672485351562, -0.1617584228515625, -0.15353012084960938, -0.14530181884765625, -0.13707351684570312, -0.12884521484375, -0.12061691284179688, -0.11238861083984375, -0.10416030883789062, -0.0959320068359375, -0.08770370483398438, -0.07947540283203125, -0.07124710083007812, -0.063018798828125, -0.054790496826171875, -0.04656219482421875, -0.038333892822265625, -0.0301055908203125, -0.021877288818359375, -0.01364898681640625, -0.005420684814453125, 0.0028076171875, 0.011035919189453125, 0.01926422119140625, 0.027492523193359375, 0.0357208251953125, 0.043949127197265625, 0.05217742919921875, 0.060405731201171875, 0.068634033203125, 0.07686233520507812, 0.08509063720703125, 0.09331893920898438, 0.1015472412109375, 0.10977554321289062, 0.11800384521484375, 0.12623214721679688, 0.13446044921875, 0.14268875122070312, 0.15091705322265625, 0.15914535522460938, 0.1673736572265625, 0.17560195922851562, 0.18383026123046875, 0.19205856323242188, 0.200286865234375, 0.20851516723632812, 0.21674346923828125, 0.22497177124023438, 0.2332000732421875, 0.24142837524414062, 0.24965667724609375, 0.2578849792480469, 0.26611328125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 6.0, 9.0, 3.0, 15.0, 12.0, 20.0, 26.0, 49.0, 53.0, 80.0, 111.0, 146.0, 209.0, 278.0, 431.0, 728.0, 1189.0, 1981.0, 3625.0, 7137.0, 14941.0, 34277.0, 82514.0, 191271.0, 339595.0, 207908.0, 90696.0, 37600.0, 16296.0, 7789.0, 3897.0, 2161.0, 1214.0, 768.0, 430.0, 307.0, 194.0, 165.0, 122.0, 84.0, 80.0, 38.0, 30.0, 22.0, 14.0, 13.0, 5.0, 5.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.035675048828125, -0.03454446792602539, -0.03341388702392578, -0.03228330612182617, -0.031152725219726562, -0.030022144317626953, -0.028891563415527344, -0.027760982513427734, -0.026630401611328125, -0.025499820709228516, -0.024369239807128906, -0.023238658905029297, -0.022108078002929688, -0.020977497100830078, -0.01984691619873047, -0.01871633529663086, -0.01758575439453125, -0.01645517349243164, -0.015324592590332031, -0.014194011688232422, -0.013063430786132812, -0.011932849884033203, -0.010802268981933594, -0.009671688079833984, -0.008541107177734375, -0.007410526275634766, -0.006279945373535156, -0.005149364471435547, -0.0040187835693359375, -0.002888202667236328, -0.0017576217651367188, -0.0006270408630371094, 0.0005035400390625, 0.0016341209411621094, 0.0027647018432617188, 0.003895282745361328, 0.0050258636474609375, 0.006156444549560547, 0.007287025451660156, 0.008417606353759766, 0.009548187255859375, 0.010678768157958984, 0.011809349060058594, 0.012939929962158203, 0.014070510864257812, 0.015201091766357422, 0.01633167266845703, 0.01746225357055664, 0.01859283447265625, 0.01972341537475586, 0.02085399627685547, 0.021984577178955078, 0.023115158081054688, 0.024245738983154297, 0.025376319885253906, 0.026506900787353516, 0.027637481689453125, 0.028768062591552734, 0.029898643493652344, 0.031029224395751953, 0.03215980529785156, 0.03329038619995117, 0.03442096710205078, 0.03555154800415039, 0.03668212890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 7.0, 9.0, 5.0, 7.0, 6.0, 8.0, 16.0, 16.0, 32.0, 38.0, 42.0, 65.0, 70.0, 95.0, 76.0, 80.0, 86.0, 68.0, 63.0, 50.0, 32.0, 40.0, 26.0, 14.0, 9.0, 11.0, 9.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7821788787841797e-05, -1.7262063920497894e-05, -1.6702339053153992e-05, -1.614261418581009e-05, -1.5582889318466187e-05, -1.5023164451122284e-05, -1.4463439583778381e-05, -1.3903714716434479e-05, -1.3343989849090576e-05, -1.2784264981746674e-05, -1.2224540114402771e-05, -1.1664815247058868e-05, -1.1105090379714966e-05, -1.0545365512371063e-05, -9.98564064502716e-06, -9.425915777683258e-06, -8.866190910339355e-06, -8.306466042995453e-06, -7.74674117565155e-06, -7.187016308307648e-06, -6.627291440963745e-06, -6.0675665736198425e-06, -5.50784170627594e-06, -4.948116838932037e-06, -4.388391971588135e-06, -3.828667104244232e-06, -3.2689422369003296e-06, -2.709217369556427e-06, -2.1494925022125244e-06, -1.5897676348686218e-06, -1.0300427675247192e-06, -4.7031790018081665e-07, 8.940696716308594e-08, 6.491318345069885e-07, 1.2088567018508911e-06, 1.7685815691947937e-06, 2.3283064365386963e-06, 2.888031303882599e-06, 3.4477561712265015e-06, 4.007481038570404e-06, 4.567205905914307e-06, 5.126930773258209e-06, 5.686655640602112e-06, 6.246380507946014e-06, 6.806105375289917e-06, 7.36583024263382e-06, 7.925555109977722e-06, 8.485279977321625e-06, 9.045004844665527e-06, 9.60472971200943e-06, 1.0164454579353333e-05, 1.0724179446697235e-05, 1.1283904314041138e-05, 1.184362918138504e-05, 1.2403354048728943e-05, 1.2963078916072845e-05, 1.3522803783416748e-05, 1.408252865076065e-05, 1.4642253518104553e-05, 1.5201978385448456e-05, 1.576170325279236e-05, 1.632142812013626e-05, 1.6881152987480164e-05, 1.7440877854824066e-05, 1.800060272216797e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 10.0, 13.0, 14.0, 35.0, 40.0, 82.0, 113.0, 187.0, 341.0, 647.0, 1153.0, 2193.0, 4365.0, 8713.0, 19109.0, 41604.0, 90683.0, 185693.0, 312646.0, 198257.0, 97449.0, 44952.0, 20736.0, 9665.0, 4683.0, 2349.0, 1217.0, 692.0, 387.0, 197.0, 123.0, 65.0, 53.0, 30.0, 22.0, 15.0, 8.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040985107421875, -0.03986382484436035, -0.0387425422668457, -0.037621259689331055, -0.036499977111816406, -0.03537869453430176, -0.03425741195678711, -0.03313612937927246, -0.03201484680175781, -0.030893564224243164, -0.029772281646728516, -0.028650999069213867, -0.02752971649169922, -0.02640843391418457, -0.025287151336669922, -0.024165868759155273, -0.023044586181640625, -0.021923303604125977, -0.020802021026611328, -0.01968073844909668, -0.01855945587158203, -0.017438173294067383, -0.016316890716552734, -0.015195608139038086, -0.014074325561523438, -0.012953042984008789, -0.01183176040649414, -0.010710477828979492, -0.009589195251464844, -0.008467912673950195, -0.007346630096435547, -0.0062253475189208984, -0.00510406494140625, -0.0039827823638916016, -0.002861499786376953, -0.0017402172088623047, -0.0006189346313476562, 0.0005023479461669922, 0.0016236305236816406, 0.002744913101196289, 0.0038661956787109375, 0.004987478256225586, 0.006108760833740234, 0.007230043411254883, 0.008351325988769531, 0.00947260856628418, 0.010593891143798828, 0.011715173721313477, 0.012836456298828125, 0.013957738876342773, 0.015079021453857422, 0.01620030403137207, 0.01732158660888672, 0.018442869186401367, 0.019564151763916016, 0.020685434341430664, 0.021806716918945312, 0.02292799949645996, 0.02404928207397461, 0.025170564651489258, 0.026291847229003906, 0.027413129806518555, 0.028534412384033203, 0.02965569496154785, 0.0307769775390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 4.0, 12.0, 6.0, 15.0, 18.0, 18.0, 38.0, 40.0, 44.0, 67.0, 93.0, 95.0, 85.0, 91.0, 87.0, 54.0, 37.0, 50.0, 35.0, 26.0, 12.0, 14.0, 8.0, 9.0, 3.0, 1.0, 9.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.056671142578125, -0.05480146408081055, -0.052931785583496094, -0.05106210708618164, -0.04919242858886719, -0.047322750091552734, -0.04545307159423828, -0.04358339309692383, -0.041713714599609375, -0.03984403610229492, -0.03797435760498047, -0.036104679107666016, -0.03423500061035156, -0.03236532211303711, -0.030495643615722656, -0.028625965118408203, -0.02675628662109375, -0.024886608123779297, -0.023016929626464844, -0.02114725112915039, -0.019277572631835938, -0.017407894134521484, -0.015538215637207031, -0.013668537139892578, -0.011798858642578125, -0.009929180145263672, -0.008059501647949219, -0.006189823150634766, -0.0043201446533203125, -0.0024504661560058594, -0.0005807876586914062, 0.0012888908386230469, 0.0031585693359375, 0.005028247833251953, 0.006897926330566406, 0.00876760482788086, 0.010637283325195312, 0.012506961822509766, 0.014376640319824219, 0.016246318817138672, 0.018115997314453125, 0.019985675811767578, 0.02185535430908203, 0.023725032806396484, 0.025594711303710938, 0.02746438980102539, 0.029334068298339844, 0.031203746795654297, 0.03307342529296875, 0.0349431037902832, 0.036812782287597656, 0.03868246078491211, 0.04055213928222656, 0.042421817779541016, 0.04429149627685547, 0.04616117477416992, 0.048030853271484375, 0.04990053176879883, 0.05177021026611328, 0.053639888763427734, 0.05550956726074219, 0.05737924575805664, 0.059248924255371094, 0.06111860275268555, 0.06298828125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 10.0, 16.0, 44.0, 83.0, 107.0, 159.0, 185.0, 161.0, 99.0, 63.0, 39.0, 15.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9325789213180542, -1.8860880136489868, -1.8395971059799194, -1.7931063175201416, -1.7466154098510742, -1.7001245021820068, -1.6536335945129395, -1.607142686843872, -1.5606517791748047, -1.5141608715057373, -1.46766996383667, -1.4211790561676025, -1.3746882677078247, -1.3281973600387573, -1.28170645236969, -1.2352155447006226, -1.1887247562408447, -1.1422338485717773, -1.09574294090271, -1.0492520332336426, -1.0027612447738647, -0.9562703371047974, -0.90977942943573, -0.8632885217666626, -0.8167976140975952, -0.7703067064285278, -0.7238158583641052, -0.6773249506950378, -0.6308340430259705, -0.5843431949615479, -0.5378522872924805, -0.4913613796234131, -0.4448704719543457, -0.3983795940876007, -0.3518886864185333, -0.30539780855178833, -0.25890690088272095, -0.21241602301597595, -0.16592514514923096, -0.11943423748016357, -0.07294335961341858, -0.02645247057080269, 0.020038418471813202, 0.0665293037891388, 0.11302019655704498, 0.15951108932495117, 0.20600196719169617, 0.25249287486076355, 0.29898375272750854, 0.34547463059425354, 0.3919655382633209, 0.4384564161300659, 0.4849473237991333, 0.5314382314682007, 0.5779290795326233, 0.6244199872016907, 0.6709108352661133, 0.7174017429351807, 0.7638925909996033, 0.8103834986686707, 0.856874406337738, 0.9033652544021606, 0.949856162071228, 0.9963470697402954, 1.0428379774093628]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 2.0, 7.0, 3.0, 9.0, 6.0, 8.0, 17.0, 12.0, 8.0, 15.0, 30.0, 28.0, 37.0, 28.0, 29.0, 41.0, 29.0, 46.0, 43.0, 46.0, 42.0, 40.0, 37.0, 46.0, 39.0, 46.0, 36.0, 24.0, 39.0, 21.0, 27.0, 16.0, 12.0, 24.0, 28.0, 14.0, 16.0, 9.0, 8.0, 7.0, 3.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7928367853164673, -0.7700680494308472, -0.747299313545227, -0.7245305776596069, -0.7017619013786316, -0.6789931654930115, -0.6562244296073914, -0.6334556937217712, -0.6106870174407959, -0.5879182815551758, -0.5651495456695557, -0.5423808097839355, -0.5196121335029602, -0.4968433976173401, -0.47407466173171997, -0.45130592584609985, -0.42853718996047974, -0.4057684540748596, -0.3829997479915619, -0.3602310121059418, -0.33746230602264404, -0.3146935701370239, -0.2919248342514038, -0.2691560983657837, -0.24638739228248596, -0.22361867129802704, -0.20084995031356812, -0.178081214427948, -0.15531249344348907, -0.13254377245903015, -0.10977503657341003, -0.08700631558895111, -0.06423765420913696, -0.04146892949938774, -0.01870020478963852, 0.004068523645401001, 0.026837244629859924, 0.04960596561431885, 0.07237470149993896, 0.09514342248439789, 0.11791214346885681, 0.14068086445331573, 0.16344958543777466, 0.18621832132339478, 0.2089870423078537, 0.23175576329231262, 0.25452449917793274, 0.27729320526123047, 0.3000619411468506, 0.3228306770324707, 0.34559938311576843, 0.36836811900138855, 0.3911368250846863, 0.4139055609703064, 0.4366742968559265, 0.45944303274154663, 0.48221173882484436, 0.5049804449081421, 0.5277491807937622, 0.5505179166793823, 0.5732866525650024, 0.5960553884506226, 0.6188241243362427, 0.641592800617218, 0.6643615365028381]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 5.0, 11.0, 12.0, 16.0, 17.0, 34.0, 48.0, 63.0, 89.0, 143.0, 241.0, 349.0, 504.0, 830.0, 1294.0, 2256.0, 3783.0, 7175.0, 14911.0, 35200.0, 95214.0, 282952.0, 697985.0, 1120665.0, 1028335.0, 561798.0, 213215.0, 72951.0, 27707.0, 11977.0, 5911.0, 3245.0, 1935.0, 1176.0, 738.0, 467.0, 322.0, 215.0, 161.0, 100.0, 67.0, 45.0, 32.0, 27.0, 14.0, 21.0, 7.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.131591796875, -0.12770557403564453, -0.12381935119628906, -0.1199331283569336, -0.11604690551757812, -0.11216068267822266, -0.10827445983886719, -0.10438823699951172, -0.10050201416015625, -0.09661579132080078, -0.09272956848144531, -0.08884334564208984, -0.08495712280273438, -0.0810708999633789, -0.07718467712402344, -0.07329845428466797, -0.0694122314453125, -0.06552600860595703, -0.06163978576660156, -0.057753562927246094, -0.053867340087890625, -0.049981117248535156, -0.04609489440917969, -0.04220867156982422, -0.03832244873046875, -0.03443622589111328, -0.030550003051757812, -0.026663780212402344, -0.022777557373046875, -0.018891334533691406, -0.015005111694335938, -0.011118888854980469, -0.007232666015625, -0.0033464431762695312, 0.0005397796630859375, 0.004426002502441406, 0.008312225341796875, 0.012198448181152344, 0.016084671020507812, 0.01997089385986328, 0.02385711669921875, 0.02774333953857422, 0.03162956237792969, 0.035515785217285156, 0.039402008056640625, 0.043288230895996094, 0.04717445373535156, 0.05106067657470703, 0.0549468994140625, 0.05883312225341797, 0.06271934509277344, 0.0666055679321289, 0.07049179077148438, 0.07437801361083984, 0.07826423645019531, 0.08215045928955078, 0.08603668212890625, 0.08992290496826172, 0.09380912780761719, 0.09769535064697266, 0.10158157348632812, 0.1054677963256836, 0.10935401916503906, 0.11324024200439453, 0.11712646484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 2.0, 5.0, 7.0, 12.0, 12.0, 21.0, 19.0, 26.0, 31.0, 29.0, 19.0, 35.0, 26.0, 24.0, 36.0, 60.0, 40.0, 49.0, 58.0, 46.0, 51.0, 47.0, 36.0, 43.0, 34.0, 38.0, 27.0, 18.0, 32.0, 32.0, 14.0, 21.0, 15.0, 7.0, 12.0, 2.0, 6.0, 4.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10711669921875, -0.10350608825683594, -0.09989547729492188, -0.09628486633300781, -0.09267425537109375, -0.08906364440917969, -0.08545303344726562, -0.08184242248535156, -0.0782318115234375, -0.07462120056152344, -0.07101058959960938, -0.06739997863769531, -0.06378936767578125, -0.06017875671386719, -0.056568145751953125, -0.05295753479003906, -0.049346923828125, -0.04573631286621094, -0.042125701904296875, -0.03851509094238281, -0.03490447998046875, -0.03129386901855469, -0.027683258056640625, -0.024072647094726562, -0.0204620361328125, -0.016851425170898438, -0.013240814208984375, -0.009630203247070312, -0.00601959228515625, -0.0024089813232421875, 0.001201629638671875, 0.0048122406005859375, 0.0084228515625, 0.012033462524414062, 0.015644073486328125, 0.019254684448242188, 0.02286529541015625, 0.026475906372070312, 0.030086517333984375, 0.03369712829589844, 0.0373077392578125, 0.04091835021972656, 0.044528961181640625, 0.04813957214355469, 0.05175018310546875, 0.05536079406738281, 0.058971405029296875, 0.06258201599121094, 0.066192626953125, 0.06980323791503906, 0.07341384887695312, 0.07702445983886719, 0.08063507080078125, 0.08424568176269531, 0.08785629272460938, 0.09146690368652344, 0.0950775146484375, 0.09868812561035156, 0.10229873657226562, 0.10590934753417969, 0.10951995849609375, 0.11313056945800781, 0.11674118041992188, 0.12035179138183594, 0.12396240234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 11.0, 11.0, 14.0, 28.0, 28.0, 48.0, 75.0, 126.0, 223.0, 342.0, 617.0, 1215.0, 2603.0, 6715.0, 21980.0, 100928.0, 817952.0, 2715149.0, 438378.0, 63315.0, 15215.0, 5066.0, 2026.0, 958.0, 476.0, 282.0, 161.0, 108.0, 64.0, 49.0, 27.0, 20.0, 18.0, 7.0, 9.0, 8.0, 4.0, 8.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.260498046875, -0.25244903564453125, -0.2444000244140625, -0.23635101318359375, -0.228302001953125, -0.22025299072265625, -0.2122039794921875, -0.20415496826171875, -0.19610595703125, -0.18805694580078125, -0.1800079345703125, -0.17195892333984375, -0.163909912109375, -0.15586090087890625, -0.1478118896484375, -0.13976287841796875, -0.1317138671875, -0.12366485595703125, -0.1156158447265625, -0.10756683349609375, -0.099517822265625, -0.09146881103515625, -0.0834197998046875, -0.07537078857421875, -0.06732177734375, -0.05927276611328125, -0.0512237548828125, -0.04317474365234375, -0.035125732421875, -0.02707672119140625, -0.0190277099609375, -0.01097869873046875, -0.0029296875, 0.00511932373046875, 0.0131683349609375, 0.02121734619140625, 0.029266357421875, 0.03731536865234375, 0.0453643798828125, 0.05341339111328125, 0.06146240234375, 0.06951141357421875, 0.0775604248046875, 0.08560943603515625, 0.093658447265625, 0.10170745849609375, 0.1097564697265625, 0.11780548095703125, 0.1258544921875, 0.13390350341796875, 0.1419525146484375, 0.15000152587890625, 0.158050537109375, 0.16609954833984375, 0.1741485595703125, 0.18219757080078125, 0.19024658203125, 0.19829559326171875, 0.2063446044921875, 0.21439361572265625, 0.222442626953125, 0.23049163818359375, 0.2385406494140625, 0.24658966064453125, 0.254638671875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 10.0, 10.0, 13.0, 16.0, 18.0, 29.0, 35.0, 51.0, 79.0, 93.0, 134.0, 175.0, 241.0, 334.0, 351.0, 400.0, 387.0, 374.0, 313.0, 236.0, 208.0, 141.0, 104.0, 76.0, 63.0, 47.0, 35.0, 26.0, 14.0, 13.0, 13.0, 8.0, 8.0, 4.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.268798828125, -0.2613258361816406, -0.25385284423828125, -0.24637985229492188, -0.2389068603515625, -0.23143386840820312, -0.22396087646484375, -0.21648788452148438, -0.209014892578125, -0.20154190063476562, -0.19406890869140625, -0.18659591674804688, -0.1791229248046875, -0.17164993286132812, -0.16417694091796875, -0.15670394897460938, -0.14923095703125, -0.14175796508789062, -0.13428497314453125, -0.12681198120117188, -0.1193389892578125, -0.11186599731445312, -0.10439300537109375, -0.09692001342773438, -0.089447021484375, -0.08197402954101562, -0.07450103759765625, -0.06702804565429688, -0.0595550537109375, -0.052082061767578125, -0.04460906982421875, -0.037136077880859375, -0.0296630859375, -0.022190093994140625, -0.01471710205078125, -0.007244110107421875, 0.0002288818359375, 0.007701873779296875, 0.01517486572265625, 0.022647857666015625, 0.030120849609375, 0.037593841552734375, 0.04506683349609375, 0.052539825439453125, 0.0600128173828125, 0.06748580932617188, 0.07495880126953125, 0.08243179321289062, 0.08990478515625, 0.09737777709960938, 0.10485076904296875, 0.11232376098632812, 0.1197967529296875, 0.12726974487304688, 0.13474273681640625, 0.14221572875976562, 0.149688720703125, 0.15716171264648438, 0.16463470458984375, 0.17210769653320312, 0.1795806884765625, 0.18705368041992188, 0.19452667236328125, 0.20199966430664062, 0.20947265625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 9.0, 8.0, 21.0, 19.0, 27.0, 41.0, 54.0, 88.0, 88.0, 101.0, 105.0, 92.0, 84.0, 78.0, 36.0, 44.0, 26.0, 18.0, 17.0, 9.0, 5.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.466874122619629, -2.396544933319092, -2.3262155055999756, -2.2558860778808594, -2.1855568885803223, -2.115227699279785, -2.044898271560669, -1.9745689630508423, -1.9042396545410156, -1.833910346031189, -1.7635810375213623, -1.6932517290115356, -1.622922420501709, -1.5525931119918823, -1.4822638034820557, -1.411934494972229, -1.3416051864624023, -1.2712758779525757, -1.200946569442749, -1.1306172609329224, -1.0602879524230957, -0.989958643913269, -0.9196293354034424, -0.8493000268936157, -0.7789707183837891, -0.7086414098739624, -0.6383121013641357, -0.5679827928543091, -0.4976534843444824, -0.42732417583465576, -0.3569948673248291, -0.28666555881500244, -0.21633625030517578, -0.14600694179534912, -0.07567763328552246, -0.005348324775695801, 0.06498098373413086, 0.13531029224395752, 0.20563960075378418, 0.27596890926361084, 0.3462982177734375, 0.41662752628326416, 0.4869568347930908, 0.5572861433029175, 0.6276154518127441, 0.6979447603225708, 0.7682740688323975, 0.8386033773422241, 0.9089326858520508, 0.9792619943618774, 1.049591302871704, 1.1199206113815308, 1.1902499198913574, 1.260579228401184, 1.3309085369110107, 1.4012378454208374, 1.471567153930664, 1.5418964624404907, 1.6122257709503174, 1.682555079460144, 1.7528843879699707, 1.8232136964797974, 1.893543004989624, 1.9638723134994507, 2.0342016220092773]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 8.0, 8.0, 10.0, 11.0, 11.0, 13.0, 16.0, 17.0, 16.0, 24.0, 26.0, 31.0, 27.0, 45.0, 33.0, 36.0, 40.0, 44.0, 33.0, 36.0, 40.0, 40.0, 46.0, 48.0, 41.0, 42.0, 35.0, 26.0, 35.0, 23.0, 20.0, 16.0, 25.0, 15.0, 9.0, 11.0, 10.0, 5.0, 5.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.0696709156036377, -1.0385854244232178, -1.0074998140335083, -0.9764142632484436, -0.9453287124633789, -0.9142431616783142, -0.8831576108932495, -0.8520721197128296, -0.8209865093231201, -0.7899009585380554, -0.7588154077529907, -0.727729856967926, -0.6966443061828613, -0.6655587553977966, -0.6344732046127319, -0.603387713432312, -0.5723021626472473, -0.5412166118621826, -0.5101310610771179, -0.4790455102920532, -0.4479599595069885, -0.41687440872192383, -0.3857888877391815, -0.3547033369541168, -0.3236177861690521, -0.2925322353839874, -0.26144668459892273, -0.23036114871501923, -0.19927559792995453, -0.16819004714488983, -0.13710451126098633, -0.10601896047592163, -0.07493340969085693, -0.043847862631082535, -0.012762315571308136, 0.018323227763175964, 0.04940877854824066, 0.08049432933330536, 0.11157986521720886, 0.14266541600227356, 0.17375096678733826, 0.20483651757240295, 0.23592206835746765, 0.26700758934020996, 0.29809314012527466, 0.32917869091033936, 0.36026424169540405, 0.39134979248046875, 0.42243534326553345, 0.45352089405059814, 0.48460644483566284, 0.5156919956207275, 0.5467775464057922, 0.5778630971908569, 0.6089485883712769, 0.6400341987609863, 0.6711196899414062, 0.702205240726471, 0.7332907915115356, 0.7643763422966003, 0.795461893081665, 0.8265474438667297, 0.8576329946517944, 0.8887184858322144, 0.9198040962219238]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 10.0, 10.0, 12.0, 18.0, 15.0, 32.0, 36.0, 67.0, 118.0, 207.0, 431.0, 1001.0, 2400.0, 6808.0, 24195.0, 108145.0, 445487.0, 356325.0, 76634.0, 17774.0, 5259.0, 1930.0, 770.0, 369.0, 192.0, 98.0, 49.0, 42.0, 26.0, 24.0, 14.0, 18.0, 9.0, 12.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13134765625, -0.12663841247558594, -0.12192916870117188, -0.11721992492675781, -0.11251068115234375, -0.10780143737792969, -0.10309219360351562, -0.09838294982910156, -0.0936737060546875, -0.08896446228027344, -0.08425521850585938, -0.07954597473144531, -0.07483673095703125, -0.07012748718261719, -0.06541824340820312, -0.06070899963378906, -0.055999755859375, -0.05129051208496094, -0.046581268310546875, -0.04187202453613281, -0.03716278076171875, -0.03245353698730469, -0.027744293212890625, -0.023035049438476562, -0.0183258056640625, -0.013616561889648438, -0.008907318115234375, -0.0041980743408203125, 0.00051116943359375, 0.0052204132080078125, 0.009929656982421875, 0.014638900756835938, 0.01934814453125, 0.024057388305664062, 0.028766632080078125, 0.03347587585449219, 0.03818511962890625, 0.04289436340332031, 0.047603607177734375, 0.05231285095214844, 0.0570220947265625, 0.06173133850097656, 0.06644058227539062, 0.07114982604980469, 0.07585906982421875, 0.08056831359863281, 0.08527755737304688, 0.08998680114746094, 0.094696044921875, 0.09940528869628906, 0.10411453247070312, 0.10882377624511719, 0.11353302001953125, 0.11824226379394531, 0.12295150756835938, 0.12766075134277344, 0.1323699951171875, 0.13707923889160156, 0.14178848266601562, 0.1464977264404297, 0.15120697021484375, 0.1559162139892578, 0.16062545776367188, 0.16533470153808594, 0.1700439453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 9.0, 8.0, 10.0, 13.0, 9.0, 10.0, 17.0, 26.0, 28.0, 31.0, 31.0, 33.0, 33.0, 35.0, 42.0, 52.0, 38.0, 47.0, 32.0, 36.0, 42.0, 36.0, 36.0, 44.0, 35.0, 41.0, 36.0, 32.0, 28.0, 25.0, 20.0, 13.0, 15.0, 12.0, 11.0, 11.0, 3.0, 9.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.14892578125, -0.14438438415527344, -0.13984298706054688, -0.1353015899658203, -0.13076019287109375, -0.1262187957763672, -0.12167739868164062, -0.11713600158691406, -0.1125946044921875, -0.10805320739746094, -0.10351181030273438, -0.09897041320800781, -0.09442901611328125, -0.08988761901855469, -0.08534622192382812, -0.08080482482910156, -0.076263427734375, -0.07172203063964844, -0.06718063354492188, -0.06263923645019531, -0.05809783935546875, -0.05355644226074219, -0.049015045166015625, -0.04447364807128906, -0.0399322509765625, -0.03539085388183594, -0.030849456787109375, -0.026308059692382812, -0.02176666259765625, -0.017225265502929688, -0.012683868408203125, -0.008142471313476562, -0.00360107421875, 0.0009403228759765625, 0.005481719970703125, 0.010023117065429688, 0.01456451416015625, 0.019105911254882812, 0.023647308349609375, 0.028188705444335938, 0.0327301025390625, 0.03727149963378906, 0.041812896728515625, 0.04635429382324219, 0.05089569091796875, 0.05543708801269531, 0.059978485107421875, 0.06451988220214844, 0.069061279296875, 0.07360267639160156, 0.07814407348632812, 0.08268547058105469, 0.08722686767578125, 0.09176826477050781, 0.09630966186523438, 0.10085105895996094, 0.1053924560546875, 0.10993385314941406, 0.11447525024414062, 0.11901664733886719, 0.12355804443359375, 0.1280994415283203, 0.13264083862304688, 0.13718223571777344, 0.1417236328125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 6.0, 5.0, 14.0, 13.0, 34.0, 40.0, 78.0, 85.0, 148.0, 226.0, 407.0, 748.0, 1343.0, 2490.0, 5531.0, 13341.0, 37357.0, 129306.0, 527623.0, 234151.0, 60453.0, 19985.0, 7811.0, 3492.0, 1677.0, 875.0, 479.0, 287.0, 174.0, 126.0, 81.0, 48.0, 37.0, 17.0, 15.0, 11.0, 9.0, 2.0, 7.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.09547996520996094, -0.09226608276367188, -0.08905220031738281, -0.08583831787109375, -0.08262443542480469, -0.07941055297851562, -0.07619667053222656, -0.0729827880859375, -0.06976890563964844, -0.06655502319335938, -0.06334114074707031, -0.06012725830078125, -0.05691337585449219, -0.053699493408203125, -0.05048561096191406, -0.047271728515625, -0.04405784606933594, -0.040843963623046875, -0.03763008117675781, -0.03441619873046875, -0.031202316284179688, -0.027988433837890625, -0.024774551391601562, -0.0215606689453125, -0.018346786499023438, -0.015132904052734375, -0.011919021606445312, -0.00870513916015625, -0.0054912567138671875, -0.002277374267578125, 0.0009365081787109375, 0.004150390625, 0.0073642730712890625, 0.010578155517578125, 0.013792037963867188, 0.01700592041015625, 0.020219802856445312, 0.023433685302734375, 0.026647567749023438, 0.0298614501953125, 0.03307533264160156, 0.036289215087890625, 0.03950309753417969, 0.04271697998046875, 0.04593086242675781, 0.049144744873046875, 0.05235862731933594, 0.055572509765625, 0.05878639221191406, 0.062000274658203125, 0.06521415710449219, 0.06842803955078125, 0.07164192199707031, 0.07485580444335938, 0.07806968688964844, 0.0812835693359375, 0.08449745178222656, 0.08771133422851562, 0.09092521667480469, 0.09413909912109375, 0.09735298156738281, 0.10056686401367188, 0.10378074645996094, 0.10699462890625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 7.0, 0.0, 4.0, 7.0, 6.0, 10.0, 12.0, 24.0, 16.0, 17.0, 22.0, 30.0, 40.0, 34.0, 42.0, 33.0, 59.0, 61.0, 61.0, 55.0, 62.0, 50.0, 50.0, 37.0, 38.0, 38.0, 25.0, 29.0, 26.0, 22.0, 18.0, 6.0, 11.0, 13.0, 4.0, 5.0, 5.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.402099609375, -0.3903541564941406, -0.37860870361328125, -0.3668632507324219, -0.3551177978515625, -0.3433723449707031, -0.33162689208984375, -0.3198814392089844, -0.308135986328125, -0.2963905334472656, -0.28464508056640625, -0.2728996276855469, -0.2611541748046875, -0.24940872192382812, -0.23766326904296875, -0.22591781616210938, -0.21417236328125, -0.20242691040039062, -0.19068145751953125, -0.17893600463867188, -0.1671905517578125, -0.15544509887695312, -0.14369964599609375, -0.13195419311523438, -0.120208740234375, -0.10846328735351562, -0.09671783447265625, -0.08497238159179688, -0.0732269287109375, -0.061481475830078125, -0.04973602294921875, -0.037990570068359375, -0.0262451171875, -0.014499664306640625, -0.00275421142578125, 0.008991241455078125, 0.0207366943359375, 0.032482147216796875, 0.04422760009765625, 0.055973052978515625, 0.067718505859375, 0.07946395874023438, 0.09120941162109375, 0.10295486450195312, 0.1147003173828125, 0.12644577026367188, 0.13819122314453125, 0.14993667602539062, 0.16168212890625, 0.17342758178710938, 0.18517303466796875, 0.19691848754882812, 0.2086639404296875, 0.22040939331054688, 0.23215484619140625, 0.24390029907226562, 0.255645751953125, 0.2673912048339844, 0.27913665771484375, 0.2908821105957031, 0.3026275634765625, 0.3143730163574219, 0.32611846923828125, 0.3378639221191406, 0.349609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 13.0, 18.0, 11.0, 29.0, 34.0, 74.0, 148.0, 356.0, 1202.0, 8175.0, 192736.0, 812020.0, 29966.0, 2653.0, 598.0, 235.0, 111.0, 57.0, 38.0, 32.0, 17.0, 8.0, 6.0, 6.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.080078125, -0.07759380340576172, -0.07510948181152344, -0.07262516021728516, -0.07014083862304688, -0.0676565170288086, -0.06517219543457031, -0.06268787384033203, -0.06020355224609375, -0.05771923065185547, -0.05523490905761719, -0.052750587463378906, -0.050266265869140625, -0.047781944274902344, -0.04529762268066406, -0.04281330108642578, -0.0403289794921875, -0.03784465789794922, -0.03536033630371094, -0.032876014709472656, -0.030391693115234375, -0.027907371520996094, -0.025423049926757812, -0.02293872833251953, -0.02045440673828125, -0.01797008514404297, -0.015485763549804688, -0.013001441955566406, -0.010517120361328125, -0.008032798767089844, -0.0055484771728515625, -0.0030641555786132812, -0.000579833984375, 0.0019044876098632812, 0.0043888092041015625, 0.006873130798339844, 0.009357452392578125, 0.011841773986816406, 0.014326095581054688, 0.01681041717529297, 0.01929473876953125, 0.02177906036376953, 0.024263381958007812, 0.026747703552246094, 0.029232025146484375, 0.031716346740722656, 0.03420066833496094, 0.03668498992919922, 0.0391693115234375, 0.04165363311767578, 0.04413795471191406, 0.046622276306152344, 0.049106597900390625, 0.051590919494628906, 0.05407524108886719, 0.05655956268310547, 0.05904388427734375, 0.06152820587158203, 0.06401252746582031, 0.0664968490600586, 0.06898117065429688, 0.07146549224853516, 0.07394981384277344, 0.07643413543701172, 0.07891845703125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 4.0, 2.0, 2.0, 11.0, 11.0, 11.0, 15.0, 23.0, 33.0, 37.0, 31.0, 40.0, 56.0, 47.0, 60.0, 74.0, 73.0, 63.0, 60.0, 68.0, 56.0, 49.0, 34.0, 34.0, 26.0, 23.0, 16.0, 9.0, 5.0, 6.0, 6.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.64267349243164e-06, -8.352100849151611e-06, -8.061528205871582e-06, -7.770955562591553e-06, -7.4803829193115234e-06, -7.189810276031494e-06, -6.899237632751465e-06, -6.6086649894714355e-06, -6.318092346191406e-06, -6.027519702911377e-06, -5.736947059631348e-06, -5.446374416351318e-06, -5.155801773071289e-06, -4.86522912979126e-06, -4.5746564865112305e-06, -4.284083843231201e-06, -3.993511199951172e-06, -3.7029385566711426e-06, -3.4123659133911133e-06, -3.121793270111084e-06, -2.8312206268310547e-06, -2.5406479835510254e-06, -2.250075340270996e-06, -1.959502696990967e-06, -1.6689300537109375e-06, -1.3783574104309082e-06, -1.087784767150879e-06, -7.972121238708496e-07, -5.066394805908203e-07, -2.1606683731079102e-07, 7.450580596923828e-08, 3.650784492492676e-07, 6.556510925292969e-07, 9.462237358093262e-07, 1.2367963790893555e-06, 1.5273690223693848e-06, 1.817941665649414e-06, 2.1085143089294434e-06, 2.3990869522094727e-06, 2.689659595489502e-06, 2.9802322387695312e-06, 3.2708048820495605e-06, 3.56137752532959e-06, 3.851950168609619e-06, 4.1425228118896484e-06, 4.433095455169678e-06, 4.723668098449707e-06, 5.014240741729736e-06, 5.304813385009766e-06, 5.595386028289795e-06, 5.885958671569824e-06, 6.1765313148498535e-06, 6.467103958129883e-06, 6.757676601409912e-06, 7.048249244689941e-06, 7.338821887969971e-06, 7.62939453125e-06, 7.91996717453003e-06, 8.210539817810059e-06, 8.501112461090088e-06, 8.791685104370117e-06, 9.082257747650146e-06, 9.372830390930176e-06, 9.663403034210205e-06, 9.953975677490234e-06]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 6.0, 2.0, 12.0, 10.0, 9.0, 21.0, 22.0, 25.0, 36.0, 40.0, 79.0, 97.0, 145.0, 313.0, 607.0, 1113.0, 2578.0, 7552.0, 26993.0, 122689.0, 577120.0, 240273.0, 49170.0, 12260.0, 4009.0, 1593.0, 784.0, 369.0, 233.0, 128.0, 66.0, 54.0, 41.0, 28.0, 19.0, 16.0, 11.0, 8.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.048065185546875, -0.04671907424926758, -0.045372962951660156, -0.044026851654052734, -0.04268074035644531, -0.04133462905883789, -0.03998851776123047, -0.03864240646362305, -0.037296295166015625, -0.0359501838684082, -0.03460407257080078, -0.03325796127319336, -0.03191184997558594, -0.030565738677978516, -0.029219627380371094, -0.027873516082763672, -0.02652740478515625, -0.025181293487548828, -0.023835182189941406, -0.022489070892333984, -0.021142959594726562, -0.01979684829711914, -0.01845073699951172, -0.017104625701904297, -0.015758514404296875, -0.014412403106689453, -0.013066291809082031, -0.01172018051147461, -0.010374069213867188, -0.009027957916259766, -0.007681846618652344, -0.006335735321044922, -0.0049896240234375, -0.003643512725830078, -0.0022974014282226562, -0.0009512901306152344, 0.0003948211669921875, 0.0017409324645996094, 0.0030870437622070312, 0.004433155059814453, 0.005779266357421875, 0.007125377655029297, 0.008471488952636719, 0.00981760025024414, 0.011163711547851562, 0.012509822845458984, 0.013855934143066406, 0.015202045440673828, 0.01654815673828125, 0.017894268035888672, 0.019240379333496094, 0.020586490631103516, 0.021932601928710938, 0.02327871322631836, 0.02462482452392578, 0.025970935821533203, 0.027317047119140625, 0.028663158416748047, 0.03000926971435547, 0.03135538101196289, 0.03270149230957031, 0.034047603607177734, 0.035393714904785156, 0.03673982620239258, 0.0380859375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 5.0, 12.0, 10.0, 23.0, 33.0, 49.0, 79.0, 119.0, 137.0, 122.0, 116.0, 93.0, 80.0, 43.0, 38.0, 17.0, 11.0, 8.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09429931640625, -0.09129714965820312, -0.08829498291015625, -0.08529281616210938, -0.0822906494140625, -0.07928848266601562, -0.07628631591796875, -0.07328414916992188, -0.070281982421875, -0.06727981567382812, -0.06427764892578125, -0.061275482177734375, -0.0582733154296875, -0.055271148681640625, -0.05226898193359375, -0.049266815185546875, -0.0462646484375, -0.043262481689453125, -0.04026031494140625, -0.037258148193359375, -0.0342559814453125, -0.031253814697265625, -0.02825164794921875, -0.025249481201171875, -0.022247314453125, -0.019245147705078125, -0.01624298095703125, -0.013240814208984375, -0.0102386474609375, -0.007236480712890625, -0.00423431396484375, -0.001232147216796875, 0.00177001953125, 0.004772186279296875, 0.00777435302734375, 0.010776519775390625, 0.0137786865234375, 0.016780853271484375, 0.01978302001953125, 0.022785186767578125, 0.025787353515625, 0.028789520263671875, 0.03179168701171875, 0.034793853759765625, 0.0377960205078125, 0.040798187255859375, 0.04380035400390625, 0.046802520751953125, 0.0498046875, 0.052806854248046875, 0.05580902099609375, 0.058811187744140625, 0.0618133544921875, 0.06481552124023438, 0.06781768798828125, 0.07081985473632812, 0.073822021484375, 0.07682418823242188, 0.07982635498046875, 0.08282852172851562, 0.0858306884765625, 0.08883285522460938, 0.09183502197265625, 0.09483718872070312, 0.09783935546875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 11.0, 5.0, 9.0, 14.0, 28.0, 65.0, 146.0, 228.0, 229.0, 131.0, 79.0, 30.0, 18.0, 8.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.843483328819275, -1.790568232536316, -1.7376530170440674, -1.6847379207611084, -1.6318227052688599, -1.5789076089859009, -1.5259923934936523, -1.4730772972106934, -1.4201622009277344, -1.3672471046447754, -1.3143318891525269, -1.2614167928695679, -1.2085015773773193, -1.1555864810943604, -1.1026713848114014, -1.0497561693191528, -0.9968409538269043, -0.9439257979393005, -0.8910106420516968, -0.8380955457687378, -0.7851803302764893, -0.7322652339935303, -0.6793500781059265, -0.6264349222183228, -0.573519766330719, -0.5206046104431152, -0.4676894545555115, -0.4147743284702301, -0.36185917258262634, -0.3089440166950226, -0.2560288906097412, -0.20311373472213745, -0.15019869804382324, -0.09728354960680008, -0.044368401169776917, 0.00854673981666565, 0.06146189570426941, 0.11437705159187317, 0.16729217767715454, 0.2202073335647583, 0.27312248945236206, 0.3260376453399658, 0.3789528012275696, 0.43186792731285095, 0.4847830832004547, 0.5376982688903809, 0.5906133651733398, 0.6435285210609436, 0.6964436769485474, 0.7493588328361511, 0.8022739887237549, 0.8551890850067139, 0.9081043004989624, 0.9610193967819214, 1.01393461227417, 1.066849708557129, 1.119764804840088, 1.1726799011230469, 1.2255951166152954, 1.2785102128982544, 1.331425428390503, 1.384340524673462, 1.437255620956421, 1.4901708364486694, 1.543086051940918]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 18.0, 14.0, 9.0, 17.0, 21.0, 17.0, 25.0, 33.0, 20.0, 30.0, 34.0, 49.0, 39.0, 56.0, 58.0, 44.0, 44.0, 52.0, 39.0, 45.0, 31.0, 35.0, 32.0, 27.0, 21.0, 24.0, 21.0, 22.0, 14.0, 17.0, 15.0, 7.0, 6.0, 7.0, 7.0, 9.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9225377440452576, -0.8934921026229858, -0.8644464612007141, -0.8354008197784424, -0.8063551187515259, -0.7773095369338989, -0.7482638359069824, -0.7192181944847107, -0.690172553062439, -0.6611269116401672, -0.6320812702178955, -0.6030356287956238, -0.573989987373352, -0.5449442863464355, -0.5158986449241638, -0.4868530035018921, -0.45780736207962036, -0.42876172065734863, -0.3997160792350769, -0.3706704080104828, -0.34162476658821106, -0.31257912516593933, -0.2835334539413452, -0.2544878125190735, -0.22544217109680176, -0.19639652967453003, -0.1673508733510971, -0.13830521702766418, -0.10925957560539246, -0.08021393418312073, -0.051168277859687805, -0.022122621536254883, 0.006923079490661621, 0.03596872836351395, 0.06501437723636627, 0.0940600261092186, 0.12310567498207092, 0.15215131640434265, 0.18119697272777557, 0.2102426290512085, 0.23928827047348022, 0.26833391189575195, 0.2973795533180237, 0.3264252245426178, 0.3554708659648895, 0.38451650738716125, 0.41356217861175537, 0.4426078200340271, 0.47165346145629883, 0.5006991028785706, 0.5297447443008423, 0.558790385723114, 0.5878360271453857, 0.6168817281723022, 0.645927369594574, 0.6749730110168457, 0.7040186524391174, 0.7330642938613892, 0.7621099352836609, 0.7911555767059326, 0.8202012777328491, 0.8492468595504761, 0.8782925605773926, 0.9073382019996643, 0.936383843421936]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 6.0, 3.0, 2.0, 7.0, 3.0, 11.0, 9.0, 11.0, 7.0, 17.0, 20.0, 22.0, 15.0, 30.0, 44.0, 60.0, 132.0, 270.0, 107.0, 58.0, 32.0, 27.0, 23.0, 24.0, 20.0, 8.0, 13.0, 13.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1295166015625, -0.12315940856933594, -0.11680221557617188, -0.11044502258300781, -0.10408782958984375, -0.09773063659667969, -0.09137344360351562, -0.08501625061035156, -0.0786590576171875, -0.07230186462402344, -0.06594467163085938, -0.05958747863769531, -0.05323028564453125, -0.04687309265136719, -0.040515899658203125, -0.03415870666503906, -0.027801513671875, -0.021444320678710938, -0.015087127685546875, -0.008729934692382812, -0.00237274169921875, 0.0039844512939453125, 0.010341644287109375, 0.016698837280273438, 0.0230560302734375, 0.029413223266601562, 0.035770416259765625, 0.04212760925292969, 0.04848480224609375, 0.05484199523925781, 0.061199188232421875, 0.06755638122558594, 0.07391357421875, 0.08027076721191406, 0.08662796020507812, 0.09298515319824219, 0.09934234619140625, 0.10569953918457031, 0.11205673217773438, 0.11841392517089844, 0.1247711181640625, 0.13112831115722656, 0.13748550415039062, 0.1438426971435547, 0.15019989013671875, 0.1565570831298828, 0.16291427612304688, 0.16927146911621094, 0.175628662109375, 0.18198585510253906, 0.18834304809570312, 0.1947002410888672, 0.20105743408203125, 0.2074146270751953, 0.21377182006835938, 0.22012901306152344, 0.2264862060546875, 0.23284339904785156, 0.23920059204101562, 0.2455577850341797, 0.25191497802734375, 0.2582721710205078, 0.2646293640136719, 0.27098655700683594, 0.27734375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 1.0, 1.0, 2.0, 5.0, 4.0, 15.0, 11.0, 28.0, 32.0, 52.0, 94.0, 126.0, 277.0, 569.0, 1254.0, 3309.0, 12030.0, 309843.0, 8036637.0, 16832.0, 4359.0, 1584.0, 675.0, 332.0, 208.0, 107.0, 57.0, 42.0, 23.0, 28.0, 22.0, 9.0, 8.0, 8.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8093006610870361, -0.7880585789680481, -0.7668164968490601, -0.745574414730072, -0.724332332611084, -0.703090250492096, -0.6818481683731079, -0.6606060266494751, -0.6393640041351318, -0.6181219220161438, -0.5968798398971558, -0.5756377577781677, -0.5543956756591797, -0.5331535935401917, -0.5119115114212036, -0.4906693994998932, -0.46942728757858276, -0.4481852054595947, -0.4269431233406067, -0.40570104122161865, -0.3844589591026306, -0.3632168769836426, -0.34197476506233215, -0.3207326829433441, -0.2994906008243561, -0.27824851870536804, -0.25700643658638, -0.23576433956623077, -0.21452225744724274, -0.1932801753282547, -0.17203807830810547, -0.15079599618911743, -0.1295539140701294, -0.10831183195114136, -0.08706974238157272, -0.06582765281200409, -0.04458557069301605, -0.023343488574028015, -0.002101391553878784, 0.019140690565109253, 0.04038277268409729, 0.061624858528375626, 0.08286694437265396, 0.1041090339422226, 0.12535111606121063, 0.14659319818019867, 0.1678352952003479, 0.18907737731933594, 0.21031945943832397, 0.231561541557312, 0.25280362367630005, 0.2740457057952881, 0.2952877879142761, 0.31652987003326416, 0.3377719819545746, 0.3590140640735626, 0.38025614619255066, 0.4014982283115387, 0.42274031043052673, 0.44398242235183716, 0.4652245044708252, 0.48646658658981323, 0.5077086687088013, 0.5289507508277893, 0.5501928329467773]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 2.0, 8.0, 3.0, 4.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.44891950488090515, -0.4265523850917816, -0.4041852653026581, -0.38181814551353455, -0.359451025724411, -0.3370839059352875, -0.31471681594848633, -0.2923496961593628, -0.26998257637023926, -0.24761545658111572, -0.2252483367919922, -0.20288121700286865, -0.18051409721374512, -0.15814697742462158, -0.13577987253665924, -0.1134127527475357, -0.09104561805725098, -0.06867849826812744, -0.046311382204294205, -0.023944266140460968, -0.0015771463513374329, 0.020789973437786102, 0.04315708577632904, 0.06552420556545258, 0.08789132535457611, 0.11025844514369965, 0.13262556493282318, 0.15499266982078552, 0.17735978960990906, 0.1997269093990326, 0.22209402918815613, 0.24446114897727966, 0.2668282389640808, 0.28919535875320435, 0.3115624785423279, 0.3339295983314514, 0.35629671812057495, 0.3786638379096985, 0.401030957698822, 0.42339807748794556, 0.4457651972770691, 0.4681323170661926, 0.49049943685531616, 0.5128665566444397, 0.5352336764335632, 0.5576007962226868, 0.5799679160118103, 0.6023350358009338, 0.6247020959854126, 0.6470692157745361, 0.6694363355636597, 0.6918034553527832, 0.7141705751419067, 0.7365376949310303, 0.7589048147201538, 0.7812719345092773, 0.8036390542984009, 0.8260061740875244, 0.848373293876648, 0.8707404136657715, 0.893107533454895, 0.9154746532440186, 0.9378417730331421, 0.9602088928222656, 0.9825760126113892]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 3.0, 7.0, 1.0, 9.0, 8.0, 14.0, 11.0, 18.0, 22.0, 24.0, 37.0, 38.0, 26.0, 53.0, 49.0, 63.0, 52.0, 65.0, 57.0, 62.0, 58.0, 48.0, 55.0, 38.0, 30.0, 34.0, 37.0, 17.0, 14.0, 13.0, 12.0, 7.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.074462890625, -0.07196044921875, -0.0694580078125, -0.06695556640625, -0.064453125, -0.06195068359375, -0.0594482421875, -0.05694580078125, -0.054443359375, -0.05194091796875, -0.0494384765625, -0.04693603515625, -0.04443359375, -0.04193115234375, -0.0394287109375, -0.03692626953125, -0.034423828125, -0.03192138671875, -0.0294189453125, -0.02691650390625, -0.0244140625, -0.02191162109375, -0.0194091796875, -0.01690673828125, -0.014404296875, -0.01190185546875, -0.0093994140625, -0.00689697265625, -0.00439453125, -0.00189208984375, 0.0006103515625, 0.00311279296875, 0.005615234375, 0.00811767578125, 0.0106201171875, 0.01312255859375, 0.015625, 0.01812744140625, 0.0206298828125, 0.02313232421875, 0.025634765625, 0.02813720703125, 0.0306396484375, 0.03314208984375, 0.03564453125, 0.03814697265625, 0.0406494140625, 0.04315185546875, 0.045654296875, 0.04815673828125, 0.0506591796875, 0.05316162109375, 0.0556640625, 0.05816650390625, 0.0606689453125, 0.06317138671875, 0.065673828125, 0.06817626953125, 0.0706787109375, 0.07318115234375, 0.07568359375, 0.07818603515625, 0.0806884765625, 0.08319091796875, 0.085693359375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 13.0, 12.0, 20.0, 28.0, 18.0, 34.0, 42.0, 64.0, 107.0, 126.0, 199.0, 285.0, 407.0, 700.0, 1032.0, 1642.0, 2665.0, 4698.0, 8524.0, 16473.0, 38126.0, 109717.0, 189562.0, 86204.0, 31432.0, 14263.0, 7246.0, 4105.0, 2388.0, 1417.0, 898.0, 585.0, 364.0, 242.0, 183.0, 104.0, 87.0, 67.0, 47.0, 28.0, 25.0, 25.0, 15.0, 9.0, 11.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.4677734375, -1.4238128662109375, -1.379852294921875, -1.3358917236328125, -1.29193115234375, -1.2479705810546875, -1.204010009765625, -1.1600494384765625, -1.1160888671875, -1.0721282958984375, -1.028167724609375, -0.9842071533203125, -0.94024658203125, -0.8962860107421875, -0.852325439453125, -0.8083648681640625, -0.764404296875, -0.7204437255859375, -0.676483154296875, -0.6325225830078125, -0.58856201171875, -0.5446014404296875, -0.500640869140625, -0.4566802978515625, -0.4127197265625, -0.3687591552734375, -0.324798583984375, -0.2808380126953125, -0.23687744140625, -0.1929168701171875, -0.148956298828125, -0.1049957275390625, -0.06103515625, -0.0170745849609375, 0.026885986328125, 0.0708465576171875, 0.11480712890625, 0.1587677001953125, 0.202728271484375, 0.2466888427734375, 0.2906494140625, 0.3346099853515625, 0.378570556640625, 0.4225311279296875, 0.46649169921875, 0.5104522705078125, 0.554412841796875, 0.5983734130859375, 0.642333984375, 0.6862945556640625, 0.730255126953125, 0.7742156982421875, 0.81817626953125, 0.8621368408203125, 0.906097412109375, 0.9500579833984375, 0.9940185546875, 1.0379791259765625, 1.081939697265625, 1.1259002685546875, 1.16986083984375, 1.2138214111328125, 1.257781982421875, 1.3017425537109375, 1.345703125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 2.0, 3.0, 6.0, 6.0, 11.0, 19.0, 15.0, 21.0, 26.0, 27.0, 27.0, 52.0, 41.0, 49.0, 54.0, 57.0, 52.0, 66.0, 64.0, 49.0, 53.0, 49.0, 43.0, 35.0, 40.0, 28.0, 28.0, 21.0, 10.0, 11.0, 11.0, 6.0, 4.0, 2.0, 9.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.22021484375, -0.21476364135742188, -0.20931243896484375, -0.20386123657226562, -0.1984100341796875, -0.19295883178710938, -0.18750762939453125, -0.18205642700195312, -0.176605224609375, -0.17115402221679688, -0.16570281982421875, -0.16025161743164062, -0.1548004150390625, -0.14934921264648438, -0.14389801025390625, -0.13844680786132812, -0.13299560546875, -0.12754440307617188, -0.12209320068359375, -0.11664199829101562, -0.1111907958984375, -0.10573959350585938, -0.10028839111328125, -0.09483718872070312, -0.089385986328125, -0.08393478393554688, -0.07848358154296875, -0.07303237915039062, -0.0675811767578125, -0.062129974365234375, -0.05667877197265625, -0.051227569580078125, -0.0457763671875, -0.040325164794921875, -0.03487396240234375, -0.029422760009765625, -0.0239715576171875, -0.018520355224609375, -0.01306915283203125, -0.007617950439453125, -0.002166748046875, 0.003284454345703125, 0.00873565673828125, 0.014186859130859375, 0.0196380615234375, 0.025089263916015625, 0.03054046630859375, 0.035991668701171875, 0.04144287109375, 0.046894073486328125, 0.05234527587890625, 0.057796478271484375, 0.0632476806640625, 0.06869888305664062, 0.07415008544921875, 0.07960128784179688, 0.085052490234375, 0.09050369262695312, 0.09595489501953125, 0.10140609741210938, 0.1068572998046875, 0.11230850219726562, 0.11775970458984375, 0.12321090698242188, 0.128662109375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 3.0, 9.0, 17.0, 17.0, 12.0, 25.0, 27.0, 43.0, 54.0, 57.0, 52.0, 39.0, 29.0, 25.0, 17.0, 8.0, 5.0, 6.0, 6.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5446550846099854, -0.5246884822845459, -0.5047218799591064, -0.484755277633667, -0.46478867530822754, -0.4448220729827881, -0.424855500459671, -0.40488889813423157, -0.3849222958087921, -0.36495569348335266, -0.3449890911579132, -0.32502248883247375, -0.3050559163093567, -0.28508931398391724, -0.2651227116584778, -0.24515610933303833, -0.22518950700759888, -0.20522290468215942, -0.18525630235671997, -0.1652897149324417, -0.14532311260700226, -0.1253565102815628, -0.10538991540670395, -0.08542332053184509, -0.06545671820640564, -0.045490119606256485, -0.02552352100610733, -0.005556922405958176, 0.014409676194190979, 0.03437627851963043, 0.05434287339448929, 0.07430946826934814, 0.0942760705947876, 0.11424267292022705, 0.1342092752456665, 0.15417586266994476, 0.17414246499538422, 0.19410906732082367, 0.21407565474510193, 0.23404225707054138, 0.25400885939598083, 0.2739754617214203, 0.29394206404685974, 0.3139086663722992, 0.33387523889541626, 0.3538418412208557, 0.37380844354629517, 0.3937750458717346, 0.4137416481971741, 0.4337082505226135, 0.453674852848053, 0.47364145517349243, 0.4936080574989319, 0.5135746598243713, 0.5335412621498108, 0.5535078048706055, 0.5734744071960449, 0.5934410095214844, 0.6134076118469238, 0.6333742141723633, 0.6533408164978027, 0.6733074188232422, 0.6932740211486816, 0.7132406234741211, 0.7332072257995605]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 7.0, 3.0, 5.0, 6.0, 12.0, 12.0, 9.0, 10.0, 14.0, 17.0, 42.0, 80.0, 108.0, 57.0, 20.0, 15.0, 17.0, 5.0, 9.0, 6.0, 5.0, 6.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7455165982246399, -0.720504879951477, -0.6954931616783142, -0.6704814434051514, -0.6454697847366333, -0.6204580068588257, -0.5954463481903076, -0.5704346299171448, -0.5454229116439819, -0.5204111933708191, -0.49539947509765625, -0.4703877866268158, -0.44537606835365295, -0.4203643500804901, -0.39535266160964966, -0.3703409433364868, -0.345329225063324, -0.32031750679016113, -0.2953057885169983, -0.27029410004615784, -0.245282381772995, -0.22027066349983215, -0.1952589601278305, -0.17024725675582886, -0.14523553848266602, -0.12022382766008377, -0.09521211683750153, -0.07020040601491928, -0.045188695192337036, -0.020176976919174194, 0.004834726452827454, 0.0298464298248291, 0.05485814809799194, 0.07986985892057419, 0.10488156974315643, 0.12989327311515808, 0.15490499138832092, 0.17991670966148376, 0.2049284130334854, 0.22994011640548706, 0.2549518346786499, 0.27996355295181274, 0.3049752712249756, 0.32998695969581604, 0.3549986779689789, 0.3800103962421417, 0.4050220847129822, 0.430033802986145, 0.45504552125930786, 0.4800572395324707, 0.5050689578056335, 0.5300806760787964, 0.5550923347473145, 0.5801041126251221, 0.6051157712936401, 0.630127489566803, 0.6551392078399658, 0.6801509261131287, 0.7051626443862915, 0.7301743626594543, 0.7551860809326172, 0.7801977396011353, 0.8052094578742981, 0.8302211761474609, 0.8552328944206238]}, "eval/loss": 1.9121204614639282, "eval/bleu": 2.0001405343797235e-14, "eval/runtime": 2596.1075, "eval/samples_per_second": 5.685, "eval/steps_per_second": 0.711} \ No newline at end of file +{"train/loss": 1.288, "train/learning_rate": 9.405963302752294e-05, "train/epoch": 2.16, "train/global_step": 3500, "_runtime": 50225, "_timestamp": 1651822523, "_step": 3506, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 9.0, 37.0, 77.0, 194.0, 261.0, 226.0, 108.0, 64.0, 28.0, 6.0, 3.0], "bins": [-4.193824768066406, -4.121095180511475, -4.048366069793701, -3.9756367206573486, -3.902907371520996, -3.8301777839660645, -3.757448434829712, -3.6847190856933594, -3.611989736557007, -3.5392603874206543, -3.4665310382843018, -3.393801689147949, -3.3210721015930176, -3.248342752456665, -3.1756134033203125, -3.10288405418396, -3.0301547050476074, -2.957425355911255, -2.8846960067749023, -2.81196665763855, -2.7392373085021973, -2.6665077209472656, -2.593778371810913, -2.5210490226745605, -2.448319673538208, -2.3755903244018555, -2.302860975265503, -2.2301316261291504, -2.1574020385742188, -2.084672689437866, -2.0119433403015137, -1.9392139911651611, -1.8664848804473877, -1.7937555313110352, -1.7210261821746826, -1.6482967138290405, -1.575567364692688, -1.5028380155563354, -1.4301085472106934, -1.3573791980743408, -1.2846498489379883, -1.2119204998016357, -1.1391911506652832, -1.0664616823196411, -0.9937323331832886, -0.921002984046936, -0.8482735753059387, -0.7755441665649414, -0.7028148174285889, -0.6300854682922363, -0.557356059551239, -0.4846266806125641, -0.41189730167388916, -0.33916792273521423, -0.2664385437965393, -0.193709135055542, -0.12097975611686707, -0.04825037717819214, 0.024479001760482788, 0.09720838069915771, 0.16993775963783264, 0.24266713857650757, 0.3153965175151825, 0.3881259262561798, 0.46085527539253235]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 4.0, 10.0, 6.0, 6.0, 12.0, 12.0, 16.0, 18.0, 20.0, 26.0, 19.0, 27.0, 21.0, 26.0, 31.0, 36.0, 36.0, 34.0, 40.0, 40.0, 41.0, 43.0, 39.0, 34.0, 32.0, 35.0, 36.0, 34.0, 33.0, 25.0, 31.0, 14.0, 27.0, 18.0, 30.0, 12.0, 14.0, 10.0, 7.0, 8.0, 7.0, 8.0, 9.0, 2.0, 6.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.7703433036804199, -0.7468107342720032, -0.7232781648635864, -0.6997455358505249, -0.6762129664421082, -0.6526803970336914, -0.6291478276252747, -0.6056152582168579, -0.5820826292037964, -0.5585500597953796, -0.5350174903869629, -0.5114848613739014, -0.4879522919654846, -0.46441972255706787, -0.4408871531486511, -0.4173545837402344, -0.3938220143318176, -0.3702894449234009, -0.34675684571266174, -0.323224276304245, -0.29969167709350586, -0.2761591076850891, -0.25262653827667236, -0.22909395396709442, -0.20556136965751648, -0.18202878534793854, -0.1584962010383606, -0.13496363162994385, -0.1114310473203659, -0.08789846301078796, -0.06436589360237122, -0.040833309292793274, -0.017300784587860107, 0.006231795996427536, 0.02976437658071518, 0.053296953439712524, 0.07682953774929047, 0.10036212205886841, 0.12389469146728516, 0.1474272757768631, 0.17095986008644104, 0.19449244439601898, 0.21802502870559692, 0.24155759811401367, 0.2650901675224304, 0.28862276673316956, 0.3121553361415863, 0.33568793535232544, 0.3592205047607422, 0.38275307416915894, 0.40628567337989807, 0.4298182427883148, 0.45335084199905396, 0.4768834114074707, 0.5004159808158875, 0.5239485502243042, 0.5474811792373657, 0.5710137486457825, 0.5945463180541992, 0.6180789470672607, 0.6416115164756775, 0.6651440858840942, 0.688676655292511, 0.7122092247009277, 0.7357417941093445]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 2.0, 7.0, 7.0, 9.0, 10.0, 13.0, 21.0, 39.0, 40.0, 73.0, 102.0, 135.0, 211.0, 345.0, 525.0, 800.0, 1292.0, 2252.0, 3907.0, 7417.0, 14680.0, 33012.0, 87782.0, 268560.0, 1118390.0, 1971024.0, 459177.0, 134966.0, 48014.0, 20266.0, 9465.0, 4950.0, 2651.0, 1570.0, 934.0, 596.0, 354.0, 210.0, 171.0, 97.0, 55.0, 53.0, 30.0, 25.0, 12.0, 7.0, 7.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.041015625, -1.0086822509765625, -0.976348876953125, -0.9440155029296875, -0.91168212890625, -0.8793487548828125, -0.847015380859375, -0.8146820068359375, -0.7823486328125, -0.7500152587890625, -0.717681884765625, -0.6853485107421875, -0.65301513671875, -0.6206817626953125, -0.588348388671875, -0.5560150146484375, -0.523681640625, -0.4913482666015625, -0.459014892578125, -0.4266815185546875, -0.39434814453125, -0.3620147705078125, -0.329681396484375, -0.2973480224609375, -0.2650146484375, -0.2326812744140625, -0.200347900390625, -0.1680145263671875, -0.13568115234375, -0.1033477783203125, -0.071014404296875, -0.0386810302734375, -0.00634765625, 0.0259857177734375, 0.058319091796875, 0.0906524658203125, 0.12298583984375, 0.1553192138671875, 0.187652587890625, 0.2199859619140625, 0.2523193359375, 0.2846527099609375, 0.316986083984375, 0.3493194580078125, 0.38165283203125, 0.4139862060546875, 0.446319580078125, 0.4786529541015625, 0.510986328125, 0.5433197021484375, 0.575653076171875, 0.6079864501953125, 0.64031982421875, 0.6726531982421875, 0.704986572265625, 0.7373199462890625, 0.7696533203125, 0.8019866943359375, 0.834320068359375, 0.8666534423828125, 0.89898681640625, 0.9313201904296875, 0.963653564453125, 0.9959869384765625, 1.0283203125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 5.0, 3.0, 5.0, 3.0, 7.0, 13.0, 16.0, 18.0, 18.0, 21.0, 19.0, 16.0, 24.0, 22.0, 27.0, 34.0, 37.0, 32.0, 35.0, 43.0, 43.0, 40.0, 40.0, 28.0, 32.0, 37.0, 46.0, 34.0, 34.0, 35.0, 27.0, 26.0, 18.0, 24.0, 27.0, 19.0, 15.0, 13.0, 11.0, 13.0, 3.0, 5.0, 6.0, 11.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0], "bins": [-1.0927734375, -1.0614395141601562, -1.0301055908203125, -0.9987716674804688, -0.967437744140625, -0.9361038208007812, -0.9047698974609375, -0.8734359741210938, -0.84210205078125, -0.8107681274414062, -0.7794342041015625, -0.7481002807617188, -0.716766357421875, -0.6854324340820312, -0.6540985107421875, -0.6227645874023438, -0.5914306640625, -0.5600967407226562, -0.5287628173828125, -0.49742889404296875, -0.466094970703125, -0.43476104736328125, -0.4034271240234375, -0.37209320068359375, -0.34075927734375, -0.30942535400390625, -0.2780914306640625, -0.24675750732421875, -0.215423583984375, -0.18408966064453125, -0.1527557373046875, -0.12142181396484375, -0.090087890625, -0.05875396728515625, -0.0274200439453125, 0.00391387939453125, 0.035247802734375, 0.06658172607421875, 0.0979156494140625, 0.12924957275390625, 0.16058349609375, 0.19191741943359375, 0.2232513427734375, 0.25458526611328125, 0.285919189453125, 0.31725311279296875, 0.3485870361328125, 0.37992095947265625, 0.4112548828125, 0.44258880615234375, 0.4739227294921875, 0.5052566528320312, 0.536590576171875, 0.5679244995117188, 0.5992584228515625, 0.6305923461914062, 0.66192626953125, 0.6932601928710938, 0.7245941162109375, 0.7559280395507812, 0.787261962890625, 0.8185958862304688, 0.8499298095703125, 0.8812637329101562, 0.91259765625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 9.0, 18.0, 15.0, 26.0, 45.0, 74.0, 119.0, 224.0, 804.0, 4077684.0, 114119.0, 671.0, 168.0, 88.0, 61.0, 47.0, 26.0, 27.0, 14.0, 17.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4765625, -14.8551025390625, -14.233642578125, -13.6121826171875, -12.99072265625, -12.3692626953125, -11.747802734375, -11.1263427734375, -10.5048828125, -9.8834228515625, -9.261962890625, -8.6405029296875, -8.01904296875, -7.3975830078125, -6.776123046875, -6.1546630859375, -5.533203125, -4.9117431640625, -4.290283203125, -3.6688232421875, -3.04736328125, -2.4259033203125, -1.804443359375, -1.1829833984375, -0.5615234375, 0.0599365234375, 0.681396484375, 1.3028564453125, 1.92431640625, 2.5457763671875, 3.167236328125, 3.7886962890625, 4.41015625, 5.0316162109375, 5.653076171875, 6.2745361328125, 6.89599609375, 7.5174560546875, 8.138916015625, 8.7603759765625, 9.3818359375, 10.0032958984375, 10.624755859375, 11.2462158203125, 11.86767578125, 12.4891357421875, 13.110595703125, 13.7320556640625, 14.353515625, 14.9749755859375, 15.596435546875, 16.2178955078125, 16.83935546875, 17.4608154296875, 18.082275390625, 18.7037353515625, 19.3251953125, 19.9466552734375, 20.568115234375, 21.1895751953125, 21.81103515625, 22.4324951171875, 23.053955078125, 23.6754150390625, 24.296875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 9.0, 5.0, 7.0, 17.0, 25.0, 29.0, 45.0, 73.0, 117.0, 211.0, 546.0, 1543.0, 806.0, 259.0, 126.0, 83.0, 55.0, 33.0, 34.0, 23.0, 12.0, 6.0, 10.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.63427734375, -0.61212158203125, -0.5899658203125, -0.56781005859375, -0.545654296875, -0.52349853515625, -0.5013427734375, -0.47918701171875, -0.45703125, -0.43487548828125, -0.4127197265625, -0.39056396484375, -0.368408203125, -0.34625244140625, -0.3240966796875, -0.30194091796875, -0.27978515625, -0.25762939453125, -0.2354736328125, -0.21331787109375, -0.191162109375, -0.16900634765625, -0.1468505859375, -0.12469482421875, -0.1025390625, -0.08038330078125, -0.0582275390625, -0.03607177734375, -0.013916015625, 0.00823974609375, 0.0303955078125, 0.05255126953125, 0.07470703125, 0.09686279296875, 0.1190185546875, 0.14117431640625, 0.163330078125, 0.18548583984375, 0.2076416015625, 0.22979736328125, 0.251953125, 0.27410888671875, 0.2962646484375, 0.31842041015625, 0.340576171875, 0.36273193359375, 0.3848876953125, 0.40704345703125, 0.42919921875, 0.45135498046875, 0.4735107421875, 0.49566650390625, 0.517822265625, 0.53997802734375, 0.5621337890625, 0.58428955078125, 0.6064453125, 0.62860107421875, 0.6507568359375, 0.67291259765625, 0.695068359375, 0.71722412109375, 0.7393798828125, 0.76153564453125, 0.78369140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 10.0, 13.0, 8.0, 33.0, 40.0, 49.0, 62.0, 84.0, 94.0, 108.0, 91.0, 87.0, 79.0, 57.0, 60.0, 41.0, 35.0, 19.0, 8.0, 8.0, 10.0, 3.0, 5.0, 4.0], "bins": [-3.4270503520965576, -3.358222484588623, -3.2893948554992676, -3.220566987991333, -3.1517391204833984, -3.082911491394043, -3.0140836238861084, -2.945255994796753, -2.8764281272888184, -2.807600259780884, -2.7387726306915283, -2.6699447631835938, -2.6011171340942383, -2.5322892665863037, -2.463461399078369, -2.3946337699890137, -2.325805902481079, -2.2569780349731445, -2.188150405883789, -2.1193225383758545, -2.05049467086792, -1.9816670417785645, -1.9128391742706299, -1.8440114259719849, -1.7751836776733398, -1.7063559293746948, -1.6375281810760498, -1.5687003135681152, -1.4998725652694702, -1.4310448169708252, -1.3622169494628906, -1.2933892011642456, -1.2245616912841797, -1.1557339429855347, -1.0869061946868896, -1.018078327178955, -0.9492505788803101, -0.880422830581665, -0.8115950226783752, -0.7427672147750854, -0.6739394664764404, -0.6051117181777954, -0.5362839102745056, -0.4674561321735382, -0.3986283540725708, -0.3298005759716034, -0.260972797870636, -0.19214501976966858, -0.12331724166870117, -0.054489463567733765, 0.014338314533233643, 0.08316609263420105, 0.15199387073516846, 0.22082164883613586, 0.28964942693710327, 0.3584772050380707, 0.4273049831390381, 0.4961327612400055, 0.5649605393409729, 0.6337883472442627, 0.7026160955429077, 0.7714438438415527, 0.8402716517448425, 0.9090994596481323, 0.9779272079467773]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 13.0, 8.0, 9.0, 13.0, 10.0, 14.0, 18.0, 21.0, 26.0, 33.0, 22.0, 20.0, 34.0, 30.0, 32.0, 27.0, 34.0, 37.0, 45.0, 38.0, 44.0, 43.0, 35.0, 30.0, 31.0, 29.0, 30.0, 27.0, 22.0, 35.0, 26.0, 29.0, 17.0, 12.0, 19.0, 8.0, 8.0, 11.0, 15.0, 11.0, 11.0, 3.0, 3.0, 0.0, 2.0, 6.0, 1.0, 1.0, 2.0], "bins": [-1.1258944272994995, -1.0940678119659424, -1.0622411966323853, -1.0304145812988281, -0.998587965965271, -0.9667613506317139, -0.934934675693512, -0.9031080603599548, -0.8712814450263977, -0.8394548296928406, -0.8076282143592834, -0.7758015990257263, -0.7439749240875244, -0.7121483087539673, -0.6803216934204102, -0.648495078086853, -0.6166684627532959, -0.5848418474197388, -0.5530152320861816, -0.5211886167526245, -0.489361971616745, -0.45753535628318787, -0.42570871114730835, -0.3938820958137512, -0.3620554804801941, -0.33022886514663696, -0.29840224981307983, -0.2665756046772003, -0.2347489893436432, -0.20292237401008606, -0.17109574377536774, -0.13926911354064941, -0.10744249820709229, -0.07561587542295456, -0.043789252638816833, -0.011962629854679108, 0.019863992929458618, 0.05169060826301575, 0.08351723849773407, 0.11534386873245239, 0.14717048406600952, 0.17899709939956665, 0.21082372963428497, 0.2426503598690033, 0.2744769752025604, 0.30630359053611755, 0.33813023567199707, 0.3699568510055542, 0.40178346633911133, 0.43361008167266846, 0.4654366970062256, 0.4972633421421051, 0.5290899276733398, 0.560916543006897, 0.5927432179450989, 0.624569833278656, 0.6563964486122131, 0.6882230639457703, 0.7200496792793274, 0.7518762946128845, 0.7837029695510864, 0.8155295848846436, 0.8473562002182007, 0.8791828155517578, 0.9110094308853149]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 10.0, 9.0, 22.0, 26.0, 41.0, 70.0, 102.0, 179.0, 261.0, 421.0, 611.0, 1038.0, 1810.0, 2790.0, 4619.0, 7722.0, 13357.0, 23442.0, 41633.0, 76159.0, 136183.0, 206498.0, 209763.0, 140955.0, 78961.0, 43352.0, 24095.0, 13887.0, 8028.0, 4750.0, 2955.0, 1780.0, 1141.0, 735.0, 426.0, 249.0, 178.0, 121.0, 65.0, 37.0, 32.0, 16.0, 15.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33447265625, -0.3229522705078125, -0.311431884765625, -0.2999114990234375, -0.28839111328125, -0.2768707275390625, -0.265350341796875, -0.2538299560546875, -0.2423095703125, -0.2307891845703125, -0.219268798828125, -0.2077484130859375, -0.19622802734375, -0.1847076416015625, -0.173187255859375, -0.1616668701171875, -0.150146484375, -0.1386260986328125, -0.127105712890625, -0.1155853271484375, -0.10406494140625, -0.0925445556640625, -0.081024169921875, -0.0695037841796875, -0.0579833984375, -0.0464630126953125, -0.034942626953125, -0.0234222412109375, -0.01190185546875, -0.0003814697265625, 0.011138916015625, 0.0226593017578125, 0.0341796875, 0.0457000732421875, 0.057220458984375, 0.0687408447265625, 0.08026123046875, 0.0917816162109375, 0.103302001953125, 0.1148223876953125, 0.1263427734375, 0.1378631591796875, 0.149383544921875, 0.1609039306640625, 0.17242431640625, 0.1839447021484375, 0.195465087890625, 0.2069854736328125, 0.218505859375, 0.2300262451171875, 0.241546630859375, 0.2530670166015625, 0.26458740234375, 0.2761077880859375, 0.287628173828125, 0.2991485595703125, 0.3106689453125, 0.3221893310546875, 0.333709716796875, 0.3452301025390625, 0.35675048828125, 0.3682708740234375, 0.379791259765625, 0.3913116455078125, 0.40283203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 4.0, 8.0, 10.0, 10.0, 13.0, 20.0, 14.0, 27.0, 20.0, 32.0, 25.0, 25.0, 34.0, 26.0, 33.0, 26.0, 37.0, 46.0, 29.0, 42.0, 53.0, 33.0, 40.0, 44.0, 37.0, 31.0, 27.0, 24.0, 25.0, 21.0, 19.0, 25.0, 17.0, 11.0, 20.0, 14.0, 13.0, 7.0, 15.0, 4.0, 6.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 3.0, 4.0], "bins": [-0.79345703125, -0.7706298828125, -0.747802734375, -0.7249755859375, -0.7021484375, -0.6793212890625, -0.656494140625, -0.6336669921875, -0.61083984375, -0.5880126953125, -0.565185546875, -0.5423583984375, -0.51953125, -0.4967041015625, -0.473876953125, -0.4510498046875, -0.42822265625, -0.4053955078125, -0.382568359375, -0.3597412109375, -0.3369140625, -0.3140869140625, -0.291259765625, -0.2684326171875, -0.24560546875, -0.2227783203125, -0.199951171875, -0.1771240234375, -0.154296875, -0.1314697265625, -0.108642578125, -0.0858154296875, -0.06298828125, -0.0401611328125, -0.017333984375, 0.0054931640625, 0.0283203125, 0.0511474609375, 0.073974609375, 0.0968017578125, 0.11962890625, 0.1424560546875, 0.165283203125, 0.1881103515625, 0.2109375, 0.2337646484375, 0.256591796875, 0.2794189453125, 0.30224609375, 0.3250732421875, 0.347900390625, 0.3707275390625, 0.3935546875, 0.4163818359375, 0.439208984375, 0.4620361328125, 0.48486328125, 0.5076904296875, 0.530517578125, 0.5533447265625, 0.576171875, 0.5989990234375, 0.621826171875, 0.6446533203125, 0.66748046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 9.0, 5.0, 14.0, 17.0, 19.0, 35.0, 29.0, 56.0, 66.0, 88.0, 137.0, 209.0, 323.0, 568.0, 1046.0, 2199.0, 4980.0, 13798.0, 45708.0, 192412.0, 500398.0, 211482.0, 49904.0, 14667.0, 5463.0, 2297.0, 1055.0, 529.0, 343.0, 195.0, 127.0, 99.0, 64.0, 45.0, 43.0, 18.0, 21.0, 18.0, 15.0, 12.0, 14.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6259765625, -0.6067352294921875, -0.587493896484375, -0.5682525634765625, -0.54901123046875, -0.5297698974609375, -0.510528564453125, -0.4912872314453125, -0.4720458984375, -0.4528045654296875, -0.433563232421875, -0.4143218994140625, -0.39508056640625, -0.3758392333984375, -0.356597900390625, -0.3373565673828125, -0.318115234375, -0.2988739013671875, -0.279632568359375, -0.2603912353515625, -0.24114990234375, -0.2219085693359375, -0.202667236328125, -0.1834259033203125, -0.1641845703125, -0.1449432373046875, -0.125701904296875, -0.1064605712890625, -0.08721923828125, -0.0679779052734375, -0.048736572265625, -0.0294952392578125, -0.01025390625, 0.0089874267578125, 0.028228759765625, 0.0474700927734375, 0.06671142578125, 0.0859527587890625, 0.105194091796875, 0.1244354248046875, 0.1436767578125, 0.1629180908203125, 0.182159423828125, 0.2014007568359375, 0.22064208984375, 0.2398834228515625, 0.259124755859375, 0.2783660888671875, 0.297607421875, 0.3168487548828125, 0.336090087890625, 0.3553314208984375, 0.37457275390625, 0.3938140869140625, 0.413055419921875, 0.4322967529296875, 0.4515380859375, 0.4707794189453125, 0.490020751953125, 0.5092620849609375, 0.52850341796875, 0.5477447509765625, 0.566986083984375, 0.5862274169921875, 0.60546875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 8.0, 10.0, 10.0, 4.0, 11.0, 13.0, 10.0, 12.0, 18.0, 16.0, 25.0, 24.0, 31.0, 35.0, 23.0, 29.0, 27.0, 33.0, 35.0, 41.0, 41.0, 36.0, 59.0, 40.0, 33.0, 45.0, 40.0, 36.0, 31.0, 29.0, 29.0, 27.0, 26.0, 17.0, 20.0, 17.0, 8.0, 7.0, 10.0, 7.0, 7.0, 9.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.541015625, -1.4907684326171875, -1.440521240234375, -1.3902740478515625, -1.34002685546875, -1.2897796630859375, -1.239532470703125, -1.1892852783203125, -1.1390380859375, -1.0887908935546875, -1.038543701171875, -0.9882965087890625, -0.93804931640625, -0.8878021240234375, -0.837554931640625, -0.7873077392578125, -0.737060546875, -0.6868133544921875, -0.636566162109375, -0.5863189697265625, -0.53607177734375, -0.4858245849609375, -0.435577392578125, -0.3853302001953125, -0.3350830078125, -0.2848358154296875, -0.234588623046875, -0.1843414306640625, -0.13409423828125, -0.0838470458984375, -0.033599853515625, 0.0166473388671875, 0.06689453125, 0.1171417236328125, 0.167388916015625, 0.2176361083984375, 0.26788330078125, 0.3181304931640625, 0.368377685546875, 0.4186248779296875, 0.4688720703125, 0.5191192626953125, 0.569366455078125, 0.6196136474609375, 0.66986083984375, 0.7201080322265625, 0.770355224609375, 0.8206024169921875, 0.870849609375, 0.9210968017578125, 0.971343994140625, 1.0215911865234375, 1.07183837890625, 1.1220855712890625, 1.172332763671875, 1.2225799560546875, 1.2728271484375, 1.3230743408203125, 1.373321533203125, 1.4235687255859375, 1.47381591796875, 1.5240631103515625, 1.574310302734375, 1.6245574951171875, 1.6748046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 4.0, 4.0, 5.0, 11.0, 10.0, 15.0, 12.0, 25.0, 29.0, 43.0, 76.0, 105.0, 133.0, 195.0, 323.0, 459.0, 832.0, 1305.0, 2597.0, 5152.0, 11022.0, 30933.0, 146879.0, 629825.0, 162527.0, 32937.0, 11629.0, 5055.0, 2599.0, 1422.0, 836.0, 509.0, 350.0, 191.0, 151.0, 100.0, 79.0, 49.0, 35.0, 21.0, 11.0, 15.0, 14.0, 4.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.316650390625, -0.3066062927246094, -0.29656219482421875, -0.2865180969238281, -0.2764739990234375, -0.2664299011230469, -0.25638580322265625, -0.24634170532226562, -0.236297607421875, -0.22625350952148438, -0.21620941162109375, -0.20616531372070312, -0.1961212158203125, -0.18607711791992188, -0.17603302001953125, -0.16598892211914062, -0.15594482421875, -0.14590072631835938, -0.13585662841796875, -0.12581253051757812, -0.1157684326171875, -0.10572433471679688, -0.09568023681640625, -0.08563613891601562, -0.075592041015625, -0.06554794311523438, -0.05550384521484375, -0.045459747314453125, -0.0354156494140625, -0.025371551513671875, -0.01532745361328125, -0.005283355712890625, 0.0047607421875, 0.014804840087890625, 0.02484893798828125, 0.034893035888671875, 0.0449371337890625, 0.054981231689453125, 0.06502532958984375, 0.07506942749023438, 0.085113525390625, 0.09515762329101562, 0.10520172119140625, 0.11524581909179688, 0.1252899169921875, 0.13533401489257812, 0.14537811279296875, 0.15542221069335938, 0.16546630859375, 0.17551040649414062, 0.18555450439453125, 0.19559860229492188, 0.2056427001953125, 0.21568679809570312, 0.22573089599609375, 0.23577499389648438, 0.245819091796875, 0.2558631896972656, 0.26590728759765625, 0.2759513854980469, 0.2859954833984375, 0.2960395812988281, 0.30608367919921875, 0.3161277770996094, 0.326171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 10.0, 12.0, 13.0, 13.0, 33.0, 23.0, 46.0, 77.0, 90.0, 114.0, 129.0, 125.0, 86.0, 80.0, 37.0, 28.0, 21.0, 21.0, 8.0, 5.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016033649444580078, -0.00015447288751602173, -0.00014860928058624268, -0.00014274567365646362, -0.00013688206672668457, -0.00013101845979690552, -0.00012515485286712646, -0.00011929124593734741, -0.00011342763900756836, -0.0001075640320777893, -0.00010170042514801025, -9.58368182182312e-05, -8.997321128845215e-05, -8.41096043586731e-05, -7.824599742889404e-05, -7.238239049911499e-05, -6.651878356933594e-05, -6.0655176639556885e-05, -5.479156970977783e-05, -4.892796277999878e-05, -4.3064355850219727e-05, -3.7200748920440674e-05, -3.133714199066162e-05, -2.547353506088257e-05, -1.9609928131103516e-05, -1.3746321201324463e-05, -7.88271427154541e-06, -2.0191073417663574e-06, 3.844499588012695e-06, 9.708106517791748e-06, 1.55717134475708e-05, 2.1435320377349854e-05, 2.7298927307128906e-05, 3.316253423690796e-05, 3.902614116668701e-05, 4.4889748096466064e-05, 5.075335502624512e-05, 5.661696195602417e-05, 6.248056888580322e-05, 6.834417581558228e-05, 7.420778274536133e-05, 8.007138967514038e-05, 8.593499660491943e-05, 9.179860353469849e-05, 9.766221046447754e-05, 0.00010352581739425659, 0.00010938942432403564, 0.0001152530312538147, 0.00012111663818359375, 0.0001269802451133728, 0.00013284385204315186, 0.0001387074589729309, 0.00014457106590270996, 0.00015043467283248901, 0.00015629827976226807, 0.00016216188669204712, 0.00016802549362182617, 0.00017388910055160522, 0.00017975270748138428, 0.00018561631441116333, 0.00019147992134094238, 0.00019734352827072144, 0.0002032071352005005, 0.00020907074213027954, 0.0002149343490600586]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 5.0, 5.0, 5.0, 11.0, 11.0, 18.0, 17.0, 27.0, 44.0, 46.0, 84.0, 279.0, 1482.0, 14263.0, 710706.0, 311467.0, 8564.0, 1024.0, 198.0, 101.0, 38.0, 37.0, 23.0, 22.0, 15.0, 11.0, 10.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.044921875, -1.0111083984375, -0.977294921875, -0.9434814453125, -0.90966796875, -0.8758544921875, -0.842041015625, -0.8082275390625, -0.7744140625, -0.7406005859375, -0.706787109375, -0.6729736328125, -0.63916015625, -0.6053466796875, -0.571533203125, -0.5377197265625, -0.50390625, -0.4700927734375, -0.436279296875, -0.4024658203125, -0.36865234375, -0.3348388671875, -0.301025390625, -0.2672119140625, -0.2333984375, -0.1995849609375, -0.165771484375, -0.1319580078125, -0.09814453125, -0.0643310546875, -0.030517578125, 0.0032958984375, 0.037109375, 0.0709228515625, 0.104736328125, 0.1385498046875, 0.17236328125, 0.2061767578125, 0.239990234375, 0.2738037109375, 0.3076171875, 0.3414306640625, 0.375244140625, 0.4090576171875, 0.44287109375, 0.4766845703125, 0.510498046875, 0.5443115234375, 0.578125, 0.6119384765625, 0.645751953125, 0.6795654296875, 0.71337890625, 0.7471923828125, 0.781005859375, 0.8148193359375, 0.8486328125, 0.8824462890625, 0.916259765625, 0.9500732421875, 0.98388671875, 1.0177001953125, 1.051513671875, 1.0853271484375, 1.119140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 13.0, 7.0, 16.0, 11.0, 19.0, 27.0, 23.0, 35.0, 56.0, 66.0, 71.0, 75.0, 66.0, 71.0, 65.0, 60.0, 66.0, 38.0, 36.0, 37.0, 23.0, 19.0, 11.0, 9.0, 14.0, 14.0, 3.0, 1.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0780029296875, -0.07548236846923828, -0.07296180725097656, -0.07044124603271484, -0.06792068481445312, -0.0654001235961914, -0.06287956237792969, -0.06035900115966797, -0.05783843994140625, -0.05531787872314453, -0.05279731750488281, -0.050276756286621094, -0.047756195068359375, -0.045235633850097656, -0.04271507263183594, -0.04019451141357422, -0.0376739501953125, -0.03515338897705078, -0.03263282775878906, -0.030112266540527344, -0.027591705322265625, -0.025071144104003906, -0.022550582885742188, -0.02003002166748047, -0.01750946044921875, -0.014988899230957031, -0.012468338012695312, -0.009947776794433594, -0.007427215576171875, -0.004906654357910156, -0.0023860931396484375, 0.00013446807861328125, 0.002655029296875, 0.005175590515136719, 0.0076961517333984375, 0.010216712951660156, 0.012737274169921875, 0.015257835388183594, 0.017778396606445312, 0.02029895782470703, 0.02281951904296875, 0.02534008026123047, 0.027860641479492188, 0.030381202697753906, 0.032901763916015625, 0.035422325134277344, 0.03794288635253906, 0.04046344757080078, 0.0429840087890625, 0.04550457000732422, 0.04802513122558594, 0.050545692443847656, 0.053066253662109375, 0.055586814880371094, 0.05810737609863281, 0.06062793731689453, 0.06314849853515625, 0.06566905975341797, 0.06818962097167969, 0.0707101821899414, 0.07323074340820312, 0.07575130462646484, 0.07827186584472656, 0.08079242706298828, 0.08331298828125]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 10.0, 32.0, 87.0, 231.0, 280.0, 201.0, 105.0, 35.0, 20.0, 5.0, 4.0], "bins": [-7.9226555824279785, -7.78477668762207, -7.646897792816162, -7.509018898010254, -7.371140003204346, -7.2332611083984375, -7.095382213592529, -6.957503318786621, -6.819624900817871, -6.681746006011963, -6.543867111206055, -6.4059882164001465, -6.268109321594238, -6.13023042678833, -5.992351531982422, -5.854473114013672, -5.7165937423706055, -5.578714847564697, -5.440835952758789, -5.302957057952881, -5.165078163146973, -5.0271992683410645, -4.889320373535156, -4.751441955566406, -4.61356258392334, -4.475683689117432, -4.337804794311523, -4.199925899505615, -4.062047004699707, -3.924168109893799, -3.7862894535064697, -3.6484105587005615, -3.510531425476074, -3.372652530670166, -3.234773635864258, -3.0968947410583496, -2.9590158462524414, -2.821136951446533, -2.683258295059204, -2.545379400253296, -2.407500743865967, -2.2696218490600586, -2.1317429542541504, -1.9938641786575317, -1.8559852838516235, -1.7181063890457153, -1.5802276134490967, -1.4423487186431885, -1.3044697046279907, -1.1665908098220825, -1.0287120342254639, -0.8908331394195557, -0.7529542446136475, -0.6150753498077393, -0.47719651460647583, -0.3393176794052124, -0.2014387845993042, -0.06355991959571838, 0.07431894540786743, 0.21219781041145325, 0.35007667541503906, 0.48795557022094727, 0.6258344054222107, 0.7637132406234741, 0.9015921354293823]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 6.0, 6.0, 5.0, 7.0, 8.0, 14.0, 16.0, 9.0, 12.0, 21.0, 32.0, 29.0, 19.0, 30.0, 24.0, 26.0, 23.0, 47.0, 40.0, 32.0, 46.0, 50.0, 42.0, 43.0, 44.0, 34.0, 29.0, 30.0, 33.0, 33.0, 30.0, 29.0, 26.0, 20.0, 16.0, 14.0, 11.0, 17.0, 7.0, 8.0, 9.0, 9.0, 1.0, 5.0, 1.0, 3.0, 5.0, 2.0, 4.0], "bins": [-0.8810598850250244, -0.8572274446487427, -0.8333950042724609, -0.8095625638961792, -0.7857301235198975, -0.761897623538971, -0.7380651831626892, -0.7142327427864075, -0.6904003024101257, -0.666567862033844, -0.6427354216575623, -0.6189029812812805, -0.595070481300354, -0.5712380409240723, -0.5474056005477905, -0.5235731601715088, -0.49974071979522705, -0.4759082794189453, -0.4520758390426636, -0.42824336886405945, -0.4044109284877777, -0.38057848811149597, -0.35674601793289185, -0.3329135775566101, -0.30908113718032837, -0.28524869680404663, -0.2614162564277649, -0.23758378624916077, -0.21375134587287903, -0.1899189054965973, -0.16608645021915436, -0.14225399494171143, -0.11842155456542969, -0.09458910673856735, -0.07075665891170502, -0.04692421108484268, -0.023091763257980347, 0.0007406845688819885, 0.024573132395744324, 0.048405587673187256, 0.072238028049469, 0.09607047587633133, 0.11990292370319366, 0.1437353789806366, 0.16756781935691833, 0.19140025973320007, 0.215232715010643, 0.23906517028808594, 0.2628976106643677, 0.2867300510406494, 0.31056249141693115, 0.3343949615955353, 0.358227401971817, 0.38205984234809875, 0.4058923125267029, 0.4297247529029846, 0.45355719327926636, 0.4773896336555481, 0.5012220740318298, 0.5250545144081116, 0.5488870143890381, 0.5727194547653198, 0.5965518951416016, 0.6203843355178833, 0.644216775894165]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 3.0, 7.0, 8.0, 10.0, 23.0, 30.0, 42.0, 57.0, 74.0, 121.0, 180.0, 289.0, 389.0, 665.0, 967.0, 1591.0, 2807.0, 4721.0, 9295.0, 19553.0, 49026.0, 133165.0, 308850.0, 302368.0, 127270.0, 47062.0, 19321.0, 8847.0, 4726.0, 2660.0, 1588.0, 1010.0, 659.0, 408.0, 242.0, 160.0, 128.0, 72.0, 50.0, 41.0, 19.0, 18.0, 14.0, 6.0, 5.0, 10.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.366455078125, -0.3538093566894531, -0.34116363525390625, -0.3285179138183594, -0.3158721923828125, -0.3032264709472656, -0.29058074951171875, -0.2779350280761719, -0.265289306640625, -0.2526435852050781, -0.23999786376953125, -0.22735214233398438, -0.2147064208984375, -0.20206069946289062, -0.18941497802734375, -0.17676925659179688, -0.16412353515625, -0.15147781372070312, -0.13883209228515625, -0.12618637084960938, -0.1135406494140625, -0.10089492797851562, -0.08824920654296875, -0.07560348510742188, -0.062957763671875, -0.050312042236328125, -0.03766632080078125, -0.025020599365234375, -0.0123748779296875, 0.000270843505859375, 0.01291656494140625, 0.025562286376953125, 0.0382080078125, 0.050853729248046875, 0.06349945068359375, 0.07614517211914062, 0.0887908935546875, 0.10143661499023438, 0.11408233642578125, 0.12672805786132812, 0.139373779296875, 0.15201950073242188, 0.16466522216796875, 0.17731094360351562, 0.1899566650390625, 0.20260238647460938, 0.21524810791015625, 0.22789382934570312, 0.24053955078125, 0.2531852722167969, 0.26583099365234375, 0.2784767150878906, 0.2911224365234375, 0.3037681579589844, 0.31641387939453125, 0.3290596008300781, 0.341705322265625, 0.3543510437011719, 0.36699676513671875, 0.3796424865722656, 0.3922882080078125, 0.4049339294433594, 0.41757965087890625, 0.4302253723144531, 0.44287109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 7.0, 8.0, 10.0, 9.0, 6.0, 6.0, 16.0, 18.0, 22.0, 22.0, 27.0, 24.0, 33.0, 41.0, 33.0, 36.0, 53.0, 46.0, 50.0, 54.0, 48.0, 28.0, 49.0, 54.0, 28.0, 38.0, 31.0, 19.0, 23.0, 25.0, 19.0, 20.0, 17.0, 10.0, 9.0, 13.0, 11.0, 8.0, 6.0, 0.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-3.392578125, -3.297698974609375, -3.20281982421875, -3.107940673828125, -3.0130615234375, -2.918182373046875, -2.82330322265625, -2.728424072265625, -2.633544921875, -2.538665771484375, -2.44378662109375, -2.348907470703125, -2.2540283203125, -2.159149169921875, -2.06427001953125, -1.969390869140625, -1.87451171875, -1.779632568359375, -1.68475341796875, -1.589874267578125, -1.4949951171875, -1.400115966796875, -1.30523681640625, -1.210357666015625, -1.115478515625, -1.020599365234375, -0.92572021484375, -0.830841064453125, -0.7359619140625, -0.641082763671875, -0.54620361328125, -0.451324462890625, -0.3564453125, -0.261566162109375, -0.16668701171875, -0.071807861328125, 0.0230712890625, 0.117950439453125, 0.21282958984375, 0.307708740234375, 0.402587890625, 0.497467041015625, 0.59234619140625, 0.687225341796875, 0.7821044921875, 0.876983642578125, 0.97186279296875, 1.066741943359375, 1.16162109375, 1.256500244140625, 1.35137939453125, 1.446258544921875, 1.5411376953125, 1.636016845703125, 1.73089599609375, 1.825775146484375, 1.920654296875, 2.015533447265625, 2.11041259765625, 2.205291748046875, 2.3001708984375, 2.395050048828125, 2.48992919921875, 2.584808349609375, 2.6796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 7.0, 4.0, 13.0, 20.0, 24.0, 43.0, 50.0, 43.0, 68.0, 101.0, 120.0, 173.0, 296.0, 624.0, 2299.0, 132478.0, 901979.0, 8173.0, 907.0, 370.0, 228.0, 142.0, 105.0, 77.0, 50.0, 30.0, 28.0, 26.0, 16.0, 14.0, 10.0, 10.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.090972900390625, -2.02178955078125, -1.952606201171875, -1.8834228515625, -1.814239501953125, -1.74505615234375, -1.675872802734375, -1.606689453125, -1.537506103515625, -1.46832275390625, -1.399139404296875, -1.3299560546875, -1.260772705078125, -1.19158935546875, -1.122406005859375, -1.05322265625, -0.984039306640625, -0.91485595703125, -0.845672607421875, -0.7764892578125, -0.707305908203125, -0.63812255859375, -0.568939208984375, -0.499755859375, -0.430572509765625, -0.36138916015625, -0.292205810546875, -0.2230224609375, -0.153839111328125, -0.08465576171875, -0.015472412109375, 0.0537109375, 0.122894287109375, 0.19207763671875, 0.261260986328125, 0.3304443359375, 0.399627685546875, 0.46881103515625, 0.537994384765625, 0.607177734375, 0.676361083984375, 0.74554443359375, 0.814727783203125, 0.8839111328125, 0.953094482421875, 1.02227783203125, 1.091461181640625, 1.16064453125, 1.229827880859375, 1.29901123046875, 1.368194580078125, 1.4373779296875, 1.506561279296875, 1.57574462890625, 1.644927978515625, 1.714111328125, 1.783294677734375, 1.85247802734375, 1.921661376953125, 1.9908447265625, 2.060028076171875, 2.12921142578125, 2.198394775390625, 2.267578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 0.0, 3.0, 4.0, 11.0, 8.0, 14.0, 10.0, 8.0, 10.0, 18.0, 16.0, 23.0, 19.0, 18.0, 31.0, 29.0, 29.0, 31.0, 44.0, 33.0, 40.0, 49.0, 46.0, 30.0, 37.0, 40.0, 48.0, 43.0, 37.0, 34.0, 36.0, 22.0, 24.0, 23.0, 26.0, 23.0, 16.0, 18.0, 12.0, 6.0, 11.0, 4.0, 5.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.9765625, -2.882965087890625, -2.78936767578125, -2.695770263671875, -2.6021728515625, -2.508575439453125, -2.41497802734375, -2.321380615234375, -2.227783203125, -2.134185791015625, -2.04058837890625, -1.946990966796875, -1.8533935546875, -1.759796142578125, -1.66619873046875, -1.572601318359375, -1.47900390625, -1.385406494140625, -1.29180908203125, -1.198211669921875, -1.1046142578125, -1.011016845703125, -0.91741943359375, -0.823822021484375, -0.730224609375, -0.636627197265625, -0.54302978515625, -0.449432373046875, -0.3558349609375, -0.262237548828125, -0.16864013671875, -0.075042724609375, 0.0185546875, 0.112152099609375, 0.20574951171875, 0.299346923828125, 0.3929443359375, 0.486541748046875, 0.58013916015625, 0.673736572265625, 0.767333984375, 0.860931396484375, 0.95452880859375, 1.048126220703125, 1.1417236328125, 1.235321044921875, 1.32891845703125, 1.422515869140625, 1.51611328125, 1.609710693359375, 1.70330810546875, 1.796905517578125, 1.8905029296875, 1.984100341796875, 2.07769775390625, 2.171295166015625, 2.264892578125, 2.358489990234375, 2.45208740234375, 2.545684814453125, 2.6392822265625, 2.732879638671875, 2.82647705078125, 2.920074462890625, 3.013671875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 11.0, 11.0, 12.0, 22.0, 34.0, 70.0, 96.0, 195.0, 341.0, 676.0, 1388.0, 3651.0, 13208.0, 901591.0, 113979.0, 8316.0, 2623.0, 1093.0, 558.0, 272.0, 162.0, 106.0, 47.0, 32.0, 24.0, 11.0, 9.0, 6.0, 8.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4599609375, -0.44637298583984375, -0.4327850341796875, -0.41919708251953125, -0.405609130859375, -0.39202117919921875, -0.3784332275390625, -0.36484527587890625, -0.35125732421875, -0.33766937255859375, -0.3240814208984375, -0.31049346923828125, -0.296905517578125, -0.28331756591796875, -0.2697296142578125, -0.25614166259765625, -0.2425537109375, -0.22896575927734375, -0.2153778076171875, -0.20178985595703125, -0.188201904296875, -0.17461395263671875, -0.1610260009765625, -0.14743804931640625, -0.13385009765625, -0.12026214599609375, -0.1066741943359375, -0.09308624267578125, -0.079498291015625, -0.06591033935546875, -0.0523223876953125, -0.03873443603515625, -0.025146484375, -0.01155853271484375, 0.0020294189453125, 0.01561737060546875, 0.029205322265625, 0.04279327392578125, 0.0563812255859375, 0.06996917724609375, 0.08355712890625, 0.09714508056640625, 0.1107330322265625, 0.12432098388671875, 0.137908935546875, 0.15149688720703125, 0.1650848388671875, 0.17867279052734375, 0.1922607421875, 0.20584869384765625, 0.2194366455078125, 0.23302459716796875, 0.246612548828125, 0.26020050048828125, 0.2737884521484375, 0.28737640380859375, 0.30096435546875, 0.31455230712890625, 0.3281402587890625, 0.34172821044921875, 0.355316162109375, 0.36890411376953125, 0.3824920654296875, 0.39608001708984375, 0.40966796875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 13.0, 14.0, 37.0, 73.0, 229.0, 366.0, 147.0, 53.0, 29.0, 10.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.902217864990234e-05, -6.730575114488602e-05, -6.558932363986969e-05, -6.387289613485336e-05, -6.215646862983704e-05, -6.044004112482071e-05, -5.872361361980438e-05, -5.7007186114788055e-05, -5.529075860977173e-05, -5.35743311047554e-05, -5.1857903599739075e-05, -5.014147609472275e-05, -4.842504858970642e-05, -4.6708621084690094e-05, -4.499219357967377e-05, -4.327576607465744e-05, -4.155933856964111e-05, -3.9842911064624786e-05, -3.812648355960846e-05, -3.641005605459213e-05, -3.4693628549575806e-05, -3.297720104455948e-05, -3.126077353954315e-05, -2.9544346034526825e-05, -2.7827918529510498e-05, -2.611149102449417e-05, -2.4395063519477844e-05, -2.2678636014461517e-05, -2.096220850944519e-05, -1.9245781004428864e-05, -1.7529353499412537e-05, -1.581292599439621e-05, -1.4096498489379883e-05, -1.2380070984363556e-05, -1.0663643479347229e-05, -8.947215974330902e-06, -7.230788469314575e-06, -5.514360964298248e-06, -3.7979334592819214e-06, -2.0815059542655945e-06, -3.650784492492676e-07, 1.3513490557670593e-06, 3.0677765607833862e-06, 4.784204065799713e-06, 6.50063157081604e-06, 8.217059075832367e-06, 9.933486580848694e-06, 1.164991408586502e-05, 1.3366341590881348e-05, 1.5082769095897675e-05, 1.6799196600914e-05, 1.851562410593033e-05, 2.0232051610946655e-05, 2.1948479115962982e-05, 2.366490662097931e-05, 2.5381334125995636e-05, 2.7097761631011963e-05, 2.881418913602829e-05, 3.053061664104462e-05, 3.2247044146060944e-05, 3.396347165107727e-05, 3.56798991560936e-05, 3.7396326661109924e-05, 3.911275416612625e-05, 4.082918167114258e-05]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 7.0, 1.0, 11.0, 11.0, 38.0, 72.0, 151.0, 452.0, 1499.0, 7000.0, 192382.0, 835711.0, 8678.0, 1691.0, 488.0, 202.0, 71.0, 39.0, 15.0, 9.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6201171875, -0.6013565063476562, -0.5825958251953125, -0.5638351440429688, -0.545074462890625, -0.5263137817382812, -0.5075531005859375, -0.48879241943359375, -0.47003173828125, -0.45127105712890625, -0.4325103759765625, -0.41374969482421875, -0.394989013671875, -0.37622833251953125, -0.3574676513671875, -0.33870697021484375, -0.3199462890625, -0.30118560791015625, -0.2824249267578125, -0.26366424560546875, -0.244903564453125, -0.22614288330078125, -0.2073822021484375, -0.18862152099609375, -0.16986083984375, -0.15110015869140625, -0.1323394775390625, -0.11357879638671875, -0.094818115234375, -0.07605743408203125, -0.0572967529296875, -0.03853607177734375, -0.019775390625, -0.00101470947265625, 0.0177459716796875, 0.03650665283203125, 0.055267333984375, 0.07402801513671875, 0.0927886962890625, 0.11154937744140625, 0.13031005859375, 0.14907073974609375, 0.1678314208984375, 0.18659210205078125, 0.205352783203125, 0.22411346435546875, 0.2428741455078125, 0.26163482666015625, 0.2803955078125, 0.29915618896484375, 0.3179168701171875, 0.33667755126953125, 0.355438232421875, 0.37419891357421875, 0.3929595947265625, 0.41172027587890625, 0.43048095703125, 0.44924163818359375, 0.4680023193359375, 0.48676300048828125, 0.505523681640625, 0.5242843627929688, 0.5430450439453125, 0.5618057250976562, 0.58056640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 10.0, 4.0, 10.0, 24.0, 35.0, 92.0, 417.0, 247.0, 56.0, 31.0, 16.0, 11.0, 8.0, 13.0, 3.0, 7.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11944580078125, -0.11499691009521484, -0.11054801940917969, -0.10609912872314453, -0.10165023803710938, -0.09720134735107422, -0.09275245666503906, -0.0883035659790039, -0.08385467529296875, -0.0794057846069336, -0.07495689392089844, -0.07050800323486328, -0.06605911254882812, -0.06161022186279297, -0.05716133117675781, -0.052712440490722656, -0.0482635498046875, -0.043814659118652344, -0.03936576843261719, -0.03491687774658203, -0.030467987060546875, -0.02601909637451172, -0.021570205688476562, -0.017121315002441406, -0.01267242431640625, -0.008223533630371094, -0.0037746429443359375, 0.0006742477416992188, 0.005123138427734375, 0.009572029113769531, 0.014020919799804688, 0.018469810485839844, 0.022918701171875, 0.027367591857910156, 0.03181648254394531, 0.03626537322998047, 0.040714263916015625, 0.04516315460205078, 0.04961204528808594, 0.054060935974121094, 0.05850982666015625, 0.0629587173461914, 0.06740760803222656, 0.07185649871826172, 0.07630538940429688, 0.08075428009033203, 0.08520317077636719, 0.08965206146240234, 0.0941009521484375, 0.09854984283447266, 0.10299873352050781, 0.10744762420654297, 0.11189651489257812, 0.11634540557861328, 0.12079429626464844, 0.1252431869506836, 0.12969207763671875, 0.1341409683227539, 0.13858985900878906, 0.14303874969482422, 0.14748764038085938, 0.15193653106689453, 0.1563854217529297, 0.16083431243896484, 0.165283203125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 12.0, 15.0, 42.0, 63.0, 127.0, 179.0, 181.0, 140.0, 118.0, 52.0, 44.0, 19.0, 10.0, 3.0, 8.0], "bins": [-7.642716884613037, -7.5045037269592285, -7.36629056930542, -7.228076934814453, -7.0898637771606445, -6.951650619506836, -6.813437461853027, -6.675224304199219, -6.53701114654541, -6.398797988891602, -6.260584831237793, -6.122371673583984, -5.984158039093018, -5.845944881439209, -5.7077317237854, -5.569518566131592, -5.431304931640625, -5.293091773986816, -5.154878616333008, -5.016665458679199, -4.878451824188232, -4.740238666534424, -4.602025508880615, -4.463812351226807, -4.325599193572998, -4.1873860359191895, -4.049172878265381, -3.910959482192993, -3.7727463245391846, -3.634532928466797, -3.4963197708129883, -3.3581066131591797, -3.219892978668213, -3.0816798210144043, -2.9434664249420166, -2.805253267288208, -2.6670401096343994, -2.5288267135620117, -2.390613555908203, -2.2524003982543945, -2.114187240600586, -1.9759739637374878, -1.8377608060836792, -1.699547529220581, -1.5613343715667725, -1.4231210947036743, -1.2849078178405762, -1.1466946601867676, -1.0084813833236694, -0.8702681660652161, -0.7320549488067627, -0.5938416719436646, -0.4556284546852112, -0.3174152374267578, -0.17920196056365967, -0.0409887433052063, 0.09722447395324707, 0.23543770611286163, 0.3736509382724762, 0.511864185333252, 0.6500774025917053, 0.7882906198501587, 0.9265038967132568, 1.0647170543670654, 1.2029303312301636]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 11.0, 6.0, 8.0, 8.0, 16.0, 7.0, 19.0, 26.0, 22.0, 29.0, 26.0, 29.0, 29.0, 30.0, 41.0, 45.0, 34.0, 38.0, 30.0, 35.0, 44.0, 38.0, 44.0, 42.0, 38.0, 28.0, 27.0, 25.0, 27.0, 28.0, 18.0, 17.0, 20.0, 19.0, 12.0, 13.0, 16.0, 9.0, 6.0, 8.0, 8.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.250396251678467, -5.103309631347656, -4.9562225341796875, -4.809135913848877, -4.662048816680908, -4.514962196350098, -4.367875099182129, -4.220788478851318, -4.073701858520508, -3.926614999771118, -3.7795281410217285, -3.632441282272339, -3.485354423522949, -3.3382678031921387, -3.191180944442749, -3.0440940856933594, -2.8970069885253906, -2.749920129776001, -2.6028332710266113, -2.4557464122772217, -2.308659553527832, -2.1615729331970215, -2.014486074447632, -1.8673992156982422, -1.7203123569488525, -1.573225498199463, -1.4261386394500732, -1.2790518999099731, -1.1319650411605835, -0.9848781824111938, -0.837791383266449, -0.6907045841217041, -0.5436172485351562, -0.396530419588089, -0.24944359064102173, -0.10235676169395447, 0.04473006725311279, 0.19181692600250244, 0.3389037251472473, 0.4859905242919922, 0.6330773830413818, 0.7801642417907715, 0.9272510409355164, 1.0743378400802612, 1.2214246988296509, 1.3685115575790405, 1.5155982971191406, 1.6626851558685303, 1.80977201461792, 1.9568588733673096, 2.103945732116699, 2.251032590866089, 2.3981194496154785, 2.545206069946289, 2.6922929286956787, 2.8393797874450684, 2.986466646194458, 3.1335535049438477, 3.2806403636932373, 3.427727222442627, 3.5748138427734375, 3.7219009399414062, 3.868987560272217, 4.016074180603027, 4.163161277770996]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 7.0, 9.0, 17.0, 6.0, 16.0, 11.0, 17.0, 31.0, 50.0, 57.0, 78.0, 139.0, 208.0, 402.0, 825.0, 1865.0, 5047.0, 16806.0, 87382.0, 942823.0, 2769022.0, 310923.0, 41304.0, 10677.0, 3659.0, 1494.0, 622.0, 332.0, 154.0, 96.0, 52.0, 43.0, 19.0, 20.0, 14.0, 15.0, 8.0, 9.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.7470703125, -1.7002105712890625, -1.653350830078125, -1.6064910888671875, -1.55963134765625, -1.5127716064453125, -1.465911865234375, -1.4190521240234375, -1.3721923828125, -1.3253326416015625, -1.278472900390625, -1.2316131591796875, -1.18475341796875, -1.1378936767578125, -1.091033935546875, -1.0441741943359375, -0.997314453125, -0.9504547119140625, -0.903594970703125, -0.8567352294921875, -0.80987548828125, -0.7630157470703125, -0.716156005859375, -0.6692962646484375, -0.6224365234375, -0.5755767822265625, -0.528717041015625, -0.4818572998046875, -0.43499755859375, -0.3881378173828125, -0.341278076171875, -0.2944183349609375, -0.24755859375, -0.2006988525390625, -0.153839111328125, -0.1069793701171875, -0.06011962890625, -0.0132598876953125, 0.033599853515625, 0.0804595947265625, 0.1273193359375, 0.1741790771484375, 0.221038818359375, 0.2678985595703125, 0.31475830078125, 0.3616180419921875, 0.408477783203125, 0.4553375244140625, 0.502197265625, 0.5490570068359375, 0.595916748046875, 0.6427764892578125, 0.68963623046875, 0.7364959716796875, 0.783355712890625, 0.8302154541015625, 0.8770751953125, 0.9239349365234375, 0.970794677734375, 1.0176544189453125, 1.06451416015625, 1.1113739013671875, 1.158233642578125, 1.2050933837890625, 1.251953125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 6.0, 9.0, 14.0, 13.0, 19.0, 16.0, 23.0, 40.0, 28.0, 35.0, 58.0, 55.0, 57.0, 67.0, 47.0, 66.0, 68.0, 70.0, 53.0, 49.0, 44.0, 31.0, 36.0, 20.0, 22.0, 22.0, 13.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0], "bins": [-1.7646484375, -1.7251739501953125, -1.685699462890625, -1.6462249755859375, -1.60675048828125, -1.5672760009765625, -1.527801513671875, -1.4883270263671875, -1.4488525390625, -1.4093780517578125, -1.369903564453125, -1.3304290771484375, -1.29095458984375, -1.2514801025390625, -1.212005615234375, -1.1725311279296875, -1.133056640625, -1.0935821533203125, -1.054107666015625, -1.0146331787109375, -0.97515869140625, -0.9356842041015625, -0.896209716796875, -0.8567352294921875, -0.8172607421875, -0.7777862548828125, -0.738311767578125, -0.6988372802734375, -0.65936279296875, -0.6198883056640625, -0.580413818359375, -0.5409393310546875, -0.50146484375, -0.4619903564453125, -0.422515869140625, -0.3830413818359375, -0.34356689453125, -0.3040924072265625, -0.264617919921875, -0.2251434326171875, -0.1856689453125, -0.1461944580078125, -0.106719970703125, -0.0672454833984375, -0.02777099609375, 0.0117034912109375, 0.051177978515625, 0.0906524658203125, 0.130126953125, 0.1696014404296875, 0.209075927734375, 0.2485504150390625, 0.28802490234375, 0.3274993896484375, 0.366973876953125, 0.4064483642578125, 0.4459228515625, 0.4853973388671875, 0.524871826171875, 0.5643463134765625, 0.60382080078125, 0.6432952880859375, 0.682769775390625, 0.7222442626953125, 0.76171875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 18.0, 24.0, 51.0, 99.0, 351.0, 30195.0, 4162677.0, 580.0, 152.0, 62.0, 32.0, 15.0, 7.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-22.078125, -21.5782470703125, -21.078369140625, -20.5784912109375, -20.07861328125, -19.5787353515625, -19.078857421875, -18.5789794921875, -18.0791015625, -17.5792236328125, -17.079345703125, -16.5794677734375, -16.07958984375, -15.5797119140625, -15.079833984375, -14.5799560546875, -14.080078125, -13.5802001953125, -13.080322265625, -12.5804443359375, -12.08056640625, -11.5806884765625, -11.080810546875, -10.5809326171875, -10.0810546875, -9.5811767578125, -9.081298828125, -8.5814208984375, -8.08154296875, -7.5816650390625, -7.081787109375, -6.5819091796875, -6.08203125, -5.5821533203125, -5.082275390625, -4.5823974609375, -4.08251953125, -3.5826416015625, -3.082763671875, -2.5828857421875, -2.0830078125, -1.5831298828125, -1.083251953125, -0.5833740234375, -0.08349609375, 0.4163818359375, 0.916259765625, 1.4161376953125, 1.916015625, 2.4158935546875, 2.915771484375, 3.4156494140625, 3.91552734375, 4.4154052734375, 4.915283203125, 5.4151611328125, 5.9150390625, 6.4149169921875, 6.914794921875, 7.4146728515625, 7.91455078125, 8.4144287109375, 8.914306640625, 9.4141845703125, 9.9140625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 10.0, 12.0, 20.0, 42.0, 60.0, 108.0, 167.0, 333.0, 776.0, 1205.0, 668.0, 310.0, 146.0, 84.0, 44.0, 34.0, 14.0, 15.0, 10.0, 10.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.7780418395996094, -0.7596969604492188, -0.7413520812988281, -0.7230072021484375, -0.7046623229980469, -0.6863174438476562, -0.6679725646972656, -0.649627685546875, -0.6312828063964844, -0.6129379272460938, -0.5945930480957031, -0.5762481689453125, -0.5579032897949219, -0.5395584106445312, -0.5212135314941406, -0.50286865234375, -0.4845237731933594, -0.46617889404296875, -0.4478340148925781, -0.4294891357421875, -0.4111442565917969, -0.39279937744140625, -0.3744544982910156, -0.356109619140625, -0.3377647399902344, -0.31941986083984375, -0.3010749816894531, -0.2827301025390625, -0.2643852233886719, -0.24604034423828125, -0.22769546508789062, -0.2093505859375, -0.19100570678710938, -0.17266082763671875, -0.15431594848632812, -0.1359710693359375, -0.11762619018554688, -0.09928131103515625, -0.08093643188476562, -0.062591552734375, -0.044246673583984375, -0.02590179443359375, -0.007556915283203125, 0.0107879638671875, 0.029132843017578125, 0.04747772216796875, 0.06582260131835938, 0.08416748046875, 0.10251235961914062, 0.12085723876953125, 0.13920211791992188, 0.1575469970703125, 0.17589187622070312, 0.19423675537109375, 0.21258163452148438, 0.230926513671875, 0.24927139282226562, 0.26761627197265625, 0.2859611511230469, 0.3043060302734375, 0.3226509094238281, 0.34099578857421875, 0.3593406677246094, 0.377685546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 13.0, 29.0, 52.0, 104.0, 142.0, 175.0, 169.0, 125.0, 76.0, 60.0, 28.0, 12.0, 13.0, 2.0, 1.0, 2.0, 3.0], "bins": [-5.074952602386475, -4.978900909423828, -4.88284969329834, -4.786798000335693, -4.690746784210205, -4.594695091247559, -4.49864387512207, -4.402592182159424, -4.3065409660339355, -4.210489273071289, -4.114438056945801, -4.018386363983154, -3.922335147857666, -3.8262836933135986, -3.7302322387695312, -3.634180784225464, -3.5381293296813965, -3.442077875137329, -3.3460264205932617, -3.2499749660491943, -3.153923511505127, -3.0578720569610596, -2.961820602416992, -2.865769147872925, -2.7697174549102783, -2.673666000366211, -2.5776145458221436, -2.481563091278076, -2.385511636734009, -2.2894601821899414, -2.193408727645874, -2.0973572731018066, -2.0013058185577393, -1.9052543640136719, -1.8092029094696045, -1.713151454925537, -1.6171000003814697, -1.5210485458374023, -1.424997091293335, -1.3289456367492676, -1.2328941822052002, -1.1368427276611328, -1.0407912731170654, -0.944739818572998, -0.8486883640289307, -0.7526369094848633, -0.6565853953361511, -0.5605339407920837, -0.4644824266433716, -0.3684309720993042, -0.2723795175552368, -0.17632803320884705, -0.08027657866477966, 0.01577487587928772, 0.11182636022567749, 0.20787781476974487, 0.30392926931381226, 0.39998072385787964, 0.496032178401947, 0.5920836925506592, 0.6881351470947266, 0.784186601638794, 0.8802380561828613, 0.9762895107269287, 1.072340965270996]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 7.0, 5.0, 8.0, 10.0, 11.0, 20.0, 22.0, 23.0, 12.0, 24.0, 29.0, 23.0, 23.0, 38.0, 42.0, 48.0, 38.0, 43.0, 49.0, 43.0, 36.0, 52.0, 44.0, 34.0, 40.0, 40.0, 24.0, 32.0, 27.0, 19.0, 26.0, 17.0, 15.0, 14.0, 16.0, 2.0, 13.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 5.0, 1.0, 2.0], "bins": [-1.1443462371826172, -1.114729881286621, -1.085113525390625, -1.055497169494629, -1.0258808135986328, -0.9962645173072815, -0.9666481614112854, -0.9370318055152893, -0.907415509223938, -0.8777991533279419, -0.8481827974319458, -0.8185664415359497, -0.7889501452445984, -0.7593337893486023, -0.7297174334526062, -0.7001010775566101, -0.670484721660614, -0.6408683657646179, -0.6112520098686218, -0.5816357135772705, -0.5520193576812744, -0.5224030017852783, -0.4927866458892822, -0.46317028999328613, -0.4335539638996124, -0.40393760800361633, -0.3743212819099426, -0.34470492601394653, -0.31508857011795044, -0.28547224402427673, -0.25585588812828064, -0.22623954713344574, -0.19662314653396606, -0.16700680553913116, -0.13739046454429626, -0.10777410864830017, -0.07815776765346527, -0.04854142665863037, -0.018925070762634277, 0.010691270232200623, 0.04030761122703552, 0.06992395222187042, 0.09954030066728592, 0.12915664911270142, 0.15877299010753632, 0.18838933110237122, 0.2180056869983673, 0.2476220279932022, 0.2772383689880371, 0.3068547248840332, 0.3364710509777069, 0.366087406873703, 0.3957037329673767, 0.4253200888633728, 0.4549364447593689, 0.484552800655365, 0.5141690969467163, 0.5437854528427124, 0.5734018087387085, 0.6030181646347046, 0.6326344609260559, 0.662250816822052, 0.6918671727180481, 0.7214835286140442, 0.7510998845100403]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 8.0, 4.0, 10.0, 13.0, 26.0, 25.0, 37.0, 57.0, 73.0, 114.0, 170.0, 279.0, 420.0, 740.0, 1153.0, 2010.0, 3483.0, 6285.0, 12318.0, 25275.0, 57788.0, 134685.0, 289723.0, 279631.0, 128685.0, 54916.0, 24302.0, 11763.0, 6183.0, 3369.0, 1909.0, 1164.0, 683.0, 472.0, 261.0, 155.0, 123.0, 88.0, 37.0, 41.0, 24.0, 18.0, 9.0, 10.0, 4.0, 8.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.39306640625, -0.3811454772949219, -0.36922454833984375, -0.3573036193847656, -0.3453826904296875, -0.3334617614746094, -0.32154083251953125, -0.3096199035644531, -0.297698974609375, -0.2857780456542969, -0.27385711669921875, -0.2619361877441406, -0.2500152587890625, -0.23809432983398438, -0.22617340087890625, -0.21425247192382812, -0.20233154296875, -0.19041061401367188, -0.17848968505859375, -0.16656875610351562, -0.1546478271484375, -0.14272689819335938, -0.13080596923828125, -0.11888504028320312, -0.106964111328125, -0.09504318237304688, -0.08312225341796875, -0.07120132446289062, -0.0592803955078125, -0.047359466552734375, -0.03543853759765625, -0.023517608642578125, -0.0115966796875, 0.000324249267578125, 0.01224517822265625, 0.024166107177734375, 0.0360870361328125, 0.048007965087890625, 0.05992889404296875, 0.07184982299804688, 0.083770751953125, 0.09569168090820312, 0.10761260986328125, 0.11953353881835938, 0.1314544677734375, 0.14337539672851562, 0.15529632568359375, 0.16721725463867188, 0.17913818359375, 0.19105911254882812, 0.20298004150390625, 0.21490097045898438, 0.2268218994140625, 0.23874282836914062, 0.25066375732421875, 0.2625846862792969, 0.274505615234375, 0.2864265441894531, 0.29834747314453125, 0.3102684020996094, 0.3221893310546875, 0.3341102600097656, 0.34603118896484375, 0.3579521179199219, 0.369873046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 8.0, 5.0, 10.0, 11.0, 17.0, 25.0, 21.0, 24.0, 31.0, 35.0, 44.0, 55.0, 69.0, 42.0, 67.0, 56.0, 60.0, 58.0, 55.0, 57.0, 36.0, 41.0, 42.0, 26.0, 24.0, 12.0, 15.0, 17.0, 14.0, 10.0, 7.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.98046875, -0.9536285400390625, -0.926788330078125, -0.8999481201171875, -0.87310791015625, -0.8462677001953125, -0.819427490234375, -0.7925872802734375, -0.7657470703125, -0.7389068603515625, -0.712066650390625, -0.6852264404296875, -0.65838623046875, -0.6315460205078125, -0.604705810546875, -0.5778656005859375, -0.551025390625, -0.5241851806640625, -0.497344970703125, -0.4705047607421875, -0.44366455078125, -0.4168243408203125, -0.389984130859375, -0.3631439208984375, -0.3363037109375, -0.3094635009765625, -0.282623291015625, -0.2557830810546875, -0.22894287109375, -0.2021026611328125, -0.175262451171875, -0.1484222412109375, -0.12158203125, -0.0947418212890625, -0.067901611328125, -0.0410614013671875, -0.01422119140625, 0.0126190185546875, 0.039459228515625, 0.0662994384765625, 0.0931396484375, 0.1199798583984375, 0.146820068359375, 0.1736602783203125, 0.20050048828125, 0.2273406982421875, 0.254180908203125, 0.2810211181640625, 0.307861328125, 0.3347015380859375, 0.361541748046875, 0.3883819580078125, 0.41522216796875, 0.4420623779296875, 0.468902587890625, 0.4957427978515625, 0.5225830078125, 0.5494232177734375, 0.576263427734375, 0.6031036376953125, 0.62994384765625, 0.6567840576171875, 0.683624267578125, 0.7104644775390625, 0.7373046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 2.0, 6.0, 11.0, 9.0, 14.0, 18.0, 30.0, 37.0, 61.0, 106.0, 150.0, 241.0, 407.0, 804.0, 1453.0, 3321.0, 8776.0, 29069.0, 128549.0, 538258.0, 260959.0, 52599.0, 14277.0, 4887.0, 2093.0, 1016.0, 534.0, 291.0, 163.0, 131.0, 85.0, 50.0, 37.0, 28.0, 20.0, 13.0, 12.0, 10.0, 6.0, 6.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.58935546875, -0.5728530883789062, -0.5563507080078125, -0.5398483276367188, -0.523345947265625, -0.5068435668945312, -0.4903411865234375, -0.47383880615234375, -0.45733642578125, -0.44083404541015625, -0.4243316650390625, -0.40782928466796875, -0.391326904296875, -0.37482452392578125, -0.3583221435546875, -0.34181976318359375, -0.3253173828125, -0.30881500244140625, -0.2923126220703125, -0.27581024169921875, -0.259307861328125, -0.24280548095703125, -0.2263031005859375, -0.20980072021484375, -0.19329833984375, -0.17679595947265625, -0.1602935791015625, -0.14379119873046875, -0.127288818359375, -0.11078643798828125, -0.0942840576171875, -0.07778167724609375, -0.061279296875, -0.04477691650390625, -0.0282745361328125, -0.01177215576171875, 0.004730224609375, 0.02123260498046875, 0.0377349853515625, 0.05423736572265625, 0.07073974609375, 0.08724212646484375, 0.1037445068359375, 0.12024688720703125, 0.136749267578125, 0.15325164794921875, 0.1697540283203125, 0.18625640869140625, 0.2027587890625, 0.21926116943359375, 0.2357635498046875, 0.25226593017578125, 0.268768310546875, 0.28527069091796875, 0.3017730712890625, 0.31827545166015625, 0.33477783203125, 0.35128021240234375, 0.3677825927734375, 0.38428497314453125, 0.400787353515625, 0.41728973388671875, 0.4337921142578125, 0.45029449462890625, 0.466796875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 3.0, 4.0, 8.0, 8.0, 4.0, 7.0, 10.0, 14.0, 20.0, 13.0, 18.0, 28.0, 25.0, 29.0, 27.0, 34.0, 37.0, 43.0, 35.0, 40.0, 56.0, 39.0, 46.0, 37.0, 42.0, 41.0, 53.0, 38.0, 39.0, 22.0, 27.0, 18.0, 35.0, 15.0, 13.0, 12.0, 11.0, 15.0, 11.0, 8.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.22845458984375, -1.1883544921875, -1.14825439453125, -1.108154296875, -1.06805419921875, -1.0279541015625, -0.98785400390625, -0.94775390625, -0.90765380859375, -0.8675537109375, -0.82745361328125, -0.787353515625, -0.74725341796875, -0.7071533203125, -0.66705322265625, -0.626953125, -0.58685302734375, -0.5467529296875, -0.50665283203125, -0.466552734375, -0.42645263671875, -0.3863525390625, -0.34625244140625, -0.30615234375, -0.26605224609375, -0.2259521484375, -0.18585205078125, -0.145751953125, -0.10565185546875, -0.0655517578125, -0.02545166015625, 0.0146484375, 0.05474853515625, 0.0948486328125, 0.13494873046875, 0.175048828125, 0.21514892578125, 0.2552490234375, 0.29534912109375, 0.33544921875, 0.37554931640625, 0.4156494140625, 0.45574951171875, 0.495849609375, 0.53594970703125, 0.5760498046875, 0.61614990234375, 0.65625, 0.69635009765625, 0.7364501953125, 0.77655029296875, 0.816650390625, 0.85675048828125, 0.8968505859375, 0.93695068359375, 0.97705078125, 1.01715087890625, 1.0572509765625, 1.09735107421875, 1.137451171875, 1.17755126953125, 1.2176513671875, 1.25775146484375, 1.2978515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 9.0, 8.0, 21.0, 19.0, 27.0, 53.0, 94.0, 144.0, 178.0, 340.0, 663.0, 1259.0, 2640.0, 6205.0, 17814.0, 71658.0, 472490.0, 387102.0, 61170.0, 15836.0, 5684.0, 2475.0, 1131.0, 612.0, 342.0, 209.0, 129.0, 73.0, 58.0, 29.0, 16.0, 16.0, 14.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228271484375, -0.22064971923828125, -0.2130279541015625, -0.20540618896484375, -0.197784423828125, -0.19016265869140625, -0.1825408935546875, -0.17491912841796875, -0.16729736328125, -0.15967559814453125, -0.1520538330078125, -0.14443206787109375, -0.136810302734375, -0.12918853759765625, -0.1215667724609375, -0.11394500732421875, -0.1063232421875, -0.09870147705078125, -0.0910797119140625, -0.08345794677734375, -0.075836181640625, -0.06821441650390625, -0.0605926513671875, -0.05297088623046875, -0.04534912109375, -0.03772735595703125, -0.0301055908203125, -0.02248382568359375, -0.014862060546875, -0.00724029541015625, 0.0003814697265625, 0.00800323486328125, 0.015625, 0.02324676513671875, 0.0308685302734375, 0.03849029541015625, 0.046112060546875, 0.05373382568359375, 0.0613555908203125, 0.06897735595703125, 0.07659912109375, 0.08422088623046875, 0.0918426513671875, 0.09946441650390625, 0.107086181640625, 0.11470794677734375, 0.1223297119140625, 0.12995147705078125, 0.1375732421875, 0.14519500732421875, 0.1528167724609375, 0.16043853759765625, 0.168060302734375, 0.17568206787109375, 0.1833038330078125, 0.19092559814453125, 0.19854736328125, 0.20616912841796875, 0.2137908935546875, 0.22141265869140625, 0.229034423828125, 0.23665618896484375, 0.2442779541015625, 0.25189971923828125, 0.259521484375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 15.0, 16.0, 27.0, 23.0, 40.0, 89.0, 91.0, 138.0, 151.0, 134.0, 84.0, 65.0, 37.0, 26.0, 12.0, 14.0, 4.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012540817260742188, -0.00011981092393398285, -0.00011421367526054382, -0.0001086164265871048, -0.00010301917791366577, -9.742192924022675e-05, -9.182468056678772e-05, -8.62274318933487e-05, -8.063018321990967e-05, -7.503293454647064e-05, -6.943568587303162e-05, -6.383843719959259e-05, -5.8241188526153564e-05, -5.264393985271454e-05, -4.704669117927551e-05, -4.144944250583649e-05, -3.585219383239746e-05, -3.0254945158958435e-05, -2.465769648551941e-05, -1.9060447812080383e-05, -1.3463199138641357e-05, -7.865950465202332e-06, -2.2687017917633057e-06, 3.3285468816757202e-06, 8.925795555114746e-06, 1.4523044228553772e-05, 2.0120292901992798e-05, 2.5717541575431824e-05, 3.131479024887085e-05, 3.6912038922309875e-05, 4.25092875957489e-05, 4.810653626918793e-05, 5.370378494262695e-05, 5.930103361606598e-05, 6.4898282289505e-05, 7.049553096294403e-05, 7.609277963638306e-05, 8.169002830982208e-05, 8.728727698326111e-05, 9.288452565670013e-05, 9.848177433013916e-05, 0.00010407902300357819, 0.00010967627167701721, 0.00011527352035045624, 0.00012087076902389526, 0.0001264680176973343, 0.00013206526637077332, 0.00013766251504421234, 0.00014325976371765137, 0.0001488570123910904, 0.00015445426106452942, 0.00016005150973796844, 0.00016564875841140747, 0.0001712460070848465, 0.00017684325575828552, 0.00018244050443172455, 0.00018803775310516357, 0.0001936350017786026, 0.00019923225045204163, 0.00020482949912548065, 0.00021042674779891968, 0.0002160239964723587, 0.00022162124514579773, 0.00022721849381923676, 0.00023281574249267578]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 8.0, 9.0, 8.0, 14.0, 13.0, 16.0, 23.0, 38.0, 65.0, 138.0, 699.0, 11394.0, 912918.0, 120210.0, 2470.0, 282.0, 97.0, 35.0, 35.0, 21.0, 16.0, 9.0, 9.0, 9.0, 5.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76123046875, -0.7338027954101562, -0.7063751220703125, -0.6789474487304688, -0.651519775390625, -0.6240921020507812, -0.5966644287109375, -0.5692367553710938, -0.54180908203125, -0.5143814086914062, -0.4869537353515625, -0.45952606201171875, -0.432098388671875, -0.40467071533203125, -0.3772430419921875, -0.34981536865234375, -0.3223876953125, -0.29496002197265625, -0.2675323486328125, -0.24010467529296875, -0.212677001953125, -0.18524932861328125, -0.1578216552734375, -0.13039398193359375, -0.10296630859375, -0.07553863525390625, -0.0481109619140625, -0.02068328857421875, 0.006744384765625, 0.03417205810546875, 0.0615997314453125, 0.08902740478515625, 0.116455078125, 0.14388275146484375, 0.1713104248046875, 0.19873809814453125, 0.226165771484375, 0.25359344482421875, 0.2810211181640625, 0.30844879150390625, 0.33587646484375, 0.36330413818359375, 0.3907318115234375, 0.41815948486328125, 0.445587158203125, 0.47301483154296875, 0.5004425048828125, 0.5278701782226562, 0.5552978515625, 0.5827255249023438, 0.6101531982421875, 0.6375808715820312, 0.665008544921875, 0.6924362182617188, 0.7198638916015625, 0.7472915649414062, 0.77471923828125, 0.8021469116210938, 0.8295745849609375, 0.8570022583007812, 0.884429931640625, 0.9118576049804688, 0.9392852783203125, 0.9667129516601562, 0.994140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 7.0, 8.0, 4.0, 11.0, 13.0, 18.0, 33.0, 43.0, 55.0, 69.0, 98.0, 87.0, 114.0, 104.0, 71.0, 70.0, 43.0, 34.0, 33.0, 24.0, 10.0, 14.0, 6.0, 8.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.077880859375, -0.07568073272705078, -0.07348060607910156, -0.07128047943115234, -0.06908035278320312, -0.0668802261352539, -0.06468009948730469, -0.06247997283935547, -0.06027984619140625, -0.05807971954345703, -0.05587959289550781, -0.053679466247558594, -0.051479339599609375, -0.049279212951660156, -0.04707908630371094, -0.04487895965576172, -0.0426788330078125, -0.04047870635986328, -0.03827857971191406, -0.036078453063964844, -0.033878326416015625, -0.031678199768066406, -0.029478073120117188, -0.02727794647216797, -0.02507781982421875, -0.02287769317626953, -0.020677566528320312, -0.018477439880371094, -0.016277313232421875, -0.014077186584472656, -0.011877059936523438, -0.009676933288574219, -0.007476806640625, -0.005276679992675781, -0.0030765533447265625, -0.0008764266967773438, 0.001323699951171875, 0.0035238265991210938, 0.0057239532470703125, 0.007924079895019531, 0.01012420654296875, 0.012324333190917969, 0.014524459838867188, 0.016724586486816406, 0.018924713134765625, 0.021124839782714844, 0.023324966430664062, 0.02552509307861328, 0.0277252197265625, 0.02992534637451172, 0.03212547302246094, 0.034325599670410156, 0.036525726318359375, 0.038725852966308594, 0.04092597961425781, 0.04312610626220703, 0.04532623291015625, 0.04752635955810547, 0.04972648620605469, 0.051926612854003906, 0.054126739501953125, 0.056326866149902344, 0.05852699279785156, 0.06072711944580078, 0.06292724609375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 13.0, 18.0, 57.0, 123.0, 211.0, 251.0, 158.0, 101.0, 39.0, 17.0, 11.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4172747135162354, -3.336487293243408, -3.25570011138916, -3.174912691116333, -3.094125270843506, -3.013338088989258, -2.9325506687164307, -2.8517632484436035, -2.7709760665893555, -2.6901886463165283, -2.6094014644622803, -2.528614044189453, -2.447826623916626, -2.367039203643799, -2.286252021789551, -2.2054646015167236, -2.1246771812438965, -2.0438897609710693, -1.9631024599075317, -1.8823151588439941, -1.801527738571167, -1.7207404375076294, -1.6399531364440918, -1.5591657161712646, -1.478378415107727, -1.3975911140441895, -1.3168036937713623, -1.2360163927078247, -1.155229091644287, -1.07444167137146, -0.9936543703079224, -0.91286700963974, -0.8320795297622681, -0.7512921690940857, -0.6705048084259033, -0.5897175073623657, -0.5089301466941833, -0.428142786026001, -0.347355455160141, -0.266568124294281, -0.18578076362609863, -0.10499341785907745, -0.024206072092056274, 0.056581273674964905, 0.13736861944198608, 0.21815598011016846, 0.29894331097602844, 0.3797306418418884, 0.4605180025100708, 0.5413053631782532, 0.6220927238464355, 0.7028800249099731, 0.7836673855781555, 0.8644547462463379, 0.9452420473098755, 1.026029348373413, 1.1068167686462402, 1.1876040697097778, 1.268391489982605, 1.3491787910461426, 1.4299662113189697, 1.5107535123825073, 1.591540813446045, 1.672328233718872, 1.7531155347824097]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 13.0, 9.0, 15.0, 27.0, 20.0, 22.0, 35.0, 32.0, 33.0, 36.0, 62.0, 51.0, 46.0, 73.0, 61.0, 52.0, 65.0, 54.0, 46.0, 40.0, 39.0, 32.0, 29.0, 20.0, 21.0, 14.0, 15.0, 14.0, 4.0, 4.0, 4.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8841239809989929, -0.8583108186721802, -0.8324977159500122, -0.8066845536231995, -0.7808713912963867, -0.7550582885742188, -0.729245126247406, -0.7034319639205933, -0.6776188611984253, -0.6518056988716125, -0.6259925961494446, -0.6001794338226318, -0.5743663311004639, -0.5485531687736511, -0.5227400064468384, -0.496926873922348, -0.47111374139785767, -0.4453006088733673, -0.41948747634887695, -0.3936743140220642, -0.36786118149757385, -0.3420480489730835, -0.31623488664627075, -0.2904217541217804, -0.26460862159729004, -0.23879548907279968, -0.21298234164714813, -0.18716919422149658, -0.16135606169700623, -0.13554292917251587, -0.10972978174686432, -0.08391663432121277, -0.05810344219207764, -0.03229030221700668, -0.00647716224193573, 0.019335977733135223, 0.04514911770820618, 0.07096225023269653, 0.09677539765834808, 0.12258854508399963, 0.14840167760849, 0.17421481013298035, 0.2000279575586319, 0.22584110498428345, 0.2516542375087738, 0.27746737003326416, 0.3032805323600769, 0.32909366488456726, 0.3549067974090576, 0.380719929933548, 0.40653306245803833, 0.4323462247848511, 0.45815935730934143, 0.4839724898338318, 0.5097856521606445, 0.5355987548828125, 0.5614119172096252, 0.587225079536438, 0.613038182258606, 0.6388513445854187, 0.6646645069122314, 0.6904776096343994, 0.7162907719612122, 0.7421039342880249, 0.7679170370101929]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 6.0, 4.0, 10.0, 10.0, 27.0, 35.0, 91.0, 99.0, 219.0, 454.0, 896.0, 2040.0, 5108.0, 14338.0, 50881.0, 288700.0, 556032.0, 93597.0, 22876.0, 7608.0, 2970.0, 1268.0, 575.0, 320.0, 159.0, 87.0, 61.0, 23.0, 17.0, 9.0, 10.0, 10.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.9892578125, -0.9619293212890625, -0.934600830078125, -0.9072723388671875, -0.87994384765625, -0.8526153564453125, -0.825286865234375, -0.7979583740234375, -0.7706298828125, -0.7433013916015625, -0.715972900390625, -0.6886444091796875, -0.66131591796875, -0.6339874267578125, -0.606658935546875, -0.5793304443359375, -0.552001953125, -0.5246734619140625, -0.497344970703125, -0.4700164794921875, -0.44268798828125, -0.4153594970703125, -0.388031005859375, -0.3607025146484375, -0.3333740234375, -0.3060455322265625, -0.278717041015625, -0.2513885498046875, -0.22406005859375, -0.1967315673828125, -0.169403076171875, -0.1420745849609375, -0.11474609375, -0.0874176025390625, -0.060089111328125, -0.0327606201171875, -0.00543212890625, 0.0218963623046875, 0.049224853515625, 0.0765533447265625, 0.1038818359375, 0.1312103271484375, 0.158538818359375, 0.1858673095703125, 0.21319580078125, 0.2405242919921875, 0.267852783203125, 0.2951812744140625, 0.322509765625, 0.3498382568359375, 0.377166748046875, 0.4044952392578125, 0.43182373046875, 0.4591522216796875, 0.486480712890625, 0.5138092041015625, 0.5411376953125, 0.5684661865234375, 0.595794677734375, 0.6231231689453125, 0.65045166015625, 0.6777801513671875, 0.705108642578125, 0.7324371337890625, 0.759765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 3.0, 4.0, 3.0, 4.0, 10.0, 8.0, 10.0, 17.0, 13.0, 11.0, 17.0, 31.0, 26.0, 25.0, 34.0, 52.0, 41.0, 50.0, 41.0, 39.0, 57.0, 49.0, 48.0, 38.0, 55.0, 44.0, 44.0, 33.0, 32.0, 34.0, 23.0, 29.0, 14.0, 17.0, 12.0, 7.0, 14.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4365234375, -1.385406494140625, -1.33428955078125, -1.283172607421875, -1.2320556640625, -1.180938720703125, -1.12982177734375, -1.078704833984375, -1.027587890625, -0.976470947265625, -0.92535400390625, -0.874237060546875, -0.8231201171875, -0.772003173828125, -0.72088623046875, -0.669769287109375, -0.61865234375, -0.567535400390625, -0.51641845703125, -0.465301513671875, -0.4141845703125, -0.363067626953125, -0.31195068359375, -0.260833740234375, -0.209716796875, -0.158599853515625, -0.10748291015625, -0.056365966796875, -0.0052490234375, 0.045867919921875, 0.09698486328125, 0.148101806640625, 0.19921875, 0.250335693359375, 0.30145263671875, 0.352569580078125, 0.4036865234375, 0.454803466796875, 0.50592041015625, 0.557037353515625, 0.608154296875, 0.659271240234375, 0.71038818359375, 0.761505126953125, 0.8126220703125, 0.863739013671875, 0.91485595703125, 0.965972900390625, 1.01708984375, 1.068206787109375, 1.11932373046875, 1.170440673828125, 1.2215576171875, 1.272674560546875, 1.32379150390625, 1.374908447265625, 1.426025390625, 1.477142333984375, 1.52825927734375, 1.579376220703125, 1.6304931640625, 1.681610107421875, 1.73272705078125, 1.783843994140625, 1.8349609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 10.0, 5.0, 9.0, 9.0, 9.0, 21.0, 38.0, 39.0, 63.0, 49.0, 72.0, 99.0, 312.0, 1033848.0, 13426.0, 159.0, 92.0, 63.0, 56.0, 36.0, 44.0, 28.0, 25.0, 18.0, 11.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.953125, -9.65869140625, -9.3642578125, -9.06982421875, -8.775390625, -8.48095703125, -8.1865234375, -7.89208984375, -7.59765625, -7.30322265625, -7.0087890625, -6.71435546875, -6.419921875, -6.12548828125, -5.8310546875, -5.53662109375, -5.2421875, -4.94775390625, -4.6533203125, -4.35888671875, -4.064453125, -3.77001953125, -3.4755859375, -3.18115234375, -2.88671875, -2.59228515625, -2.2978515625, -2.00341796875, -1.708984375, -1.41455078125, -1.1201171875, -0.82568359375, -0.53125, -0.23681640625, 0.0576171875, 0.35205078125, 0.646484375, 0.94091796875, 1.2353515625, 1.52978515625, 1.82421875, 2.11865234375, 2.4130859375, 2.70751953125, 3.001953125, 3.29638671875, 3.5908203125, 3.88525390625, 4.1796875, 4.47412109375, 4.7685546875, 5.06298828125, 5.357421875, 5.65185546875, 5.9462890625, 6.24072265625, 6.53515625, 6.82958984375, 7.1240234375, 7.41845703125, 7.712890625, 8.00732421875, 8.3017578125, 8.59619140625, 8.890625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 6.0, 7.0, 11.0, 9.0, 10.0, 18.0, 39.0, 33.0, 57.0, 43.0, 54.0, 78.0, 54.0, 76.0, 74.0, 78.0, 63.0, 70.0, 47.0, 40.0, 42.0, 26.0, 22.0, 20.0, 13.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.966796875, -2.8792724609375, -2.791748046875, -2.7042236328125, -2.61669921875, -2.5291748046875, -2.441650390625, -2.3541259765625, -2.2666015625, -2.1790771484375, -2.091552734375, -2.0040283203125, -1.91650390625, -1.8289794921875, -1.741455078125, -1.6539306640625, -1.56640625, -1.4788818359375, -1.391357421875, -1.3038330078125, -1.21630859375, -1.1287841796875, -1.041259765625, -0.9537353515625, -0.8662109375, -0.7786865234375, -0.691162109375, -0.6036376953125, -0.51611328125, -0.4285888671875, -0.341064453125, -0.2535400390625, -0.166015625, -0.0784912109375, 0.009033203125, 0.0965576171875, 0.18408203125, 0.2716064453125, 0.359130859375, 0.4466552734375, 0.5341796875, 0.6217041015625, 0.709228515625, 0.7967529296875, 0.88427734375, 0.9718017578125, 1.059326171875, 1.1468505859375, 1.234375, 1.3218994140625, 1.409423828125, 1.4969482421875, 1.58447265625, 1.6719970703125, 1.759521484375, 1.8470458984375, 1.9345703125, 2.0220947265625, 2.109619140625, 2.1971435546875, 2.28466796875, 2.3721923828125, 2.459716796875, 2.5472412109375, 2.634765625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 5.0, 10.0, 5.0, 9.0, 4.0, 23.0, 34.0, 52.0, 76.0, 129.0, 288.0, 619.0, 1927.0, 8768.0, 67923.0, 837186.0, 114991.0, 12507.0, 2520.0, 721.0, 325.0, 155.0, 104.0, 53.0, 42.0, 20.0, 9.0, 12.0, 10.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5146484375, -0.4993324279785156, -0.48401641845703125, -0.4687004089355469, -0.4533843994140625, -0.4380683898925781, -0.42275238037109375, -0.4074363708496094, -0.392120361328125, -0.3768043518066406, -0.36148834228515625, -0.3461723327636719, -0.3308563232421875, -0.3155403137207031, -0.30022430419921875, -0.2849082946777344, -0.26959228515625, -0.2542762756347656, -0.23896026611328125, -0.22364425659179688, -0.2083282470703125, -0.19301223754882812, -0.17769622802734375, -0.16238021850585938, -0.147064208984375, -0.13174819946289062, -0.11643218994140625, -0.10111618041992188, -0.0858001708984375, -0.07048416137695312, -0.05516815185546875, -0.039852142333984375, -0.0245361328125, -0.009220123291015625, 0.00609588623046875, 0.021411895751953125, 0.0367279052734375, 0.052043914794921875, 0.06735992431640625, 0.08267593383789062, 0.097991943359375, 0.11330795288085938, 0.12862396240234375, 0.14393997192382812, 0.1592559814453125, 0.17457199096679688, 0.18988800048828125, 0.20520401000976562, 0.22052001953125, 0.23583602905273438, 0.25115203857421875, 0.2664680480957031, 0.2817840576171875, 0.2971000671386719, 0.31241607666015625, 0.3277320861816406, 0.343048095703125, 0.3583641052246094, 0.37368011474609375, 0.3889961242675781, 0.4043121337890625, 0.4196281433105469, 0.43494415283203125, 0.4502601623535156, 0.465576171875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 8.0, 5.0, 10.0, 7.0, 5.0, 16.0, 16.0, 22.0, 49.0, 60.0, 100.0, 173.0, 180.0, 125.0, 63.0, 46.0, 34.0, 20.0, 16.0, 5.0, 8.0, 12.0, 5.0, 6.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.942583084106445e-05, -5.7637691497802734e-05, -5.5849552154541016e-05, -5.40614128112793e-05, -5.227327346801758e-05, -5.048513412475586e-05, -4.869699478149414e-05, -4.690885543823242e-05, -4.51207160949707e-05, -4.3332576751708984e-05, -4.1544437408447266e-05, -3.975629806518555e-05, -3.796815872192383e-05, -3.618001937866211e-05, -3.439188003540039e-05, -3.260374069213867e-05, -3.081560134887695e-05, -2.9027462005615234e-05, -2.7239322662353516e-05, -2.5451183319091797e-05, -2.3663043975830078e-05, -2.187490463256836e-05, -2.008676528930664e-05, -1.8298625946044922e-05, -1.6510486602783203e-05, -1.4722347259521484e-05, -1.2934207916259766e-05, -1.1146068572998047e-05, -9.357929229736328e-06, -7.569789886474609e-06, -5.781650543212891e-06, -3.993511199951172e-06, -2.205371856689453e-06, -4.172325134277344e-07, 1.3709068298339844e-06, 3.159046173095703e-06, 4.947185516357422e-06, 6.735324859619141e-06, 8.52346420288086e-06, 1.0311603546142578e-05, 1.2099742889404297e-05, 1.3887882232666016e-05, 1.5676021575927734e-05, 1.7464160919189453e-05, 1.9252300262451172e-05, 2.104043960571289e-05, 2.282857894897461e-05, 2.4616718292236328e-05, 2.6404857635498047e-05, 2.8192996978759766e-05, 2.9981136322021484e-05, 3.17692756652832e-05, 3.355741500854492e-05, 3.534555435180664e-05, 3.713369369506836e-05, 3.892183303833008e-05, 4.07099723815918e-05, 4.2498111724853516e-05, 4.4286251068115234e-05, 4.607439041137695e-05, 4.786252975463867e-05, 4.965066909790039e-05, 5.143880844116211e-05, 5.322694778442383e-05, 5.501508712768555e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 7.0, 11.0, 19.0, 47.0, 84.0, 347.0, 2704.0, 105909.0, 927216.0, 11127.0, 792.0, 160.0, 52.0, 25.0, 20.0, 10.0, 4.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0166015625, -0.9850616455078125, -0.953521728515625, -0.9219818115234375, -0.89044189453125, -0.8589019775390625, -0.827362060546875, -0.7958221435546875, -0.7642822265625, -0.7327423095703125, -0.701202392578125, -0.6696624755859375, -0.63812255859375, -0.6065826416015625, -0.575042724609375, -0.5435028076171875, -0.511962890625, -0.4804229736328125, -0.448883056640625, -0.4173431396484375, -0.38580322265625, -0.3542633056640625, -0.322723388671875, -0.2911834716796875, -0.2596435546875, -0.2281036376953125, -0.196563720703125, -0.1650238037109375, -0.13348388671875, -0.1019439697265625, -0.070404052734375, -0.0388641357421875, -0.00732421875, 0.0242156982421875, 0.055755615234375, 0.0872955322265625, 0.11883544921875, 0.1503753662109375, 0.181915283203125, 0.2134552001953125, 0.2449951171875, 0.2765350341796875, 0.308074951171875, 0.3396148681640625, 0.37115478515625, 0.4026947021484375, 0.434234619140625, 0.4657745361328125, 0.497314453125, 0.5288543701171875, 0.560394287109375, 0.5919342041015625, 0.62347412109375, 0.6550140380859375, 0.686553955078125, 0.7180938720703125, 0.7496337890625, 0.7811737060546875, 0.812713623046875, 0.8442535400390625, 0.87579345703125, 0.9073333740234375, 0.938873291015625, 0.9704132080078125, 1.001953125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 3.0, 10.0, 11.0, 9.0, 11.0, 19.0, 19.0, 32.0, 33.0, 28.0, 53.0, 61.0, 93.0, 185.0, 96.0, 67.0, 44.0, 41.0, 45.0, 34.0, 24.0, 5.0, 14.0, 15.0, 9.0, 9.0, 7.0, 5.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0943603515625, -0.09106159210205078, -0.08776283264160156, -0.08446407318115234, -0.08116531372070312, -0.0778665542602539, -0.07456779479980469, -0.07126903533935547, -0.06797027587890625, -0.06467151641845703, -0.06137275695800781, -0.058073997497558594, -0.054775238037109375, -0.051476478576660156, -0.04817771911621094, -0.04487895965576172, -0.0415802001953125, -0.03828144073486328, -0.03498268127441406, -0.031683921813964844, -0.028385162353515625, -0.025086402893066406, -0.021787643432617188, -0.01848888397216797, -0.01519012451171875, -0.011891365051269531, -0.008592605590820312, -0.005293846130371094, -0.001995086669921875, 0.0013036727905273438, 0.0046024322509765625, 0.007901191711425781, 0.011199951171875, 0.014498710632324219, 0.017797470092773438, 0.021096229553222656, 0.024394989013671875, 0.027693748474121094, 0.030992507934570312, 0.03429126739501953, 0.03759002685546875, 0.04088878631591797, 0.04418754577636719, 0.047486305236816406, 0.050785064697265625, 0.054083824157714844, 0.05738258361816406, 0.06068134307861328, 0.0639801025390625, 0.06727886199951172, 0.07057762145996094, 0.07387638092041016, 0.07717514038085938, 0.0804738998413086, 0.08377265930175781, 0.08707141876220703, 0.09037017822265625, 0.09366893768310547, 0.09696769714355469, 0.1002664566040039, 0.10356521606445312, 0.10686397552490234, 0.11016273498535156, 0.11346149444580078, 0.11676025390625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 7.0, 21.0, 50.0, 114.0, 170.0, 209.0, 202.0, 113.0, 59.0, 25.0, 23.0, 8.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4421045780181885, -2.303454875946045, -2.1648051738739014, -2.026155471801758, -1.8875057697296143, -1.7488560676574707, -1.6102063655853271, -1.4715566635131836, -1.33290696144104, -1.1942572593688965, -1.055607557296753, -0.9169578552246094, -0.7783081531524658, -0.6396584510803223, -0.5010087490081787, -0.36235904693603516, -0.2237093448638916, -0.08505964279174805, 0.05359005928039551, 0.19223976135253906, 0.3308894634246826, 0.46953916549682617, 0.6081888675689697, 0.7468385696411133, 0.8854882717132568, 1.0241379737854004, 1.162787675857544, 1.3014373779296875, 1.440087080001831, 1.5787367820739746, 1.7173864841461182, 1.8560361862182617, 1.9946861267089844, 2.133335828781128, 2.2719855308532715, 2.410635232925415, 2.5492849349975586, 2.687934637069702, 2.8265843391418457, 2.9652340412139893, 3.103883743286133, 3.2425334453582764, 3.38118314743042, 3.5198328495025635, 3.658482551574707, 3.7971322536468506, 3.935781955718994, 4.074431419372559, 4.213081359863281, 4.351731300354004, 4.490380764007568, 4.629030227661133, 4.7676801681518555, 4.906330108642578, 5.044979572296143, 5.183629035949707, 5.32227897644043, 5.460928916931152, 5.599578380584717, 5.738227844238281, 5.876877784729004, 6.015527725219727, 6.154177188873291, 6.2928266525268555, 6.431476593017578]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 6.0, 4.0, 3.0, 8.0, 12.0, 10.0, 6.0, 8.0, 15.0, 16.0, 13.0, 16.0, 22.0, 33.0, 24.0, 31.0, 29.0, 35.0, 39.0, 34.0, 27.0, 43.0, 45.0, 44.0, 55.0, 39.0, 39.0, 30.0, 44.0, 27.0, 32.0, 30.0, 34.0, 24.0, 17.0, 18.0, 22.0, 19.0, 9.0, 8.0, 8.0, 7.0, 6.0, 1.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 4.0, 2.0], "bins": [-2.5910654067993164, -2.520235776901245, -2.449406147003174, -2.3785765171051025, -2.3077468872070312, -2.23691725730896, -2.1660876274108887, -2.0952582359313965, -2.024428367614746, -1.9535987377166748, -1.8827691078186035, -1.8119394779205322, -1.741109848022461, -1.6702802181243896, -1.599450707435608, -1.5286210775375366, -1.4577915668487549, -1.3869619369506836, -1.3161323070526123, -1.245302677154541, -1.1744730472564697, -1.1036434173583984, -1.0328139066696167, -0.9619842767715454, -0.8911546468734741, -0.8203250169754028, -0.7494953870773315, -0.678665816783905, -0.6078361868858337, -0.5370065569877625, -0.46617695689201355, -0.39534735679626465, -0.3245178461074829, -0.2536882162094116, -0.18285861611366272, -0.11202900111675262, -0.04119938611984253, 0.02963024377822876, 0.10045984387397766, 0.17128944396972656, 0.24211907386779785, 0.31294870376586914, 0.38377830386161804, 0.45460790395736694, 0.5254375338554382, 0.5962671637535095, 0.667096734046936, 0.7379263639450073, 0.8087559938430786, 0.8795856237411499, 0.9504152536392212, 1.0212448835372925, 1.0920743942260742, 1.1629040241241455, 1.2337336540222168, 1.304563283920288, 1.3753929138183594, 1.4462225437164307, 1.517052173614502, 1.5878818035125732, 1.6587114334106445, 1.7295410633087158, 1.8003705739974976, 1.8712002038955688, 1.9420298337936401]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 4.0, 8.0, 17.0, 20.0, 33.0, 39.0, 72.0, 113.0, 226.0, 473.0, 1266.0, 4059.0, 22332.0, 326808.0, 3594012.0, 219959.0, 19065.0, 3784.0, 1108.0, 433.0, 187.0, 83.0, 68.0, 33.0, 22.0, 13.0, 10.0, 7.0, 6.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.767578125, -2.6991424560546875, -2.630706787109375, -2.5622711181640625, -2.49383544921875, -2.4253997802734375, -2.356964111328125, -2.2885284423828125, -2.2200927734375, -2.1516571044921875, -2.083221435546875, -2.0147857666015625, -1.94635009765625, -1.8779144287109375, -1.809478759765625, -1.7410430908203125, -1.672607421875, -1.6041717529296875, -1.535736083984375, -1.4673004150390625, -1.39886474609375, -1.3304290771484375, -1.261993408203125, -1.1935577392578125, -1.1251220703125, -1.0566864013671875, -0.988250732421875, -0.9198150634765625, -0.85137939453125, -0.7829437255859375, -0.714508056640625, -0.6460723876953125, -0.57763671875, -0.5092010498046875, -0.440765380859375, -0.3723297119140625, -0.30389404296875, -0.2354583740234375, -0.167022705078125, -0.0985870361328125, -0.0301513671875, 0.0382843017578125, 0.106719970703125, 0.1751556396484375, 0.24359130859375, 0.3120269775390625, 0.380462646484375, 0.4488983154296875, 0.517333984375, 0.5857696533203125, 0.654205322265625, 0.7226409912109375, 0.79107666015625, 0.8595123291015625, 0.927947998046875, 0.9963836669921875, 1.0648193359375, 1.1332550048828125, 1.201690673828125, 1.2701263427734375, 1.33856201171875, 1.4069976806640625, 1.475433349609375, 1.5438690185546875, 1.6123046875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 6.0, 9.0, 10.0, 14.0, 13.0, 22.0, 18.0, 39.0, 34.0, 42.0, 63.0, 54.0, 57.0, 57.0, 66.0, 69.0, 85.0, 64.0, 52.0, 50.0, 46.0, 33.0, 31.0, 19.0, 6.0, 14.0, 10.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.125, -1.0933151245117188, -1.0616302490234375, -1.0299453735351562, -0.998260498046875, -0.9665756225585938, -0.9348907470703125, -0.9032058715820312, -0.87152099609375, -0.8398361206054688, -0.8081512451171875, -0.7764663696289062, -0.744781494140625, -0.7130966186523438, -0.6814117431640625, -0.6497268676757812, -0.6180419921875, -0.5863571166992188, -0.5546722412109375, -0.5229873657226562, -0.491302490234375, -0.45961761474609375, -0.4279327392578125, -0.39624786376953125, -0.36456298828125, -0.33287811279296875, -0.3011932373046875, -0.26950836181640625, -0.237823486328125, -0.20613861083984375, -0.1744537353515625, -0.14276885986328125, -0.111083984375, -0.07939910888671875, -0.0477142333984375, -0.01602935791015625, 0.015655517578125, 0.04734039306640625, 0.0790252685546875, 0.11071014404296875, 0.14239501953125, 0.17407989501953125, 0.2057647705078125, 0.23744964599609375, 0.269134521484375, 0.30081939697265625, 0.3325042724609375, 0.36418914794921875, 0.3958740234375, 0.42755889892578125, 0.4592437744140625, 0.49092864990234375, 0.522613525390625, 0.5542984008789062, 0.5859832763671875, 0.6176681518554688, 0.64935302734375, 0.6810379028320312, 0.7127227783203125, 0.7444076538085938, 0.776092529296875, 0.8077774047851562, 0.8394622802734375, 0.8711471557617188, 0.90283203125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 13.0, 20.0, 49.0, 89.0, 544.0, 16393.0, 4168684.0, 7928.0, 385.0, 105.0, 33.0, 12.0, 11.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.655517578125, -8.43603515625, -8.216552734375, -7.9970703125, -7.777587890625, -7.55810546875, -7.338623046875, -7.119140625, -6.899658203125, -6.68017578125, -6.460693359375, -6.2412109375, -6.021728515625, -5.80224609375, -5.582763671875, -5.36328125, -5.143798828125, -4.92431640625, -4.704833984375, -4.4853515625, -4.265869140625, -4.04638671875, -3.826904296875, -3.607421875, -3.387939453125, -3.16845703125, -2.948974609375, -2.7294921875, -2.510009765625, -2.29052734375, -2.071044921875, -1.8515625, -1.632080078125, -1.41259765625, -1.193115234375, -0.9736328125, -0.754150390625, -0.53466796875, -0.315185546875, -0.095703125, 0.123779296875, 0.34326171875, 0.562744140625, 0.7822265625, 1.001708984375, 1.22119140625, 1.440673828125, 1.66015625, 1.879638671875, 2.09912109375, 2.318603515625, 2.5380859375, 2.757568359375, 2.97705078125, 3.196533203125, 3.416015625, 3.635498046875, 3.85498046875, 4.074462890625, 4.2939453125, 4.513427734375, 4.73291015625, 4.952392578125, 5.171875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 11.0, 11.0, 10.0, 15.0, 18.0, 21.0, 45.0, 41.0, 52.0, 93.0, 115.0, 152.0, 231.0, 308.0, 492.0, 711.0, 534.0, 371.0, 255.0, 125.0, 109.0, 73.0, 61.0, 55.0, 42.0, 29.0, 16.0, 16.0, 15.0, 9.0, 8.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2493896484375, -0.2403697967529297, -0.23134994506835938, -0.22233009338378906, -0.21331024169921875, -0.20429039001464844, -0.19527053833007812, -0.1862506866455078, -0.1772308349609375, -0.1682109832763672, -0.15919113159179688, -0.15017127990722656, -0.14115142822265625, -0.13213157653808594, -0.12311172485351562, -0.11409187316894531, -0.105072021484375, -0.09605216979980469, -0.08703231811523438, -0.07801246643066406, -0.06899261474609375, -0.05997276306152344, -0.050952911376953125, -0.04193305969238281, -0.0329132080078125, -0.023893356323242188, -0.014873504638671875, -0.0058536529541015625, 0.00316619873046875, 0.012186050415039062, 0.021205902099609375, 0.030225753784179688, 0.03924560546875, 0.04826545715332031, 0.057285308837890625, 0.06630516052246094, 0.07532501220703125, 0.08434486389160156, 0.09336471557617188, 0.10238456726074219, 0.1114044189453125, 0.12042427062988281, 0.12944412231445312, 0.13846397399902344, 0.14748382568359375, 0.15650367736816406, 0.16552352905273438, 0.1745433807373047, 0.183563232421875, 0.1925830841064453, 0.20160293579101562, 0.21062278747558594, 0.21964263916015625, 0.22866249084472656, 0.23768234252929688, 0.2467021942138672, 0.2557220458984375, 0.2647418975830078, 0.2737617492675781, 0.28278160095214844, 0.29180145263671875, 0.30082130432128906, 0.3098411560058594, 0.3188610076904297, 0.327880859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 5.0, 13.0, 21.0, 29.0, 32.0, 61.0, 73.0, 105.0, 125.0, 111.0, 105.0, 93.0, 65.0, 40.0, 33.0, 23.0, 17.0, 11.0, 7.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.1261439323425293, -2.073329210281372, -2.020514726638794, -1.9677000045776367, -1.914885401725769, -1.8620707988739014, -1.8092561960220337, -1.756441593170166, -1.7036268711090088, -1.6508122682571411, -1.5979976654052734, -1.5451829433441162, -1.4923683404922485, -1.4395537376403809, -1.3867391347885132, -1.3339245319366455, -1.2811099290847778, -1.2282953262329102, -1.1754807233810425, -1.1226661205291748, -1.0698513984680176, -1.01703679561615, -0.9642221927642822, -0.9114075899124146, -0.8585929274559021, -0.8057783246040344, -0.752963662147522, -0.7001490592956543, -0.6473344564437866, -0.5945197939872742, -0.5417051911354065, -0.48889055848121643, -0.4360760450363159, -0.38326141238212585, -0.3304467797279358, -0.2776321768760681, -0.22481754422187805, -0.172002911567688, -0.11918830871582031, -0.06637367606163025, -0.013559043407440186, 0.03925558179616928, 0.09207020699977875, 0.14488482475280762, 0.19769945740699768, 0.25051409006118774, 0.3033286929130554, 0.3561433255672455, 0.40895795822143555, 0.4617725908756256, 0.5145872235298157, 0.5674018263816833, 0.6202164888381958, 0.6730310916900635, 0.7258456945419312, 0.7786602973937988, 0.8314749598503113, 0.884289562702179, 0.9371042251586914, 0.9899188280105591, 1.0427334308624268, 1.095548152923584, 1.148362636566162, 1.2011773586273193, 1.253991961479187]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 2.0, 4.0, 6.0, 12.0, 6.0, 12.0, 9.0, 12.0, 10.0, 20.0, 22.0, 19.0, 27.0, 38.0, 27.0, 40.0, 44.0, 51.0, 44.0, 50.0, 40.0, 50.0, 47.0, 38.0, 41.0, 48.0, 47.0, 34.0, 40.0, 22.0, 33.0, 23.0, 16.0, 21.0, 9.0, 9.0, 6.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8382196426391602, -0.8120490312576294, -0.7858783602714539, -0.7597077488899231, -0.7335370779037476, -0.7073664665222168, -0.681195855140686, -0.6550252437591553, -0.6288545727729797, -0.602683961391449, -0.5765132904052734, -0.5503426790237427, -0.5241720676422119, -0.4980013966560364, -0.4718307852745056, -0.44566014409065247, -0.4194895029067993, -0.39331886172294617, -0.367148220539093, -0.34097760915756226, -0.3148069679737091, -0.28863632678985596, -0.2624657154083252, -0.23629507422447205, -0.2101244330406189, -0.18395379185676575, -0.1577831655740738, -0.13161253929138184, -0.10544189810752869, -0.07927125692367554, -0.05310063064098358, -0.026930004358291626, -0.0007593035697937012, 0.02541133016347885, 0.051581963896751404, 0.07775259763002396, 0.10392323136329651, 0.13009387254714966, 0.1562644988298416, 0.18243512511253357, 0.20860576629638672, 0.23477640748023987, 0.260947048664093, 0.2871176600456238, 0.31328830122947693, 0.3394589424133301, 0.36562955379486084, 0.391800194978714, 0.41797083616256714, 0.4441414773464203, 0.47031211853027344, 0.4964827299118042, 0.522653341293335, 0.5488240122795105, 0.5749946236610413, 0.6011652946472168, 0.6273359060287476, 0.6535065174102783, 0.6796771883964539, 0.7058477997779846, 0.7320184707641602, 0.7581890821456909, 0.7843596935272217, 0.8105303049087524, 0.836700975894928]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 10.0, 7.0, 9.0, 16.0, 31.0, 44.0, 78.0, 191.0, 358.0, 909.0, 2350.0, 6703.0, 22151.0, 96274.0, 438663.0, 374908.0, 77913.0, 18651.0, 5685.0, 1995.0, 816.0, 371.0, 194.0, 105.0, 42.0, 26.0, 19.0, 8.0, 5.0, 6.0, 2.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.65625, -0.6398162841796875, -0.623382568359375, -0.6069488525390625, -0.59051513671875, -0.5740814208984375, -0.557647705078125, -0.5412139892578125, -0.5247802734375, -0.5083465576171875, -0.491912841796875, -0.4754791259765625, -0.45904541015625, -0.4426116943359375, -0.426177978515625, -0.4097442626953125, -0.393310546875, -0.3768768310546875, -0.360443115234375, -0.3440093994140625, -0.32757568359375, -0.3111419677734375, -0.294708251953125, -0.2782745361328125, -0.2618408203125, -0.2454071044921875, -0.228973388671875, -0.2125396728515625, -0.19610595703125, -0.1796722412109375, -0.163238525390625, -0.1468048095703125, -0.13037109375, -0.1139373779296875, -0.097503662109375, -0.0810699462890625, -0.06463623046875, -0.0482025146484375, -0.031768798828125, -0.0153350830078125, 0.0010986328125, 0.0175323486328125, 0.033966064453125, 0.0503997802734375, 0.06683349609375, 0.0832672119140625, 0.099700927734375, 0.1161346435546875, 0.132568359375, 0.1490020751953125, 0.165435791015625, 0.1818695068359375, 0.19830322265625, 0.2147369384765625, 0.231170654296875, 0.2476043701171875, 0.2640380859375, 0.2804718017578125, 0.296905517578125, 0.3133392333984375, 0.32977294921875, 0.3462066650390625, 0.362640380859375, 0.3790740966796875, 0.3955078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 9.0, 6.0, 10.0, 9.0, 14.0, 18.0, 31.0, 44.0, 58.0, 87.0, 88.0, 87.0, 97.0, 89.0, 91.0, 72.0, 50.0, 49.0, 37.0, 19.0, 19.0, 13.0, 8.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6083984375, -0.5771636962890625, -0.545928955078125, -0.5146942138671875, -0.48345947265625, -0.4522247314453125, -0.420989990234375, -0.3897552490234375, -0.3585205078125, -0.3272857666015625, -0.296051025390625, -0.2648162841796875, -0.23358154296875, -0.2023468017578125, -0.171112060546875, -0.1398773193359375, -0.108642578125, -0.0774078369140625, -0.046173095703125, -0.0149383544921875, 0.01629638671875, 0.0475311279296875, 0.078765869140625, 0.1100006103515625, 0.1412353515625, 0.1724700927734375, 0.203704833984375, 0.2349395751953125, 0.26617431640625, 0.2974090576171875, 0.328643798828125, 0.3598785400390625, 0.39111328125, 0.4223480224609375, 0.453582763671875, 0.4848175048828125, 0.51605224609375, 0.5472869873046875, 0.578521728515625, 0.6097564697265625, 0.6409912109375, 0.6722259521484375, 0.703460693359375, 0.7346954345703125, 0.76593017578125, 0.7971649169921875, 0.828399658203125, 0.8596343994140625, 0.890869140625, 0.9221038818359375, 0.953338623046875, 0.9845733642578125, 1.01580810546875, 1.0470428466796875, 1.078277587890625, 1.1095123291015625, 1.1407470703125, 1.1719818115234375, 1.203216552734375, 1.2344512939453125, 1.26568603515625, 1.2969207763671875, 1.328155517578125, 1.3593902587890625, 1.390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 7.0, 1.0, 5.0, 9.0, 10.0, 13.0, 15.0, 27.0, 30.0, 48.0, 63.0, 103.0, 142.0, 224.0, 372.0, 611.0, 1100.0, 2183.0, 4806.0, 11479.0, 33044.0, 124476.0, 444696.0, 312250.0, 75181.0, 22118.0, 8078.0, 3553.0, 1721.0, 821.0, 482.0, 291.0, 182.0, 115.0, 74.0, 65.0, 34.0, 32.0, 15.0, 21.0, 14.0, 6.0, 14.0, 8.0, 3.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.31884765625, -0.3088264465332031, -0.29880523681640625, -0.2887840270996094, -0.2787628173828125, -0.2687416076660156, -0.25872039794921875, -0.24869918823242188, -0.238677978515625, -0.22865676879882812, -0.21863555908203125, -0.20861434936523438, -0.1985931396484375, -0.18857192993164062, -0.17855072021484375, -0.16852951049804688, -0.15850830078125, -0.14848709106445312, -0.13846588134765625, -0.12844467163085938, -0.1184234619140625, -0.10840225219726562, -0.09838104248046875, -0.08835983276367188, -0.078338623046875, -0.06831741333007812, -0.05829620361328125, -0.048274993896484375, -0.0382537841796875, -0.028232574462890625, -0.01821136474609375, -0.008190155029296875, 0.0018310546875, 0.011852264404296875, 0.02187347412109375, 0.031894683837890625, 0.0419158935546875, 0.051937103271484375, 0.06195831298828125, 0.07197952270507812, 0.082000732421875, 0.09202194213867188, 0.10204315185546875, 0.11206436157226562, 0.1220855712890625, 0.13210678100585938, 0.14212799072265625, 0.15214920043945312, 0.16217041015625, 0.17219161987304688, 0.18221282958984375, 0.19223403930664062, 0.2022552490234375, 0.21227645874023438, 0.22229766845703125, 0.23231887817382812, 0.242340087890625, 0.2523612976074219, 0.26238250732421875, 0.2724037170410156, 0.2824249267578125, 0.2924461364746094, 0.30246734619140625, 0.3124885559082031, 0.322509765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 9.0, 7.0, 9.0, 13.0, 10.0, 9.0, 13.0, 14.0, 22.0, 27.0, 37.0, 21.0, 32.0, 42.0, 44.0, 41.0, 46.0, 45.0, 45.0, 36.0, 45.0, 47.0, 59.0, 40.0, 30.0, 51.0, 30.0, 26.0, 22.0, 20.0, 24.0, 12.0, 14.0, 9.0, 12.0, 7.0, 7.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.9189453125, -0.8901519775390625, -0.861358642578125, -0.8325653076171875, -0.80377197265625, -0.7749786376953125, -0.746185302734375, -0.7173919677734375, -0.6885986328125, -0.6598052978515625, -0.631011962890625, -0.6022186279296875, -0.57342529296875, -0.5446319580078125, -0.515838623046875, -0.4870452880859375, -0.458251953125, -0.4294586181640625, -0.400665283203125, -0.3718719482421875, -0.34307861328125, -0.3142852783203125, -0.285491943359375, -0.2566986083984375, -0.2279052734375, -0.1991119384765625, -0.170318603515625, -0.1415252685546875, -0.11273193359375, -0.0839385986328125, -0.055145263671875, -0.0263519287109375, 0.00244140625, 0.0312347412109375, 0.060028076171875, 0.0888214111328125, 0.11761474609375, 0.1464080810546875, 0.175201416015625, 0.2039947509765625, 0.2327880859375, 0.2615814208984375, 0.290374755859375, 0.3191680908203125, 0.34796142578125, 0.3767547607421875, 0.405548095703125, 0.4343414306640625, 0.463134765625, 0.4919281005859375, 0.520721435546875, 0.5495147705078125, 0.57830810546875, 0.6071014404296875, 0.635894775390625, 0.6646881103515625, 0.6934814453125, 0.7222747802734375, 0.751068115234375, 0.7798614501953125, 0.80865478515625, 0.8374481201171875, 0.866241455078125, 0.8950347900390625, 0.923828125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 13.0, 18.0, 28.0, 36.0, 54.0, 75.0, 107.0, 200.0, 323.0, 507.0, 879.0, 1565.0, 2894.0, 5775.0, 13100.0, 33716.0, 110654.0, 423219.0, 326564.0, 80924.0, 26635.0, 10584.0, 4866.0, 2475.0, 1360.0, 736.0, 456.0, 268.0, 166.0, 128.0, 82.0, 38.0, 32.0, 19.0, 16.0, 14.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.134765625, -0.130401611328125, -0.12603759765625, -0.121673583984375, -0.1173095703125, -0.112945556640625, -0.10858154296875, -0.104217529296875, -0.099853515625, -0.095489501953125, -0.09112548828125, -0.086761474609375, -0.0823974609375, -0.078033447265625, -0.07366943359375, -0.069305419921875, -0.06494140625, -0.060577392578125, -0.05621337890625, -0.051849365234375, -0.0474853515625, -0.043121337890625, -0.03875732421875, -0.034393310546875, -0.030029296875, -0.025665283203125, -0.02130126953125, -0.016937255859375, -0.0125732421875, -0.008209228515625, -0.00384521484375, 0.000518798828125, 0.0048828125, 0.009246826171875, 0.01361083984375, 0.017974853515625, 0.0223388671875, 0.026702880859375, 0.03106689453125, 0.035430908203125, 0.039794921875, 0.044158935546875, 0.04852294921875, 0.052886962890625, 0.0572509765625, 0.061614990234375, 0.06597900390625, 0.070343017578125, 0.07470703125, 0.079071044921875, 0.08343505859375, 0.087799072265625, 0.0921630859375, 0.096527099609375, 0.10089111328125, 0.105255126953125, 0.109619140625, 0.113983154296875, 0.11834716796875, 0.122711181640625, 0.1270751953125, 0.131439208984375, 0.13580322265625, 0.140167236328125, 0.14453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 5.0, 5.0, 8.0, 7.0, 15.0, 6.0, 24.0, 46.0, 52.0, 73.0, 107.0, 164.0, 142.0, 111.0, 80.0, 50.0, 23.0, 26.0, 12.0, 9.0, 9.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012922286987304688, -0.00012488290667533875, -0.00012054294347763062, -0.00011620298027992249, -0.00011186301708221436, -0.00010752305388450623, -0.0001031830906867981, -9.884312748908997e-05, -9.450316429138184e-05, -9.01632010936737e-05, -8.582323789596558e-05, -8.148327469825745e-05, -7.714331150054932e-05, -7.280334830284119e-05, -6.846338510513306e-05, -6.412342190742493e-05, -5.97834587097168e-05, -5.544349551200867e-05, -5.110353231430054e-05, -4.676356911659241e-05, -4.242360591888428e-05, -3.808364272117615e-05, -3.374367952346802e-05, -2.9403716325759888e-05, -2.5063753128051758e-05, -2.0723789930343628e-05, -1.6383826732635498e-05, -1.2043863534927368e-05, -7.703900337219238e-06, -3.3639371395111084e-06, 9.760260581970215e-07, 5.315989255905151e-06, 9.655952453613281e-06, 1.3995915651321411e-05, 1.833587884902954e-05, 2.267584204673767e-05, 2.70158052444458e-05, 3.135576844215393e-05, 3.569573163986206e-05, 4.003569483757019e-05, 4.437565803527832e-05, 4.871562123298645e-05, 5.305558443069458e-05, 5.739554762840271e-05, 6.173551082611084e-05, 6.607547402381897e-05, 7.04154372215271e-05, 7.475540041923523e-05, 7.909536361694336e-05, 8.343532681465149e-05, 8.777529001235962e-05, 9.211525321006775e-05, 9.645521640777588e-05, 0.00010079517960548401, 0.00010513514280319214, 0.00010947510600090027, 0.0001138150691986084, 0.00011815503239631653, 0.00012249499559402466, 0.0001268349587917328, 0.00013117492198944092, 0.00013551488518714905, 0.00013985484838485718, 0.0001441948115825653, 0.00014853477478027344]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 10.0, 24.0, 23.0, 49.0, 55.0, 67.0, 114.0, 210.0, 268.0, 419.0, 748.0, 1333.0, 2463.0, 4952.0, 10369.0, 24067.0, 65995.0, 208005.0, 415663.0, 204400.0, 64684.0, 23918.0, 10138.0, 4795.0, 2457.0, 1311.0, 751.0, 434.0, 280.0, 183.0, 99.0, 68.0, 62.0, 40.0, 18.0, 19.0, 12.0, 9.0, 5.0, 2.0, 5.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0], "bins": [-0.133056640625, -0.12919902801513672, -0.12534141540527344, -0.12148380279541016, -0.11762619018554688, -0.1137685775756836, -0.10991096496582031, -0.10605335235595703, -0.10219573974609375, -0.09833812713623047, -0.09448051452636719, -0.0906229019165039, -0.08676528930664062, -0.08290767669677734, -0.07905006408691406, -0.07519245147705078, -0.0713348388671875, -0.06747722625732422, -0.06361961364746094, -0.059762001037597656, -0.055904388427734375, -0.052046775817871094, -0.04818916320800781, -0.04433155059814453, -0.04047393798828125, -0.03661632537841797, -0.03275871276855469, -0.028901100158691406, -0.025043487548828125, -0.021185874938964844, -0.017328262329101562, -0.013470649719238281, -0.009613037109375, -0.005755424499511719, -0.0018978118896484375, 0.0019598007202148438, 0.005817413330078125, 0.009675025939941406, 0.013532638549804688, 0.01739025115966797, 0.02124786376953125, 0.02510547637939453, 0.028963088989257812, 0.032820701599121094, 0.036678314208984375, 0.040535926818847656, 0.04439353942871094, 0.04825115203857422, 0.0521087646484375, 0.05596637725830078, 0.05982398986816406, 0.06368160247802734, 0.06753921508789062, 0.0713968276977539, 0.07525444030761719, 0.07911205291748047, 0.08296966552734375, 0.08682727813720703, 0.09068489074707031, 0.0945425033569336, 0.09840011596679688, 0.10225772857666016, 0.10611534118652344, 0.10997295379638672, 0.11383056640625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 5.0, 18.0, 19.0, 24.0, 18.0, 37.0, 54.0, 61.0, 58.0, 73.0, 84.0, 82.0, 80.0, 72.0, 68.0, 48.0, 42.0, 25.0, 24.0, 16.0, 9.0, 17.0, 15.0, 10.0, 10.0, 8.0, 1.0, 6.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036773681640625, -0.03556632995605469, -0.034358978271484375, -0.03315162658691406, -0.03194427490234375, -0.030736923217773438, -0.029529571533203125, -0.028322219848632812, -0.0271148681640625, -0.025907516479492188, -0.024700164794921875, -0.023492813110351562, -0.02228546142578125, -0.021078109741210938, -0.019870758056640625, -0.018663406372070312, -0.0174560546875, -0.016248703002929688, -0.015041351318359375, -0.013833999633789062, -0.01262664794921875, -0.011419296264648438, -0.010211944580078125, -0.009004592895507812, -0.0077972412109375, -0.0065898895263671875, -0.005382537841796875, -0.0041751861572265625, -0.00296783447265625, -0.0017604827880859375, -0.000553131103515625, 0.0006542205810546875, 0.001861572265625, 0.0030689239501953125, 0.004276275634765625, 0.0054836273193359375, 0.00669097900390625, 0.007898330688476562, 0.009105682373046875, 0.010313034057617188, 0.0115203857421875, 0.012727737426757812, 0.013935089111328125, 0.015142440795898438, 0.01634979248046875, 0.017557144165039062, 0.018764495849609375, 0.019971847534179688, 0.02117919921875, 0.022386550903320312, 0.023593902587890625, 0.024801254272460938, 0.02600860595703125, 0.027215957641601562, 0.028423309326171875, 0.029630661010742188, 0.0308380126953125, 0.03204536437988281, 0.033252716064453125, 0.03446006774902344, 0.03566741943359375, 0.03687477111816406, 0.038082122802734375, 0.03928947448730469, 0.040496826171875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 7.0, 4.0, 5.0, 18.0, 26.0, 65.0, 108.0, 161.0, 163.0, 184.0, 108.0, 70.0, 33.0, 13.0, 11.0, 7.0, 10.0, 4.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1375699043273926, -2.088608503341675, -2.039647102355957, -1.9906858205795288, -1.9417245388031006, -1.8927631378173828, -1.843801736831665, -1.7948404550552368, -1.745879054069519, -1.6969176530838013, -1.647956371307373, -1.5989949703216553, -1.550033688545227, -1.5010722875595093, -1.452111005783081, -1.4031496047973633, -1.3541882038116455, -1.3052268028259277, -1.2562655210494995, -1.2073041200637817, -1.1583428382873535, -1.1093814373016357, -1.060420036315918, -1.0114587545394897, -0.9624974727630615, -0.9135361313819885, -0.8645747900009155, -0.8156133890151978, -0.7666520476341248, -0.7176907062530518, -0.6687293648719788, -0.6197680234909058, -0.570806622505188, -0.521845281124115, -0.4728839099407196, -0.4239225685596466, -0.3749611973762512, -0.3259998559951782, -0.2770385146141052, -0.22807714343070984, -0.17911580204963684, -0.13015444576740265, -0.08119309693574905, -0.03223174810409546, 0.016729608178138733, 0.06569096446037292, 0.11465230584144592, 0.1636136770248413, 0.2125750184059143, 0.2615363597869873, 0.3104977309703827, 0.3594590723514557, 0.4084204435348511, 0.4573817849159241, 0.5063431262969971, 0.5553045272827148, 0.6042658090591431, 0.6532271504402161, 0.7021884918212891, 0.7511498928070068, 0.8001112341880798, 0.8490725755691528, 0.8980339169502258, 0.9469952583312988, 0.9959566593170166]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 12.0, 13.0, 14.0, 19.0, 25.0, 39.0, 40.0, 57.0, 80.0, 84.0, 106.0, 89.0, 95.0, 90.0, 69.0, 53.0, 48.0, 22.0, 18.0, 13.0, 10.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5825619697570801, -0.5521473288536072, -0.5217326283454895, -0.4913179874420166, -0.4609033167362213, -0.430488646030426, -0.4000740051269531, -0.36965933442115784, -0.33924466371536255, -0.30882999300956726, -0.278415322303772, -0.24800068140029907, -0.21758601069450378, -0.1871713399887085, -0.1567566841840744, -0.1263420283794403, -0.09592735767364502, -0.06551269441843033, -0.03509803116321564, -0.004683367908000946, 0.025731295347213745, 0.05614596605300903, 0.08656062185764313, 0.11697527766227722, 0.1473899483680725, 0.1778046190738678, 0.2082192748785019, 0.238633930683136, 0.2690486013889313, 0.29946327209472656, 0.32987791299819946, 0.36029258370399475, 0.39070725440979004, 0.4211219251155853, 0.4515365958213806, 0.4819512367248535, 0.5123659372329712, 0.5427805781364441, 0.573195219039917, 0.6036099195480347, 0.6340245604515076, 0.6644392013549805, 0.6948539018630981, 0.725268542766571, 0.755683183670044, 0.7860978841781616, 0.8165125250816345, 0.8469271659851074, 0.8773418664932251, 0.907756507396698, 0.9381712079048157, 0.9685858488082886, 0.9990005493164062, 1.0294151306152344, 1.059829831123352, 1.0902445316314697, 1.1206591129302979, 1.1510738134384155, 1.1814883947372437, 1.2119030952453613, 1.242317795753479, 1.2727324962615967, 1.3031470775604248, 1.3335617780685425, 1.3639764785766602]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 10.0, 5.0, 12.0, 14.0, 25.0, 48.0, 73.0, 123.0, 211.0, 457.0, 929.0, 2116.0, 5569.0, 17391.0, 68852.0, 340352.0, 475597.0, 100606.0, 23907.0, 7274.0, 2718.0, 1078.0, 515.0, 294.0, 154.0, 89.0, 36.0, 31.0, 23.0, 9.0, 6.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.88720703125, -0.859588623046875, -0.83197021484375, -0.804351806640625, -0.7767333984375, -0.749114990234375, -0.72149658203125, -0.693878173828125, -0.666259765625, -0.638641357421875, -0.61102294921875, -0.583404541015625, -0.5557861328125, -0.528167724609375, -0.50054931640625, -0.472930908203125, -0.4453125, -0.417694091796875, -0.39007568359375, -0.362457275390625, -0.3348388671875, -0.307220458984375, -0.27960205078125, -0.251983642578125, -0.224365234375, -0.196746826171875, -0.16912841796875, -0.141510009765625, -0.1138916015625, -0.086273193359375, -0.05865478515625, -0.031036376953125, -0.00341796875, 0.024200439453125, 0.05181884765625, 0.079437255859375, 0.1070556640625, 0.134674072265625, 0.16229248046875, 0.189910888671875, 0.217529296875, 0.245147705078125, 0.27276611328125, 0.300384521484375, 0.3280029296875, 0.355621337890625, 0.38323974609375, 0.410858154296875, 0.4384765625, 0.466094970703125, 0.49371337890625, 0.521331787109375, 0.5489501953125, 0.576568603515625, 0.60418701171875, 0.631805419921875, 0.659423828125, 0.687042236328125, 0.71466064453125, 0.742279052734375, 0.7698974609375, 0.797515869140625, 0.82513427734375, 0.852752685546875, 0.88037109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 5.0, 8.0, 5.0, 1.0, 7.0, 4.0, 5.0, 10.0, 9.0, 13.0, 18.0, 21.0, 16.0, 28.0, 35.0, 34.0, 36.0, 38.0, 43.0, 50.0, 51.0, 53.0, 56.0, 56.0, 47.0, 59.0, 38.0, 49.0, 37.0, 29.0, 31.0, 18.0, 24.0, 10.0, 5.0, 12.0, 9.0, 9.0, 1.0, 8.0, 2.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.962890625, -0.92828369140625, -0.8936767578125, -0.85906982421875, -0.824462890625, -0.78985595703125, -0.7552490234375, -0.72064208984375, -0.68603515625, -0.65142822265625, -0.6168212890625, -0.58221435546875, -0.547607421875, -0.51300048828125, -0.4783935546875, -0.44378662109375, -0.4091796875, -0.37457275390625, -0.3399658203125, -0.30535888671875, -0.270751953125, -0.23614501953125, -0.2015380859375, -0.16693115234375, -0.13232421875, -0.09771728515625, -0.0631103515625, -0.02850341796875, 0.006103515625, 0.04071044921875, 0.0753173828125, 0.10992431640625, 0.14453125, 0.17913818359375, 0.2137451171875, 0.24835205078125, 0.282958984375, 0.31756591796875, 0.3521728515625, 0.38677978515625, 0.42138671875, 0.45599365234375, 0.4906005859375, 0.52520751953125, 0.559814453125, 0.59442138671875, 0.6290283203125, 0.66363525390625, 0.6982421875, 0.73284912109375, 0.7674560546875, 0.80206298828125, 0.836669921875, 0.87127685546875, 0.9058837890625, 0.94049072265625, 0.97509765625, 1.00970458984375, 1.0443115234375, 1.07891845703125, 1.113525390625, 1.14813232421875, 1.1827392578125, 1.21734619140625, 1.251953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 2.0, 3.0, 9.0, 5.0, 10.0, 9.0, 13.0, 12.0, 16.0, 23.0, 30.0, 28.0, 23.0, 32.0, 30.0, 37.0, 57.0, 68.0, 155.0, 1229.0, 255419.0, 788490.0, 2263.0, 178.0, 60.0, 47.0, 44.0, 34.0, 31.0, 23.0, 29.0, 23.0, 18.0, 13.0, 11.0, 16.0, 12.0, 7.0, 9.0, 7.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.53125, -3.41387939453125, -3.2965087890625, -3.17913818359375, -3.061767578125, -2.94439697265625, -2.8270263671875, -2.70965576171875, -2.59228515625, -2.47491455078125, -2.3575439453125, -2.24017333984375, -2.122802734375, -2.00543212890625, -1.8880615234375, -1.77069091796875, -1.6533203125, -1.53594970703125, -1.4185791015625, -1.30120849609375, -1.183837890625, -1.06646728515625, -0.9490966796875, -0.83172607421875, -0.71435546875, -0.59698486328125, -0.4796142578125, -0.36224365234375, -0.244873046875, -0.12750244140625, -0.0101318359375, 0.10723876953125, 0.224609375, 0.34197998046875, 0.4593505859375, 0.57672119140625, 0.694091796875, 0.81146240234375, 0.9288330078125, 1.04620361328125, 1.16357421875, 1.28094482421875, 1.3983154296875, 1.51568603515625, 1.633056640625, 1.75042724609375, 1.8677978515625, 1.98516845703125, 2.1025390625, 2.21990966796875, 2.3372802734375, 2.45465087890625, 2.572021484375, 2.68939208984375, 2.8067626953125, 2.92413330078125, 3.04150390625, 3.15887451171875, 3.2762451171875, 3.39361572265625, 3.510986328125, 3.62835693359375, 3.7457275390625, 3.86309814453125, 3.98046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 7.0, 10.0, 8.0, 11.0, 8.0, 15.0, 18.0, 21.0, 31.0, 22.0, 26.0, 33.0, 36.0, 37.0, 44.0, 51.0, 38.0, 39.0, 29.0, 34.0, 34.0, 47.0, 38.0, 45.0, 36.0, 35.0, 30.0, 27.0, 30.0, 22.0, 16.0, 21.0, 18.0, 17.0, 12.0, 9.0, 4.0, 5.0, 7.0, 7.0, 2.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0625, -1.0273284912109375, -0.992156982421875, -0.9569854736328125, -0.92181396484375, -0.8866424560546875, -0.851470947265625, -0.8162994384765625, -0.7811279296875, -0.7459564208984375, -0.710784912109375, -0.6756134033203125, -0.64044189453125, -0.6052703857421875, -0.570098876953125, -0.5349273681640625, -0.499755859375, -0.4645843505859375, -0.429412841796875, -0.3942413330078125, -0.35906982421875, -0.3238983154296875, -0.288726806640625, -0.2535552978515625, -0.2183837890625, -0.1832122802734375, -0.148040771484375, -0.1128692626953125, -0.07769775390625, -0.0425262451171875, -0.007354736328125, 0.0278167724609375, 0.06298828125, 0.0981597900390625, 0.133331298828125, 0.1685028076171875, 0.20367431640625, 0.2388458251953125, 0.274017333984375, 0.3091888427734375, 0.3443603515625, 0.3795318603515625, 0.414703369140625, 0.4498748779296875, 0.48504638671875, 0.5202178955078125, 0.555389404296875, 0.5905609130859375, 0.625732421875, 0.6609039306640625, 0.696075439453125, 0.7312469482421875, 0.76641845703125, 0.8015899658203125, 0.836761474609375, 0.8719329833984375, 0.9071044921875, 0.9422760009765625, 0.977447509765625, 1.0126190185546875, 1.04779052734375, 1.0829620361328125, 1.118133544921875, 1.1533050537109375, 1.1884765625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 4.0, 6.0, 11.0, 19.0, 19.0, 27.0, 36.0, 64.0, 139.0, 332.0, 840.0, 2899.0, 14592.0, 239253.0, 751387.0, 31689.0, 5047.0, 1325.0, 454.0, 175.0, 88.0, 56.0, 27.0, 23.0, 10.0, 12.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56494140625, -0.5484123229980469, -0.5318832397460938, -0.5153541564941406, -0.4988250732421875, -0.4822959899902344, -0.46576690673828125, -0.4492378234863281, -0.432708740234375, -0.4161796569824219, -0.39965057373046875, -0.3831214904785156, -0.3665924072265625, -0.3500633239746094, -0.33353424072265625, -0.3170051574707031, -0.30047607421875, -0.2839469909667969, -0.26741790771484375, -0.2508888244628906, -0.2343597412109375, -0.21783065795898438, -0.20130157470703125, -0.18477249145507812, -0.168243408203125, -0.15171432495117188, -0.13518524169921875, -0.11865615844726562, -0.1021270751953125, -0.08559799194335938, -0.06906890869140625, -0.052539825439453125, -0.0360107421875, -0.019481658935546875, -0.00295257568359375, 0.013576507568359375, 0.0301055908203125, 0.046634674072265625, 0.06316375732421875, 0.07969284057617188, 0.096221923828125, 0.11275100708007812, 0.12928009033203125, 0.14580917358398438, 0.1623382568359375, 0.17886734008789062, 0.19539642333984375, 0.21192550659179688, 0.22845458984375, 0.24498367309570312, 0.26151275634765625, 0.2780418395996094, 0.2945709228515625, 0.3111000061035156, 0.32762908935546875, 0.3441581726074219, 0.360687255859375, 0.3772163391113281, 0.39374542236328125, 0.4102745056152344, 0.4268035888671875, 0.4433326721191406, 0.45986175537109375, 0.4763908386230469, 0.492919921875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 7.0, 13.0, 14.0, 25.0, 27.0, 47.0, 79.0, 104.0, 120.0, 131.0, 141.0, 89.0, 61.0, 47.0, 23.0, 19.0, 6.0, 12.0, 8.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.650520324707031e-05, -5.495641380548477e-05, -5.340762436389923e-05, -5.185883492231369e-05, -5.031004548072815e-05, -4.876125603914261e-05, -4.721246659755707e-05, -4.566367715597153e-05, -4.4114887714385986e-05, -4.2566098272800446e-05, -4.1017308831214905e-05, -3.9468519389629364e-05, -3.791972994804382e-05, -3.637094050645828e-05, -3.482215106487274e-05, -3.32733616232872e-05, -3.172457218170166e-05, -3.017578274011612e-05, -2.862699329853058e-05, -2.7078203856945038e-05, -2.5529414415359497e-05, -2.3980624973773956e-05, -2.2431835532188416e-05, -2.0883046090602875e-05, -1.9334256649017334e-05, -1.7785467207431793e-05, -1.6236677765846252e-05, -1.4687888324260712e-05, -1.3139098882675171e-05, -1.159030944108963e-05, -1.004151999950409e-05, -8.492730557918549e-06, -6.943941116333008e-06, -5.395151674747467e-06, -3.846362233161926e-06, -2.2975727915763855e-06, -7.487833499908447e-07, 8.00006091594696e-07, 2.348795533180237e-06, 3.897584974765778e-06, 5.446374416351318e-06, 6.995163857936859e-06, 8.5439532995224e-06, 1.009274274110794e-05, 1.1641532182693481e-05, 1.3190321624279022e-05, 1.4739111065864563e-05, 1.6287900507450104e-05, 1.7836689949035645e-05, 1.9385479390621185e-05, 2.0934268832206726e-05, 2.2483058273792267e-05, 2.4031847715377808e-05, 2.558063715696335e-05, 2.712942659854889e-05, 2.867821604013443e-05, 3.022700548171997e-05, 3.177579492330551e-05, 3.332458436489105e-05, 3.487337380647659e-05, 3.6422163248062134e-05, 3.7970952689647675e-05, 3.9519742131233215e-05, 4.1068531572818756e-05, 4.26173210144043e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 12.0, 9.0, 16.0, 21.0, 28.0, 40.0, 83.0, 112.0, 170.0, 325.0, 565.0, 1196.0, 2534.0, 5890.0, 17636.0, 93069.0, 680771.0, 203071.0, 28498.0, 8054.0, 3211.0, 1507.0, 738.0, 406.0, 242.0, 118.0, 76.0, 49.0, 35.0, 23.0, 9.0, 12.0, 4.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.256591796875, -0.24731826782226562, -0.23804473876953125, -0.22877120971679688, -0.2194976806640625, -0.21022415161132812, -0.20095062255859375, -0.19167709350585938, -0.182403564453125, -0.17313003540039062, -0.16385650634765625, -0.15458297729492188, -0.1453094482421875, -0.13603591918945312, -0.12676239013671875, -0.11748886108398438, -0.10821533203125, -0.09894180297851562, -0.08966827392578125, -0.08039474487304688, -0.0711212158203125, -0.061847686767578125, -0.05257415771484375, -0.043300628662109375, -0.034027099609375, -0.024753570556640625, -0.01548004150390625, -0.006206512451171875, 0.0030670166015625, 0.012340545654296875, 0.02161407470703125, 0.030887603759765625, 0.0401611328125, 0.049434661865234375, 0.05870819091796875, 0.06798171997070312, 0.0772552490234375, 0.08652877807617188, 0.09580230712890625, 0.10507583618164062, 0.114349365234375, 0.12362289428710938, 0.13289642333984375, 0.14216995239257812, 0.1514434814453125, 0.16071701049804688, 0.16999053955078125, 0.17926406860351562, 0.18853759765625, 0.19781112670898438, 0.20708465576171875, 0.21635818481445312, 0.2256317138671875, 0.23490524291992188, 0.24417877197265625, 0.2534523010253906, 0.262725830078125, 0.2719993591308594, 0.28127288818359375, 0.2905464172363281, 0.2998199462890625, 0.3090934753417969, 0.31836700439453125, 0.3276405334472656, 0.3369140625]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 6.0, 7.0, 7.0, 14.0, 20.0, 24.0, 35.0, 76.0, 170.0, 178.0, 170.0, 121.0, 68.0, 41.0, 19.0, 9.0, 9.0, 3.0, 8.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2037353515625, -0.19768714904785156, -0.19163894653320312, -0.1855907440185547, -0.17954254150390625, -0.1734943389892578, -0.16744613647460938, -0.16139793395996094, -0.1553497314453125, -0.14930152893066406, -0.14325332641601562, -0.1372051239013672, -0.13115692138671875, -0.1251087188720703, -0.11906051635742188, -0.11301231384277344, -0.106964111328125, -0.10091590881347656, -0.09486770629882812, -0.08881950378417969, -0.08277130126953125, -0.07672309875488281, -0.07067489624023438, -0.06462669372558594, -0.0585784912109375, -0.05253028869628906, -0.046482086181640625, -0.04043388366699219, -0.03438568115234375, -0.028337478637695312, -0.022289276123046875, -0.016241073608398438, -0.01019287109375, -0.0041446685791015625, 0.001903533935546875, 0.007951736450195312, 0.01399993896484375, 0.020048141479492188, 0.026096343994140625, 0.03214454650878906, 0.0381927490234375, 0.04424095153808594, 0.050289154052734375, 0.05633735656738281, 0.06238555908203125, 0.06843376159667969, 0.07448196411132812, 0.08053016662597656, 0.086578369140625, 0.09262657165527344, 0.09867477416992188, 0.10472297668457031, 0.11077117919921875, 0.11681938171386719, 0.12286758422851562, 0.12891578674316406, 0.1349639892578125, 0.14101219177246094, 0.14706039428710938, 0.1531085968017578, 0.15915679931640625, 0.1652050018310547, 0.17125320434570312, 0.17730140686035156, 0.183349609375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 13.0, 166.0, 544.0, 241.0, 34.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6267006397247314, -3.286273241043091, -2.94584584236145, -2.6054186820983887, -2.264991283416748, -1.9245637655258179, -1.5841364860534668, -1.2437090873718262, -0.9032816886901855, -0.5628542900085449, -0.22242695093154907, 0.11800038814544678, 0.4584277868270874, 0.798855185508728, 1.139282464981079, 1.4797098636627197, 1.8201372623443604, 2.160564661026001, 2.5009920597076416, 2.841419219970703, 3.1818466186523438, 3.5222740173339844, 3.862701416015625, 4.203128814697266, 4.543556213378906, 4.883983612060547, 5.2244110107421875, 5.564838409423828, 5.905265808105469, 6.245693206787109, 6.58612060546875, 6.926548004150391, 7.266974449157715, 7.6074018478393555, 7.947829246520996, 8.288256645202637, 8.628684043884277, 8.969111442565918, 9.309538841247559, 9.6499662399292, 9.99039363861084, 10.33082103729248, 10.671248435974121, 11.011675834655762, 11.352103233337402, 11.692530632019043, 12.032958030700684, 12.373385429382324, 12.713811874389648, 13.054239273071289, 13.39466667175293, 13.73509407043457, 14.075521469116211, 14.415948867797852, 14.756376266479492, 15.096803665161133, 15.437231063842773, 15.777658462524414, 16.118085861206055, 16.458513259887695, 16.798940658569336, 17.139368057250977, 17.479795455932617, 17.820222854614258, 18.1606502532959]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 12.0, 19.0, 21.0, 13.0, 19.0, 29.0, 24.0, 37.0, 39.0, 34.0, 46.0, 55.0, 49.0, 57.0, 46.0, 42.0, 45.0, 41.0, 50.0, 27.0, 34.0, 35.0, 32.0, 28.0, 26.0, 22.0, 18.0, 11.0, 17.0, 8.0, 4.0, 10.0, 5.0, 9.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7280319929122925, -1.6656150817871094, -1.6031981706619263, -1.5407812595367432, -1.47836434841156, -1.415947437286377, -1.3535306453704834, -1.2911136150360107, -1.2286968231201172, -1.166279911994934, -1.103863000869751, -1.0414460897445679, -0.9790291786193848, -0.9166122674942017, -0.8541954159736633, -0.7917785048484802, -0.7293615341186523, -0.6669446229934692, -0.6045277118682861, -0.542110800743103, -0.4796939194202423, -0.4172770082950592, -0.3548601269721985, -0.2924432158470154, -0.23002630472183228, -0.16760939359664917, -0.10519249737262726, -0.04277560114860535, 0.01964130997657776, 0.08205822110176086, 0.14447510242462158, 0.2068920135498047, 0.26930904388427734, 0.33172595500946045, 0.39414286613464355, 0.4565597474575043, 0.5189766883850098, 0.5813935995101929, 0.6438104510307312, 0.7062273621559143, 0.7686442732810974, 0.8310611844062805, 0.8934780955314636, 0.955894947052002, 1.018311858177185, 1.0807287693023682, 1.1431456804275513, 1.2055625915527344, 1.2679795026779175, 1.3303964138031006, 1.3928133249282837, 1.4552302360534668, 1.51764714717865, 1.580064058303833, 1.6424808502197266, 1.7048978805541992, 1.7673146724700928, 1.8297315835952759, 1.892148494720459, 1.954565405845642, 2.016982316970825, 2.0793991088867188, 2.1418161392211914, 2.204232931137085, 2.2666499614715576]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 16.0, 17.0, 17.0, 31.0, 37.0, 43.0, 84.0, 154.0, 384.0, 1462.0, 8976.0, 252547.0, 3845120.0, 78625.0, 5248.0, 925.0, 264.0, 117.0, 67.0, 47.0, 27.0, 18.0, 11.0, 19.0, 9.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5234375, -3.433929443359375, -3.34442138671875, -3.254913330078125, -3.1654052734375, -3.075897216796875, -2.98638916015625, -2.896881103515625, -2.807373046875, -2.717864990234375, -2.62835693359375, -2.538848876953125, -2.4493408203125, -2.359832763671875, -2.27032470703125, -2.180816650390625, -2.09130859375, -2.001800537109375, -1.91229248046875, -1.822784423828125, -1.7332763671875, -1.643768310546875, -1.55426025390625, -1.464752197265625, -1.375244140625, -1.285736083984375, -1.19622802734375, -1.106719970703125, -1.0172119140625, -0.927703857421875, -0.83819580078125, -0.748687744140625, -0.6591796875, -0.569671630859375, -0.48016357421875, -0.390655517578125, -0.3011474609375, -0.211639404296875, -0.12213134765625, -0.032623291015625, 0.056884765625, 0.146392822265625, 0.23590087890625, 0.325408935546875, 0.4149169921875, 0.504425048828125, 0.59393310546875, 0.683441162109375, 0.77294921875, 0.862457275390625, 0.95196533203125, 1.041473388671875, 1.1309814453125, 1.220489501953125, 1.30999755859375, 1.399505615234375, 1.489013671875, 1.578521728515625, 1.66802978515625, 1.757537841796875, 1.8470458984375, 1.936553955078125, 2.02606201171875, 2.115570068359375, 2.205078125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 13.0, 7.0, 13.0, 18.0, 15.0, 22.0, 22.0, 26.0, 25.0, 36.0, 46.0, 45.0, 60.0, 56.0, 54.0, 61.0, 59.0, 46.0, 46.0, 47.0, 57.0, 48.0, 23.0, 29.0, 21.0, 20.0, 13.0, 11.0, 11.0, 8.0, 4.0, 8.0, 2.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.79931640625, -0.776123046875, -0.7529296875, -0.729736328125, -0.70654296875, -0.683349609375, -0.66015625, -0.636962890625, -0.61376953125, -0.590576171875, -0.5673828125, -0.544189453125, -0.52099609375, -0.497802734375, -0.474609375, -0.451416015625, -0.42822265625, -0.405029296875, -0.3818359375, -0.358642578125, -0.33544921875, -0.312255859375, -0.2890625, -0.265869140625, -0.24267578125, -0.219482421875, -0.1962890625, -0.173095703125, -0.14990234375, -0.126708984375, -0.103515625, -0.080322265625, -0.05712890625, -0.033935546875, -0.0107421875, 0.012451171875, 0.03564453125, 0.058837890625, 0.08203125, 0.105224609375, 0.12841796875, 0.151611328125, 0.1748046875, 0.197998046875, 0.22119140625, 0.244384765625, 0.267578125, 0.290771484375, 0.31396484375, 0.337158203125, 0.3603515625, 0.383544921875, 0.40673828125, 0.429931640625, 0.453125, 0.476318359375, 0.49951171875, 0.522705078125, 0.5458984375, 0.569091796875, 0.59228515625, 0.615478515625, 0.638671875, 0.661865234375, 0.68505859375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 11.0, 24.0, 54.0, 134.0, 556.0, 19706.0, 4162949.0, 10191.0, 459.0, 107.0, 36.0, 13.0, 8.0, 4.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41015625, -6.22930908203125, -6.0484619140625, -5.86761474609375, -5.686767578125, -5.50592041015625, -5.3250732421875, -5.14422607421875, -4.96337890625, -4.78253173828125, -4.6016845703125, -4.42083740234375, -4.239990234375, -4.05914306640625, -3.8782958984375, -3.69744873046875, -3.5166015625, -3.33575439453125, -3.1549072265625, -2.97406005859375, -2.793212890625, -2.61236572265625, -2.4315185546875, -2.25067138671875, -2.06982421875, -1.88897705078125, -1.7081298828125, -1.52728271484375, -1.346435546875, -1.16558837890625, -0.9847412109375, -0.80389404296875, -0.623046875, -0.44219970703125, -0.2613525390625, -0.08050537109375, 0.100341796875, 0.28118896484375, 0.4620361328125, 0.64288330078125, 0.82373046875, 1.00457763671875, 1.1854248046875, 1.36627197265625, 1.547119140625, 1.72796630859375, 1.9088134765625, 2.08966064453125, 2.2705078125, 2.45135498046875, 2.6322021484375, 2.81304931640625, 2.993896484375, 3.17474365234375, 3.3555908203125, 3.53643798828125, 3.71728515625, 3.89813232421875, 4.0789794921875, 4.25982666015625, 4.440673828125, 4.62152099609375, 4.8023681640625, 4.98321533203125, 5.1640625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 5.0, 8.0, 15.0, 6.0, 14.0, 17.0, 29.0, 33.0, 50.0, 100.0, 137.0, 164.0, 257.0, 393.0, 611.0, 725.0, 479.0, 328.0, 207.0, 137.0, 81.0, 75.0, 51.0, 39.0, 21.0, 13.0, 19.0, 11.0, 14.0, 12.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.27099609375, -0.2619972229003906, -0.25299835205078125, -0.24399948120117188, -0.2350006103515625, -0.22600173950195312, -0.21700286865234375, -0.20800399780273438, -0.199005126953125, -0.19000625610351562, -0.18100738525390625, -0.17200851440429688, -0.1630096435546875, -0.15401077270507812, -0.14501190185546875, -0.13601303100585938, -0.12701416015625, -0.11801528930664062, -0.10901641845703125, -0.10001754760742188, -0.0910186767578125, -0.08201980590820312, -0.07302093505859375, -0.06402206420898438, -0.055023193359375, -0.046024322509765625, -0.03702545166015625, -0.028026580810546875, -0.0190277099609375, -0.010028839111328125, -0.00102996826171875, 0.007968902587890625, 0.0169677734375, 0.025966644287109375, 0.03496551513671875, 0.043964385986328125, 0.0529632568359375, 0.061962127685546875, 0.07096099853515625, 0.07995986938476562, 0.088958740234375, 0.09795761108398438, 0.10695648193359375, 0.11595535278320312, 0.1249542236328125, 0.13395309448242188, 0.14295196533203125, 0.15195083618164062, 0.16094970703125, 0.16994857788085938, 0.17894744873046875, 0.18794631958007812, 0.1969451904296875, 0.20594406127929688, 0.21494293212890625, 0.22394180297851562, 0.232940673828125, 0.24193954467773438, 0.25093841552734375, 0.2599372863769531, 0.2689361572265625, 0.2779350280761719, 0.28693389892578125, 0.2959327697753906, 0.304931640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 8.0, 11.0, 15.0, 23.0, 40.0, 65.0, 67.0, 96.0, 119.0, 125.0, 118.0, 94.0, 60.0, 45.0, 30.0, 23.0, 10.0, 12.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7117741107940674, -1.665800929069519, -1.6198277473449707, -1.573854684829712, -1.5278815031051636, -1.4819083213806152, -1.435935139656067, -1.3899619579315186, -1.3439888954162598, -1.2980157136917114, -1.252042531967163, -1.2060694694519043, -1.160096287727356, -1.1141231060028076, -1.0681499242782593, -1.022176742553711, -0.9762036204338074, -0.930230438709259, -0.8842573165893555, -0.8382841348648071, -0.7923110127449036, -0.7463378310203552, -0.7003647089004517, -0.6543915271759033, -0.608418345451355, -0.5624451637268066, -0.5164720416069031, -0.47049885988235474, -0.42452573776245117, -0.37855255603790283, -0.3325794041156769, -0.2866062521934509, -0.24063313007354736, -0.1946599781513214, -0.14868682622909546, -0.10271365940570831, -0.05674050748348236, -0.010767355561256409, 0.03520581126213074, 0.08117896318435669, 0.12715211510658264, 0.1731252670288086, 0.21909841895103455, 0.2650715708732605, 0.31104475259780884, 0.3570178747177124, 0.40299105644226074, 0.4489642083644867, 0.49493736028671265, 0.540910542011261, 0.5868836641311646, 0.6328568458557129, 0.6788299679756165, 0.7248031497001648, 0.7707762718200684, 0.8167494535446167, 0.862722635269165, 0.9086958169937134, 0.9546689391136169, 1.0006420612335205, 1.0466152429580688, 1.0925884246826172, 1.1385616064071655, 1.1845347881317139, 1.2305078506469727]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 4.0, 5.0, 7.0, 6.0, 9.0, 10.0, 15.0, 13.0, 18.0, 17.0, 19.0, 27.0, 40.0, 34.0, 45.0, 58.0, 55.0, 54.0, 52.0, 42.0, 54.0, 50.0, 43.0, 45.0, 47.0, 41.0, 41.0, 24.0, 30.0, 19.0, 17.0, 14.0, 12.0, 7.0, 12.0, 3.0, 5.0, 1.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6875497102737427, -0.6619414687156677, -0.6363332271575928, -0.6107249855995178, -0.5851167440414429, -0.5595084428787231, -0.5339002013206482, -0.5082919597625732, -0.4826837182044983, -0.45707547664642334, -0.4314672350883484, -0.40585896372795105, -0.3802507221698761, -0.35464248061180115, -0.3290342092514038, -0.30342596769332886, -0.2778177261352539, -0.25220948457717896, -0.2266012281179428, -0.20099297165870667, -0.1753847301006317, -0.14977648854255676, -0.12416823208332062, -0.09855997562408447, -0.07295173406600952, -0.04734348505735397, -0.021735236048698425, 0.003873012959957123, 0.02948126196861267, 0.05508950352668762, 0.08069775998592377, 0.10630601644515991, 0.13191425800323486, 0.15752249956130981, 0.18313075602054596, 0.2087390124797821, 0.23434725403785706, 0.259955495595932, 0.28556376695632935, 0.3111720085144043, 0.33678025007247925, 0.3623884916305542, 0.38799673318862915, 0.4136050045490265, 0.43921324610710144, 0.4648214876651764, 0.49042975902557373, 0.5160380005836487, 0.5416462421417236, 0.5672544836997986, 0.5928627252578735, 0.6184709668159485, 0.6440792083740234, 0.6696875095367432, 0.6952957510948181, 0.7209039926528931, 0.746512234210968, 0.772120475769043, 0.7977287173271179, 0.8233369588851929, 0.8489452600479126, 0.8745534420013428, 0.9001617431640625, 0.9257699847221375, 0.9513782262802124]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 10.0, 11.0, 18.0, 33.0, 55.0, 109.0, 192.0, 422.0, 920.0, 2373.0, 6786.0, 26600.0, 167301.0, 670373.0, 140018.0, 23575.0, 6058.0, 2064.0, 838.0, 379.0, 192.0, 102.0, 40.0, 25.0, 20.0, 8.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.51171875, -0.4968681335449219, -0.48201751708984375, -0.4671669006347656, -0.4523162841796875, -0.4374656677246094, -0.42261505126953125, -0.4077644348144531, -0.392913818359375, -0.3780632019042969, -0.36321258544921875, -0.3483619689941406, -0.3335113525390625, -0.3186607360839844, -0.30381011962890625, -0.2889595031738281, -0.27410888671875, -0.2592582702636719, -0.24440765380859375, -0.22955703735351562, -0.2147064208984375, -0.19985580444335938, -0.18500518798828125, -0.17015457153320312, -0.155303955078125, -0.14045333862304688, -0.12560272216796875, -0.11075210571289062, -0.0959014892578125, -0.08105087280273438, -0.06620025634765625, -0.051349639892578125, -0.0364990234375, -0.021648406982421875, -0.00679779052734375, 0.008052825927734375, 0.0229034423828125, 0.037754058837890625, 0.05260467529296875, 0.06745529174804688, 0.082305908203125, 0.09715652465820312, 0.11200714111328125, 0.12685775756835938, 0.1417083740234375, 0.15655899047851562, 0.17140960693359375, 0.18626022338867188, 0.20111083984375, 0.21596145629882812, 0.23081207275390625, 0.24566268920898438, 0.2605133056640625, 0.2753639221191406, 0.29021453857421875, 0.3050651550292969, 0.319915771484375, 0.3347663879394531, 0.34961700439453125, 0.3644676208496094, 0.3793182373046875, 0.3941688537597656, 0.40901947021484375, 0.4238700866699219, 0.438720703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 7.0, 3.0, 2.0, 11.0, 7.0, 10.0, 10.0, 18.0, 24.0, 17.0, 28.0, 28.0, 31.0, 41.0, 40.0, 53.0, 63.0, 50.0, 53.0, 55.0, 47.0, 45.0, 43.0, 45.0, 50.0, 37.0, 34.0, 23.0, 23.0, 15.0, 16.0, 12.0, 13.0, 10.0, 12.0, 7.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.53564453125, -0.5204238891601562, -0.5052032470703125, -0.48998260498046875, -0.474761962890625, -0.45954132080078125, -0.4443206787109375, -0.42910003662109375, -0.41387939453125, -0.39865875244140625, -0.3834381103515625, -0.36821746826171875, -0.352996826171875, -0.33777618408203125, -0.3225555419921875, -0.30733489990234375, -0.2921142578125, -0.27689361572265625, -0.2616729736328125, -0.24645233154296875, -0.231231689453125, -0.21601104736328125, -0.2007904052734375, -0.18556976318359375, -0.17034912109375, -0.15512847900390625, -0.1399078369140625, -0.12468719482421875, -0.109466552734375, -0.09424591064453125, -0.0790252685546875, -0.06380462646484375, -0.048583984375, -0.03336334228515625, -0.0181427001953125, -0.00292205810546875, 0.012298583984375, 0.02751922607421875, 0.0427398681640625, 0.05796051025390625, 0.07318115234375, 0.08840179443359375, 0.1036224365234375, 0.11884307861328125, 0.134063720703125, 0.14928436279296875, 0.1645050048828125, 0.17972564697265625, 0.1949462890625, 0.21016693115234375, 0.2253875732421875, 0.24060821533203125, 0.255828857421875, 0.27104949951171875, 0.2862701416015625, 0.30149078369140625, 0.31671142578125, 0.33193206787109375, 0.3471527099609375, 0.36237335205078125, 0.377593994140625, 0.39281463623046875, 0.4080352783203125, 0.42325592041015625, 0.4384765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 5.0, 5.0, 6.0, 8.0, 12.0, 26.0, 22.0, 46.0, 42.0, 95.0, 130.0, 266.0, 444.0, 867.0, 1986.0, 4717.0, 14209.0, 55964.0, 345557.0, 509751.0, 84080.0, 19183.0, 6266.0, 2494.0, 1073.0, 527.0, 294.0, 167.0, 110.0, 61.0, 51.0, 24.0, 19.0, 10.0, 10.0, 12.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2998046875, -0.29047393798828125, -0.2811431884765625, -0.27181243896484375, -0.262481689453125, -0.25315093994140625, -0.2438201904296875, -0.23448944091796875, -0.22515869140625, -0.21582794189453125, -0.2064971923828125, -0.19716644287109375, -0.187835693359375, -0.17850494384765625, -0.1691741943359375, -0.15984344482421875, -0.1505126953125, -0.14118194580078125, -0.1318511962890625, -0.12252044677734375, -0.113189697265625, -0.10385894775390625, -0.0945281982421875, -0.08519744873046875, -0.07586669921875, -0.06653594970703125, -0.0572052001953125, -0.04787445068359375, -0.038543701171875, -0.02921295166015625, -0.0198822021484375, -0.01055145263671875, -0.001220703125, 0.00811004638671875, 0.0174407958984375, 0.02677154541015625, 0.036102294921875, 0.04543304443359375, 0.0547637939453125, 0.06409454345703125, 0.07342529296875, 0.08275604248046875, 0.0920867919921875, 0.10141754150390625, 0.110748291015625, 0.12007904052734375, 0.1294097900390625, 0.13874053955078125, 0.1480712890625, 0.15740203857421875, 0.1667327880859375, 0.17606353759765625, 0.185394287109375, 0.19472503662109375, 0.2040557861328125, 0.21338653564453125, 0.22271728515625, 0.23204803466796875, 0.2413787841796875, 0.25070953369140625, 0.260040283203125, 0.26937103271484375, 0.2787017822265625, 0.28803253173828125, 0.29736328125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 5.0, 7.0, 13.0, 5.0, 14.0, 16.0, 20.0, 25.0, 31.0, 32.0, 40.0, 36.0, 42.0, 38.0, 37.0, 40.0, 46.0, 48.0, 48.0, 43.0, 43.0, 39.0, 36.0, 34.0, 30.0, 34.0, 32.0, 26.0, 25.0, 18.0, 20.0, 17.0, 13.0, 8.0, 5.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.77880859375, -0.7529220581054688, -0.7270355224609375, -0.7011489868164062, -0.675262451171875, -0.6493759155273438, -0.6234893798828125, -0.5976028442382812, -0.57171630859375, -0.5458297729492188, -0.5199432373046875, -0.49405670166015625, -0.468170166015625, -0.44228363037109375, -0.4163970947265625, -0.39051055908203125, -0.3646240234375, -0.33873748779296875, -0.3128509521484375, -0.28696441650390625, -0.261077880859375, -0.23519134521484375, -0.2093048095703125, -0.18341827392578125, -0.15753173828125, -0.13164520263671875, -0.1057586669921875, -0.07987213134765625, -0.053985595703125, -0.02809906005859375, -0.0022125244140625, 0.02367401123046875, 0.049560546875, 0.07544708251953125, 0.1013336181640625, 0.12722015380859375, 0.153106689453125, 0.17899322509765625, 0.2048797607421875, 0.23076629638671875, 0.25665283203125, 0.28253936767578125, 0.3084259033203125, 0.33431243896484375, 0.360198974609375, 0.38608551025390625, 0.4119720458984375, 0.43785858154296875, 0.4637451171875, 0.48963165283203125, 0.5155181884765625, 0.5414047241210938, 0.567291259765625, 0.5931777954101562, 0.6190643310546875, 0.6449508666992188, 0.67083740234375, 0.6967239379882812, 0.7226104736328125, 0.7484970092773438, 0.774383544921875, 0.8002700805664062, 0.8261566162109375, 0.8520431518554688, 0.8779296875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 10.0, 15.0, 21.0, 32.0, 43.0, 93.0, 187.0, 314.0, 741.0, 1848.0, 5876.0, 33158.0, 694486.0, 287382.0, 17775.0, 4155.0, 1340.0, 551.0, 243.0, 118.0, 65.0, 27.0, 30.0, 9.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152587890625, -0.14490127563476562, -0.13721466064453125, -0.12952804565429688, -0.1218414306640625, -0.11415481567382812, -0.10646820068359375, -0.09878158569335938, -0.091094970703125, -0.08340835571289062, -0.07572174072265625, -0.06803512573242188, -0.0603485107421875, -0.052661895751953125, -0.04497528076171875, -0.037288665771484375, -0.02960205078125, -0.021915435791015625, -0.01422882080078125, -0.006542205810546875, 0.0011444091796875, 0.008831024169921875, 0.01651763916015625, 0.024204254150390625, 0.031890869140625, 0.039577484130859375, 0.04726409912109375, 0.054950714111328125, 0.0626373291015625, 0.07032394409179688, 0.07801055908203125, 0.08569717407226562, 0.0933837890625, 0.10107040405273438, 0.10875701904296875, 0.11644363403320312, 0.1241302490234375, 0.13181686401367188, 0.13950347900390625, 0.14719009399414062, 0.154876708984375, 0.16256332397460938, 0.17024993896484375, 0.17793655395507812, 0.1856231689453125, 0.19330978393554688, 0.20099639892578125, 0.20868301391601562, 0.21636962890625, 0.22405624389648438, 0.23174285888671875, 0.23942947387695312, 0.2471160888671875, 0.2548027038574219, 0.26248931884765625, 0.2701759338378906, 0.277862548828125, 0.2855491638183594, 0.29323577880859375, 0.3009223937988281, 0.3086090087890625, 0.3162956237792969, 0.32398223876953125, 0.3316688537597656, 0.33935546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 14.0, 16.0, 19.0, 25.0, 40.0, 60.0, 98.0, 127.0, 125.0, 126.0, 113.0, 61.0, 48.0, 31.0, 15.0, 16.0, 8.0, 8.0, 7.0, 9.0, 4.0, 4.0, 1.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.91278076171875e-05, -5.671940743923187e-05, -5.4311007261276245e-05, -5.190260708332062e-05, -4.949420690536499e-05, -4.708580672740936e-05, -4.4677406549453735e-05, -4.226900637149811e-05, -3.986060619354248e-05, -3.745220601558685e-05, -3.5043805837631226e-05, -3.26354056596756e-05, -3.022700548171997e-05, -2.7818605303764343e-05, -2.5410205125808716e-05, -2.300180494785309e-05, -2.059340476989746e-05, -1.8185004591941833e-05, -1.5776604413986206e-05, -1.3368204236030579e-05, -1.0959804058074951e-05, -8.551403880119324e-06, -6.143003702163696e-06, -3.734603524208069e-06, -1.3262033462524414e-06, 1.082196831703186e-06, 3.4905970096588135e-06, 5.898997187614441e-06, 8.307397365570068e-06, 1.0715797543525696e-05, 1.3124197721481323e-05, 1.553259789943695e-05, 1.7940998077392578e-05, 2.0349398255348206e-05, 2.2757798433303833e-05, 2.516619861125946e-05, 2.7574598789215088e-05, 2.9982998967170715e-05, 3.239139914512634e-05, 3.479979932308197e-05, 3.72081995010376e-05, 3.9616599678993225e-05, 4.202499985694885e-05, 4.443340003490448e-05, 4.684180021286011e-05, 4.9250200390815735e-05, 5.165860056877136e-05, 5.406700074672699e-05, 5.647540092468262e-05, 5.8883801102638245e-05, 6.129220128059387e-05, 6.37006014585495e-05, 6.610900163650513e-05, 6.851740181446075e-05, 7.092580199241638e-05, 7.333420217037201e-05, 7.574260234832764e-05, 7.815100252628326e-05, 8.055940270423889e-05, 8.296780288219452e-05, 8.537620306015015e-05, 8.778460323810577e-05, 9.01930034160614e-05, 9.260140359401703e-05, 9.500980377197266e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 6.0, 13.0, 27.0, 25.0, 44.0, 65.0, 88.0, 190.0, 276.0, 509.0, 937.0, 2008.0, 5075.0, 18600.0, 134701.0, 719955.0, 137771.0, 18700.0, 5224.0, 2093.0, 988.0, 494.0, 313.0, 160.0, 97.0, 64.0, 31.0, 27.0, 21.0, 18.0, 11.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.212158203125, -0.20618247985839844, -0.20020675659179688, -0.1942310333251953, -0.18825531005859375, -0.1822795867919922, -0.17630386352539062, -0.17032814025878906, -0.1643524169921875, -0.15837669372558594, -0.15240097045898438, -0.1464252471923828, -0.14044952392578125, -0.1344738006591797, -0.12849807739257812, -0.12252235412597656, -0.116546630859375, -0.11057090759277344, -0.10459518432617188, -0.09861946105957031, -0.09264373779296875, -0.08666801452636719, -0.08069229125976562, -0.07471656799316406, -0.0687408447265625, -0.06276512145996094, -0.056789398193359375, -0.05081367492675781, -0.04483795166015625, -0.03886222839355469, -0.032886505126953125, -0.026910781860351562, -0.02093505859375, -0.014959335327148438, -0.008983612060546875, -0.0030078887939453125, 0.00296783447265625, 0.008943557739257812, 0.014919281005859375, 0.020895004272460938, 0.0268707275390625, 0.03284645080566406, 0.038822174072265625, 0.04479789733886719, 0.05077362060546875, 0.05674934387207031, 0.06272506713867188, 0.06870079040527344, 0.074676513671875, 0.08065223693847656, 0.08662796020507812, 0.09260368347167969, 0.09857940673828125, 0.10455513000488281, 0.11053085327148438, 0.11650657653808594, 0.1224822998046875, 0.12845802307128906, 0.13443374633789062, 0.1404094696044922, 0.14638519287109375, 0.1523609161376953, 0.15833663940429688, 0.16431236267089844, 0.1702880859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 9.0, 16.0, 8.0, 31.0, 49.0, 59.0, 102.0, 148.0, 147.0, 155.0, 85.0, 67.0, 42.0, 30.0, 18.0, 7.0, 11.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.053314208984375, -0.05176115036010742, -0.050208091735839844, -0.048655033111572266, -0.04710197448730469, -0.04554891586303711, -0.04399585723876953, -0.04244279861450195, -0.040889739990234375, -0.0393366813659668, -0.03778362274169922, -0.03623056411743164, -0.03467750549316406, -0.033124446868896484, -0.031571388244628906, -0.030018329620361328, -0.02846527099609375, -0.026912212371826172, -0.025359153747558594, -0.023806095123291016, -0.022253036499023438, -0.02069997787475586, -0.01914691925048828, -0.017593860626220703, -0.016040802001953125, -0.014487743377685547, -0.012934684753417969, -0.01138162612915039, -0.009828567504882812, -0.008275508880615234, -0.006722450256347656, -0.005169391632080078, -0.0036163330078125, -0.002063274383544922, -0.0005102157592773438, 0.0010428428649902344, 0.0025959014892578125, 0.004148960113525391, 0.005702018737792969, 0.007255077362060547, 0.008808135986328125, 0.010361194610595703, 0.011914253234863281, 0.01346731185913086, 0.015020370483398438, 0.016573429107666016, 0.018126487731933594, 0.019679546356201172, 0.02123260498046875, 0.022785663604736328, 0.024338722229003906, 0.025891780853271484, 0.027444839477539062, 0.02899789810180664, 0.03055095672607422, 0.0321040153503418, 0.033657073974609375, 0.03521013259887695, 0.03676319122314453, 0.03831624984741211, 0.03986930847167969, 0.041422367095947266, 0.042975425720214844, 0.04452848434448242, 0.04608154296875]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 14.0, 10.0, 24.0, 46.0, 67.0, 101.0, 146.0, 157.0, 157.0, 87.0, 70.0, 41.0, 19.0, 12.0, 9.0, 7.0, 4.0, 7.0, 2.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.3876785039901733, -1.3533293008804321, -1.3189799785614014, -1.2846307754516602, -1.250281572341919, -1.2159322500228882, -1.181583046913147, -1.1472338438034058, -1.112884521484375, -1.0785353183746338, -1.044185996055603, -1.0098367929458618, -0.9754875302314758, -0.9411382675170898, -0.9067890644073486, -0.8724398016929626, -0.8380905985832214, -0.8037413358688354, -0.7693921327590942, -0.7350428700447083, -0.7006936073303223, -0.666344404220581, -0.6319951415061951, -0.5976458787918091, -0.5632966756820679, -0.5289474129676819, -0.4945981800556183, -0.4602489471435547, -0.4258996844291687, -0.3915504515171051, -0.3572012186050415, -0.3228519558906555, -0.28850269317626953, -0.25415346026420593, -0.21980419754981995, -0.18545496463775635, -0.15110571682453156, -0.11675646901130676, -0.08240723609924316, -0.04805798828601837, -0.013708740472793579, 0.020640503615140915, 0.05498974770307541, 0.0893389880657196, 0.1236882358789444, 0.1580374836921692, 0.1923867166042328, 0.22673596441745758, 0.2610852122306824, 0.29543444514274597, 0.32978370785713196, 0.36413294076919556, 0.39848220348358154, 0.43283143639564514, 0.46718066930770874, 0.5015299320220947, 0.5358791351318359, 0.5702283978462219, 0.6045776009559631, 0.6389268636703491, 0.6732761263847351, 0.7076253890991211, 0.7419745922088623, 0.7763238549232483, 0.8106731176376343]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 3.0, 5.0, 9.0, 12.0, 17.0, 16.0, 13.0, 26.0, 26.0, 27.0, 37.0, 47.0, 49.0, 75.0, 54.0, 55.0, 56.0, 56.0, 58.0, 46.0, 50.0, 44.0, 44.0, 30.0, 32.0, 11.0, 17.0, 13.0, 13.0, 13.0, 7.0, 8.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4653225243091583, -0.4494207203388214, -0.4335188865661621, -0.4176170825958252, -0.4017152786254883, -0.38581347465515137, -0.36991167068481445, -0.35400983691215515, -0.33810803294181824, -0.3222062289714813, -0.306304395198822, -0.2904025912284851, -0.2745007872581482, -0.2585989832878113, -0.24269716441631317, -0.22679534554481506, -0.21089354157447815, -0.19499173760414124, -0.17908991873264313, -0.16318809986114502, -0.1472862958908081, -0.1313844919204712, -0.11548267304897308, -0.09958086162805557, -0.08367905020713806, -0.06777723878622055, -0.05187542736530304, -0.03597361594438553, -0.020071804523468018, -0.004169993102550507, 0.011731818318367004, 0.027633629739284515, 0.04353541135787964, 0.05943722277879715, 0.07533903419971466, 0.09124084562063217, 0.10714265704154968, 0.1230444684624672, 0.1389462798833847, 0.1548480987548828, 0.17074990272521973, 0.18665170669555664, 0.20255352556705475, 0.21845534443855286, 0.23435714840888977, 0.2502589523792267, 0.266160786151886, 0.2820625901222229, 0.2979643940925598, 0.31386619806289673, 0.32976800203323364, 0.34566983580589294, 0.36157163977622986, 0.3774734437465668, 0.3933752775192261, 0.409277081489563, 0.4251788854598999, 0.4410806894302368, 0.45698249340057373, 0.47288432717323303, 0.48878613114356995, 0.5046879649162292, 0.5205897688865662, 0.5364915728569031, 0.55239337682724]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 9.0, 12.0, 9.0, 28.0, 37.0, 68.0, 99.0, 182.0, 275.0, 497.0, 1003.0, 1855.0, 4036.0, 9772.0, 30354.0, 180402.0, 662631.0, 118373.0, 23823.0, 8023.0, 3358.0, 1643.0, 890.0, 459.0, 287.0, 160.0, 89.0, 75.0, 36.0, 24.0, 13.0, 10.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9541015625, -0.9263687133789062, -0.8986358642578125, -0.8709030151367188, -0.843170166015625, -0.8154373168945312, -0.7877044677734375, -0.7599716186523438, -0.73223876953125, -0.7045059204101562, -0.6767730712890625, -0.6490402221679688, -0.621307373046875, -0.5935745239257812, -0.5658416748046875, -0.5381088256835938, -0.5103759765625, -0.48264312744140625, -0.4549102783203125, -0.42717742919921875, -0.399444580078125, -0.37171173095703125, -0.3439788818359375, -0.31624603271484375, -0.28851318359375, -0.26078033447265625, -0.2330474853515625, -0.20531463623046875, -0.177581787109375, -0.14984893798828125, -0.1221160888671875, -0.09438323974609375, -0.066650390625, -0.03891754150390625, -0.0111846923828125, 0.01654815673828125, 0.044281005859375, 0.07201385498046875, 0.0997467041015625, 0.12747955322265625, 0.15521240234375, 0.18294525146484375, 0.2106781005859375, 0.23841094970703125, 0.266143798828125, 0.29387664794921875, 0.3216094970703125, 0.34934234619140625, 0.3770751953125, 0.40480804443359375, 0.4325408935546875, 0.46027374267578125, 0.488006591796875, 0.5157394409179688, 0.5434722900390625, 0.5712051391601562, 0.59893798828125, 0.6266708374023438, 0.6544036865234375, 0.6821365356445312, 0.709869384765625, 0.7376022338867188, 0.7653350830078125, 0.7930679321289062, 0.82080078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 8.0, 7.0, 7.0, 17.0, 18.0, 26.0, 25.0, 28.0, 38.0, 48.0, 55.0, 48.0, 56.0, 69.0, 69.0, 62.0, 62.0, 52.0, 60.0, 47.0, 34.0, 37.0, 28.0, 23.0, 12.0, 14.0, 12.0, 6.0, 5.0, 5.0, 3.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2822265625, -1.240234375, -1.1982421875, -1.15625, -1.1142578125, -1.072265625, -1.0302734375, -0.98828125, -0.9462890625, -0.904296875, -0.8623046875, -0.8203125, -0.7783203125, -0.736328125, -0.6943359375, -0.65234375, -0.6103515625, -0.568359375, -0.5263671875, -0.484375, -0.4423828125, -0.400390625, -0.3583984375, -0.31640625, -0.2744140625, -0.232421875, -0.1904296875, -0.1484375, -0.1064453125, -0.064453125, -0.0224609375, 0.01953125, 0.0615234375, 0.103515625, 0.1455078125, 0.1875, 0.2294921875, 0.271484375, 0.3134765625, 0.35546875, 0.3974609375, 0.439453125, 0.4814453125, 0.5234375, 0.5654296875, 0.607421875, 0.6494140625, 0.69140625, 0.7333984375, 0.775390625, 0.8173828125, 0.859375, 0.9013671875, 0.943359375, 0.9853515625, 1.02734375, 1.0693359375, 1.111328125, 1.1533203125, 1.1953125, 1.2373046875, 1.279296875, 1.3212890625, 1.36328125, 1.4052734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 5.0, 5.0, 6.0, 10.0, 9.0, 13.0, 16.0, 14.0, 27.0, 27.0, 50.0, 34.0, 38.0, 44.0, 105.0, 300.0, 4763.0, 1001645.0, 40078.0, 862.0, 138.0, 59.0, 45.0, 43.0, 45.0, 25.0, 15.0, 27.0, 19.0, 15.0, 11.0, 8.0, 16.0, 9.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.6640625, -4.533538818359375, -4.40301513671875, -4.272491455078125, -4.1419677734375, -4.011444091796875, -3.88092041015625, -3.750396728515625, -3.619873046875, -3.489349365234375, -3.35882568359375, -3.228302001953125, -3.0977783203125, -2.967254638671875, -2.83673095703125, -2.706207275390625, -2.57568359375, -2.445159912109375, -2.31463623046875, -2.184112548828125, -2.0535888671875, -1.923065185546875, -1.79254150390625, -1.662017822265625, -1.531494140625, -1.400970458984375, -1.27044677734375, -1.139923095703125, -1.0093994140625, -0.878875732421875, -0.74835205078125, -0.617828369140625, -0.4873046875, -0.356781005859375, -0.22625732421875, -0.095733642578125, 0.0347900390625, 0.165313720703125, 0.29583740234375, 0.426361083984375, 0.556884765625, 0.687408447265625, 0.81793212890625, 0.948455810546875, 1.0789794921875, 1.209503173828125, 1.34002685546875, 1.470550537109375, 1.60107421875, 1.731597900390625, 1.86212158203125, 1.992645263671875, 2.1231689453125, 2.253692626953125, 2.38421630859375, 2.514739990234375, 2.645263671875, 2.775787353515625, 2.90631103515625, 3.036834716796875, 3.1673583984375, 3.297882080078125, 3.42840576171875, 3.558929443359375, 3.689453125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 5.0, 8.0, 7.0, 7.0, 15.0, 21.0, 25.0, 18.0, 39.0, 37.0, 49.0, 38.0, 38.0, 61.0, 42.0, 50.0, 36.0, 43.0, 55.0, 39.0, 54.0, 35.0, 40.0, 39.0, 20.0, 30.0, 19.0, 18.0, 18.0, 11.0, 10.0, 10.0, 12.0, 7.0, 12.0, 1.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0], "bins": [-1.3603515625, -1.3231658935546875, -1.285980224609375, -1.2487945556640625, -1.21160888671875, -1.1744232177734375, -1.137237548828125, -1.1000518798828125, -1.0628662109375, -1.0256805419921875, -0.988494873046875, -0.9513092041015625, -0.91412353515625, -0.8769378662109375, -0.839752197265625, -0.8025665283203125, -0.765380859375, -0.7281951904296875, -0.691009521484375, -0.6538238525390625, -0.61663818359375, -0.5794525146484375, -0.542266845703125, -0.5050811767578125, -0.4678955078125, -0.4307098388671875, -0.393524169921875, -0.3563385009765625, -0.31915283203125, -0.2819671630859375, -0.244781494140625, -0.2075958251953125, -0.17041015625, -0.1332244873046875, -0.096038818359375, -0.0588531494140625, -0.02166748046875, 0.0155181884765625, 0.052703857421875, 0.0898895263671875, 0.1270751953125, 0.1642608642578125, 0.201446533203125, 0.2386322021484375, 0.27581787109375, 0.3130035400390625, 0.350189208984375, 0.3873748779296875, 0.424560546875, 0.4617462158203125, 0.498931884765625, 0.5361175537109375, 0.57330322265625, 0.6104888916015625, 0.647674560546875, 0.6848602294921875, 0.7220458984375, 0.7592315673828125, 0.796417236328125, 0.8336029052734375, 0.87078857421875, 0.9079742431640625, 0.945159912109375, 0.9823455810546875, 1.01953125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 7.0, 13.0, 9.0, 19.0, 14.0, 28.0, 43.0, 56.0, 80.0, 121.0, 227.0, 444.0, 830.0, 2227.0, 6488.0, 23249.0, 103614.0, 465272.0, 349660.0, 70975.0, 16821.0, 4966.0, 1711.0, 727.0, 373.0, 216.0, 112.0, 72.0, 38.0, 35.0, 40.0, 13.0, 8.0, 13.0, 6.0, 10.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1634521484375, -0.15798187255859375, -0.1525115966796875, -0.14704132080078125, -0.141571044921875, -0.13610076904296875, -0.1306304931640625, -0.12516021728515625, -0.11968994140625, -0.11421966552734375, -0.1087493896484375, -0.10327911376953125, -0.097808837890625, -0.09233856201171875, -0.0868682861328125, -0.08139801025390625, -0.075927734375, -0.07045745849609375, -0.0649871826171875, -0.05951690673828125, -0.054046630859375, -0.04857635498046875, -0.0431060791015625, -0.03763580322265625, -0.03216552734375, -0.02669525146484375, -0.0212249755859375, -0.01575469970703125, -0.010284423828125, -0.00481414794921875, 0.0006561279296875, 0.00612640380859375, 0.0115966796875, 0.01706695556640625, 0.0225372314453125, 0.02800750732421875, 0.033477783203125, 0.03894805908203125, 0.0444183349609375, 0.04988861083984375, 0.05535888671875, 0.06082916259765625, 0.0662994384765625, 0.07176971435546875, 0.077239990234375, 0.08271026611328125, 0.0881805419921875, 0.09365081787109375, 0.09912109375, 0.10459136962890625, 0.1100616455078125, 0.11553192138671875, 0.121002197265625, 0.12647247314453125, 0.1319427490234375, 0.13741302490234375, 0.14288330078125, 0.14835357666015625, 0.1538238525390625, 0.15929412841796875, 0.164764404296875, 0.17023468017578125, 0.1757049560546875, 0.18117523193359375, 0.1866455078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 13.0, 12.0, 14.0, 19.0, 17.0, 37.0, 39.0, 47.0, 53.0, 66.0, 92.0, 96.0, 81.0, 83.0, 42.0, 49.0, 39.0, 30.0, 38.0, 34.0, 8.0, 15.0, 15.0, 13.0, 6.0, 9.0, 8.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4616718292236328e-05, -2.3817643523216248e-05, -2.3018568754196167e-05, -2.2219493985176086e-05, -2.1420419216156006e-05, -2.0621344447135925e-05, -1.9822269678115845e-05, -1.9023194909095764e-05, -1.8224120140075684e-05, -1.7425045371055603e-05, -1.6625970602035522e-05, -1.5826895833015442e-05, -1.5027821063995361e-05, -1.422874629497528e-05, -1.34296715259552e-05, -1.263059675693512e-05, -1.1831521987915039e-05, -1.1032447218894958e-05, -1.0233372449874878e-05, -9.434297680854797e-06, -8.635222911834717e-06, -7.836148142814636e-06, -7.037073373794556e-06, -6.237998604774475e-06, -5.4389238357543945e-06, -4.639849066734314e-06, -3.840774297714233e-06, -3.041699528694153e-06, -2.2426247596740723e-06, -1.4435499906539917e-06, -6.444752216339111e-07, 1.5459954738616943e-07, 9.5367431640625e-07, 1.7527490854263306e-06, 2.551823854446411e-06, 3.3508986234664917e-06, 4.149973392486572e-06, 4.949048161506653e-06, 5.748122930526733e-06, 6.547197699546814e-06, 7.3462724685668945e-06, 8.145347237586975e-06, 8.944422006607056e-06, 9.743496775627136e-06, 1.0542571544647217e-05, 1.1341646313667297e-05, 1.2140721082687378e-05, 1.2939795851707458e-05, 1.3738870620727539e-05, 1.453794538974762e-05, 1.53370201587677e-05, 1.613609492778778e-05, 1.693516969680786e-05, 1.7734244465827942e-05, 1.8533319234848022e-05, 1.9332394003868103e-05, 2.0131468772888184e-05, 2.0930543541908264e-05, 2.1729618310928345e-05, 2.2528693079948425e-05, 2.3327767848968506e-05, 2.4126842617988586e-05, 2.4925917387008667e-05, 2.5724992156028748e-05, 2.6524066925048828e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 11.0, 23.0, 25.0, 51.0, 63.0, 126.0, 218.0, 349.0, 680.0, 1319.0, 2810.0, 7821.0, 22574.0, 82795.0, 345696.0, 427833.0, 110891.0, 28993.0, 9321.0, 3604.0, 1592.0, 747.0, 420.0, 225.0, 134.0, 77.0, 50.0, 27.0, 16.0, 17.0, 9.0, 7.0, 6.0, 2.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1788330078125, -0.1740131378173828, -0.16919326782226562, -0.16437339782714844, -0.15955352783203125, -0.15473365783691406, -0.14991378784179688, -0.1450939178466797, -0.1402740478515625, -0.1354541778564453, -0.13063430786132812, -0.12581443786621094, -0.12099456787109375, -0.11617469787597656, -0.11135482788085938, -0.10653495788574219, -0.101715087890625, -0.09689521789550781, -0.09207534790039062, -0.08725547790527344, -0.08243560791015625, -0.07761573791503906, -0.07279586791992188, -0.06797599792480469, -0.0631561279296875, -0.05833625793457031, -0.053516387939453125, -0.04869651794433594, -0.04387664794921875, -0.03905677795410156, -0.034236907958984375, -0.029417037963867188, -0.02459716796875, -0.019777297973632812, -0.014957427978515625, -0.010137557983398438, -0.00531768798828125, -0.0004978179931640625, 0.004322052001953125, 0.009141921997070312, 0.0139617919921875, 0.018781661987304688, 0.023601531982421875, 0.028421401977539062, 0.03324127197265625, 0.03806114196777344, 0.042881011962890625, 0.04770088195800781, 0.052520751953125, 0.05734062194824219, 0.062160491943359375, 0.06698036193847656, 0.07180023193359375, 0.07662010192871094, 0.08143997192382812, 0.08625984191894531, 0.0910797119140625, 0.09589958190917969, 0.10071945190429688, 0.10553932189941406, 0.11035919189453125, 0.11517906188964844, 0.11999893188476562, 0.12481880187988281, 0.129638671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 11.0, 9.0, 14.0, 18.0, 18.0, 31.0, 44.0, 44.0, 59.0, 66.0, 71.0, 77.0, 70.0, 76.0, 74.0, 61.0, 59.0, 36.0, 27.0, 30.0, 21.0, 25.0, 14.0, 6.0, 7.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059844970703125, -0.05748319625854492, -0.055121421813964844, -0.052759647369384766, -0.05039787292480469, -0.04803609848022461, -0.04567432403564453, -0.04331254959106445, -0.040950775146484375, -0.0385890007019043, -0.03622722625732422, -0.03386545181274414, -0.03150367736816406, -0.029141902923583984, -0.026780128479003906, -0.024418354034423828, -0.02205657958984375, -0.019694805145263672, -0.017333030700683594, -0.014971256256103516, -0.012609481811523438, -0.01024770736694336, -0.007885932922363281, -0.005524158477783203, -0.003162384033203125, -0.0008006095886230469, 0.0015611648559570312, 0.003922939300537109, 0.0062847137451171875, 0.008646488189697266, 0.011008262634277344, 0.013370037078857422, 0.0157318115234375, 0.018093585968017578, 0.020455360412597656, 0.022817134857177734, 0.025178909301757812, 0.02754068374633789, 0.02990245819091797, 0.03226423263549805, 0.034626007080078125, 0.0369877815246582, 0.03934955596923828, 0.04171133041381836, 0.04407310485839844, 0.046434879302978516, 0.048796653747558594, 0.05115842819213867, 0.05352020263671875, 0.05588197708129883, 0.058243751525878906, 0.060605525970458984, 0.06296730041503906, 0.06532907485961914, 0.06769084930419922, 0.0700526237487793, 0.07241439819335938, 0.07477617263793945, 0.07713794708251953, 0.07949972152709961, 0.08186149597167969, 0.08422327041625977, 0.08658504486083984, 0.08894681930541992, 0.09130859375]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 10.0, 7.0, 22.0, 65.0, 138.0, 229.0, 271.0, 136.0, 65.0, 22.0, 15.0, 9.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.673368453979492, -5.557599067687988, -5.441829204559326, -5.326059818267822, -5.210290431976318, -5.094520568847656, -4.978751182556152, -4.862981796264648, -4.747211933135986, -4.631442546844482, -4.51567268371582, -4.399903297424316, -4.2841339111328125, -4.16836404800415, -4.0525946617126465, -3.9368250370025635, -3.8210556507110596, -3.7052860260009766, -3.5895166397094727, -3.4737470149993896, -3.3579773902893066, -3.2422080039978027, -3.1264383792877197, -3.0106687545776367, -2.894899368286133, -2.77912974357605, -2.663360357284546, -2.547590732574463, -2.43182110786438, -2.316051483154297, -2.200282096862793, -2.08451247215271, -1.9687429666519165, -1.852973461151123, -1.73720383644104, -1.6214343309402466, -1.5056648254394531, -1.3898952007293701, -1.2741256952285767, -1.1583561897277832, -1.0425865650177002, -0.926816999912262, -0.8110474348068237, -0.6952779293060303, -0.579508364200592, -0.4637387990951538, -0.34796929359436035, -0.23219972848892212, -0.11643016338348389, -0.0006606131792068481, 0.11510893702507019, 0.23087847232818604, 0.34664803743362427, 0.4624176025390625, 0.578187108039856, 0.6939566731452942, 0.8097262382507324, 0.9254958033561707, 1.0412653684616089, 1.1570348739624023, 1.2728044986724854, 1.3885740041732788, 1.5043435096740723, 1.6201131343841553, 1.7358826398849487]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 6.0, 0.0, 7.0, 8.0, 6.0, 7.0, 15.0, 14.0, 26.0, 30.0, 28.0, 27.0, 32.0, 40.0, 44.0, 47.0, 56.0, 43.0, 55.0, 52.0, 52.0, 51.0, 40.0, 40.0, 41.0, 40.0, 37.0, 20.0, 38.0, 27.0, 12.0, 10.0, 14.0, 12.0, 8.0, 6.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1390507221221924, -2.0691416263580322, -1.999232530593872, -1.929323434829712, -1.8594143390655518, -1.7895052433013916, -1.719596266746521, -1.6496871709823608, -1.5797780752182007, -1.5098689794540405, -1.4399598836898804, -1.3700507879257202, -1.3001418113708496, -1.2302327156066895, -1.1603236198425293, -1.0904145240783691, -1.020505428314209, -0.9505963325500488, -0.8806872367858887, -0.8107782006263733, -0.7408691048622131, -0.670960009098053, -0.6010509729385376, -0.5311418771743774, -0.4612327814102173, -0.39132368564605713, -0.32141461968421936, -0.2515055537223816, -0.18159645795822144, -0.11168736219406128, -0.04177829623222351, 0.028130769729614258, 0.09803962707519531, 0.16794870793819427, 0.23785778880119324, 0.307766854763031, 0.37767595052719116, 0.4475850462913513, 0.5174940824508667, 0.5874031782150269, 0.657312273979187, 0.7272213697433472, 0.7971304655075073, 0.8670395016670227, 0.9369485974311829, 1.0068576335906982, 1.0767667293548584, 1.1466758251190186, 1.2165849208831787, 1.2864940166473389, 1.356403112411499, 1.4263122081756592, 1.4962213039398193, 1.5661303997039795, 1.63603937625885, 1.7059484720230103, 1.7758575677871704, 1.8457666635513306, 1.9156757593154907, 1.9855848550796509, 2.0554938316345215, 2.1254029273986816, 2.195312023162842, 2.265221118927002, 2.335130214691162]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 9.0, 12.0, 18.0, 31.0, 33.0, 51.0, 61.0, 90.0, 164.0, 238.0, 421.0, 759.0, 1436.0, 3194.0, 8041.0, 26283.0, 129381.0, 1486747.0, 2300008.0, 186854.0, 33176.0, 9848.0, 3775.0, 1616.0, 775.0, 467.0, 273.0, 156.0, 110.0, 86.0, 58.0, 28.0, 22.0, 20.0, 12.0, 8.0, 1.0, 4.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.12109375, -1.0908660888671875, -1.060638427734375, -1.0304107666015625, -1.00018310546875, -0.9699554443359375, -0.939727783203125, -0.9095001220703125, -0.8792724609375, -0.8490447998046875, -0.818817138671875, -0.7885894775390625, -0.75836181640625, -0.7281341552734375, -0.697906494140625, -0.6676788330078125, -0.637451171875, -0.6072235107421875, -0.576995849609375, -0.5467681884765625, -0.51654052734375, -0.4863128662109375, -0.456085205078125, -0.4258575439453125, -0.3956298828125, -0.3654022216796875, -0.335174560546875, -0.3049468994140625, -0.27471923828125, -0.2444915771484375, -0.214263916015625, -0.1840362548828125, -0.15380859375, -0.1235809326171875, -0.093353271484375, -0.0631256103515625, -0.03289794921875, -0.0026702880859375, 0.027557373046875, 0.0577850341796875, 0.0880126953125, 0.1182403564453125, 0.148468017578125, 0.1786956787109375, 0.20892333984375, 0.2391510009765625, 0.269378662109375, 0.2996063232421875, 0.329833984375, 0.3600616455078125, 0.390289306640625, 0.4205169677734375, 0.45074462890625, 0.4809722900390625, 0.511199951171875, 0.5414276123046875, 0.5716552734375, 0.6018829345703125, 0.632110595703125, 0.6623382568359375, 0.69256591796875, 0.7227935791015625, 0.753021240234375, 0.7832489013671875, 0.8134765625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 2.0, 5.0, 7.0, 10.0, 5.0, 12.0, 10.0, 20.0, 17.0, 14.0, 21.0, 36.0, 38.0, 53.0, 39.0, 64.0, 46.0, 52.0, 56.0, 60.0, 53.0, 46.0, 42.0, 53.0, 35.0, 46.0, 31.0, 16.0, 13.0, 17.0, 10.0, 11.0, 12.0, 6.0, 11.0, 3.0, 7.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.53271484375, -0.51336669921875, -0.4940185546875, -0.47467041015625, -0.455322265625, -0.43597412109375, -0.4166259765625, -0.39727783203125, -0.3779296875, -0.35858154296875, -0.3392333984375, -0.31988525390625, -0.300537109375, -0.28118896484375, -0.2618408203125, -0.24249267578125, -0.22314453125, -0.20379638671875, -0.1844482421875, -0.16510009765625, -0.145751953125, -0.12640380859375, -0.1070556640625, -0.08770751953125, -0.068359375, -0.04901123046875, -0.0296630859375, -0.01031494140625, 0.009033203125, 0.02838134765625, 0.0477294921875, 0.06707763671875, 0.08642578125, 0.10577392578125, 0.1251220703125, 0.14447021484375, 0.163818359375, 0.18316650390625, 0.2025146484375, 0.22186279296875, 0.2412109375, 0.26055908203125, 0.2799072265625, 0.29925537109375, 0.318603515625, 0.33795166015625, 0.3572998046875, 0.37664794921875, 0.39599609375, 0.41534423828125, 0.4346923828125, 0.45404052734375, 0.473388671875, 0.49273681640625, 0.5120849609375, 0.53143310546875, 0.55078125, 0.57012939453125, 0.5894775390625, 0.60882568359375, 0.628173828125, 0.64752197265625, 0.6668701171875, 0.68621826171875, 0.70556640625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 3.0, 9.0, 14.0, 18.0, 15.0, 35.0, 60.0, 81.0, 150.0, 354.0, 1008.0, 5725.0, 116085.0, 3986414.0, 77983.0, 4795.0, 862.0, 292.0, 132.0, 64.0, 60.0, 31.0, 16.0, 9.0, 6.0, 15.0, 8.0, 12.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.755859375, -1.69189453125, -1.6279296875, -1.56396484375, -1.5, -1.43603515625, -1.3720703125, -1.30810546875, -1.244140625, -1.18017578125, -1.1162109375, -1.05224609375, -0.98828125, -0.92431640625, -0.8603515625, -0.79638671875, -0.732421875, -0.66845703125, -0.6044921875, -0.54052734375, -0.4765625, -0.41259765625, -0.3486328125, -0.28466796875, -0.220703125, -0.15673828125, -0.0927734375, -0.02880859375, 0.03515625, 0.09912109375, 0.1630859375, 0.22705078125, 0.291015625, 0.35498046875, 0.4189453125, 0.48291015625, 0.546875, 0.61083984375, 0.6748046875, 0.73876953125, 0.802734375, 0.86669921875, 0.9306640625, 0.99462890625, 1.05859375, 1.12255859375, 1.1865234375, 1.25048828125, 1.314453125, 1.37841796875, 1.4423828125, 1.50634765625, 1.5703125, 1.63427734375, 1.6982421875, 1.76220703125, 1.826171875, 1.89013671875, 1.9541015625, 2.01806640625, 2.08203125, 2.14599609375, 2.2099609375, 2.27392578125, 2.337890625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 6.0, 8.0, 8.0, 14.0, 18.0, 28.0, 31.0, 45.0, 80.0, 108.0, 154.0, 320.0, 568.0, 791.0, 744.0, 419.0, 250.0, 128.0, 106.0, 81.0, 54.0, 29.0, 24.0, 13.0, 15.0, 11.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.299072265625, -0.2909526824951172, -0.2828330993652344, -0.27471351623535156, -0.26659393310546875, -0.25847434997558594, -0.2503547668457031, -0.2422351837158203, -0.2341156005859375, -0.2259960174560547, -0.21787643432617188, -0.20975685119628906, -0.20163726806640625, -0.19351768493652344, -0.18539810180664062, -0.1772785186767578, -0.169158935546875, -0.1610393524169922, -0.15291976928710938, -0.14480018615722656, -0.13668060302734375, -0.12856101989746094, -0.12044143676757812, -0.11232185363769531, -0.1042022705078125, -0.09608268737792969, -0.08796310424804688, -0.07984352111816406, -0.07172393798828125, -0.06360435485839844, -0.055484771728515625, -0.04736518859863281, -0.03924560546875, -0.031126022338867188, -0.023006439208984375, -0.014886856079101562, -0.00676727294921875, 0.0013523101806640625, 0.009471893310546875, 0.017591476440429688, 0.0257110595703125, 0.03383064270019531, 0.041950225830078125, 0.05006980895996094, 0.05818939208984375, 0.06630897521972656, 0.07442855834960938, 0.08254814147949219, 0.090667724609375, 0.09878730773925781, 0.10690689086914062, 0.11502647399902344, 0.12314605712890625, 0.13126564025878906, 0.13938522338867188, 0.1475048065185547, 0.1556243896484375, 0.1637439727783203, 0.17186355590820312, 0.17998313903808594, 0.18810272216796875, 0.19622230529785156, 0.20434188842773438, 0.2124614715576172, 0.2205810546875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 9.0, 16.0, 24.0, 59.0, 97.0, 120.0, 147.0, 165.0, 121.0, 94.0, 51.0, 32.0, 15.0, 17.0, 8.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8327101469039917, -1.780419111251831, -1.72812819480896, -1.6758371591567993, -1.6235461235046387, -1.5712552070617676, -1.518964171409607, -1.4666731357574463, -1.4143821001052856, -1.362091064453125, -1.309800148010254, -1.2575091123580933, -1.2052180767059326, -1.1529271602630615, -1.1006361246109009, -1.0483450889587402, -0.9960541129112244, -0.9437631368637085, -0.8914721012115479, -0.839181125164032, -0.7868900895118713, -0.7345991134643555, -0.6823080778121948, -0.630017101764679, -0.5777261257171631, -0.5254351496696472, -0.4731441140174866, -0.4208531379699707, -0.36856210231781006, -0.3162711262702942, -0.26398012042045593, -0.21168911457061768, -0.15939807891845703, -0.10710707306861877, -0.054816074669361115, -0.0025250762701034546, 0.0497659295797348, 0.10205692052841187, 0.15434792637825012, 0.20663893222808838, 0.25892993807792664, 0.3112209439277649, 0.36351194977760315, 0.4158029556274414, 0.4680939316749573, 0.5203849077224731, 0.5726759433746338, 0.6249669790267944, 0.6772579550743103, 0.7295489311218262, 0.7818399667739868, 0.8341309428215027, 0.8864219784736633, 0.9387129545211792, 0.9910039901733398, 1.043294906616211, 1.0955859422683716, 1.1478769779205322, 1.2001678943634033, 1.252458930015564, 1.3047499656677246, 1.3570408821105957, 1.4093319177627563, 1.461622953414917, 1.5139139890670776]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 0.0, 2.0, 3.0, 6.0, 3.0, 13.0, 9.0, 14.0, 19.0, 24.0, 20.0, 26.0, 33.0, 45.0, 41.0, 54.0, 43.0, 58.0, 60.0, 48.0, 54.0, 57.0, 46.0, 55.0, 53.0, 35.0, 42.0, 27.0, 19.0, 20.0, 7.0, 19.0, 6.0, 10.0, 5.0, 5.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6084237098693848, -0.586319625377655, -0.5642154812812805, -0.5421113967895508, -0.520007312297821, -0.4979031980037689, -0.4757990837097168, -0.45369499921798706, -0.4315909147262573, -0.4094868004322052, -0.38738271594047546, -0.36527860164642334, -0.3431745171546936, -0.3210704028606415, -0.29896628856658936, -0.2768622040748596, -0.2547580897808075, -0.23265399038791656, -0.21054989099502563, -0.1884457767009735, -0.16634169220924377, -0.14423757791519165, -0.12213347852230072, -0.10002937912940979, -0.07792527973651886, -0.05582118034362793, -0.0337170772254467, -0.011612974107265472, 0.010491125285625458, 0.03259522467851639, 0.054699331521987915, 0.07680343091487885, 0.09890753030776978, 0.1210116297006607, 0.14311572909355164, 0.16521984338760376, 0.1873239278793335, 0.20942804217338562, 0.23153214156627655, 0.2536362409591675, 0.2757403254508972, 0.29784443974494934, 0.3199485242366791, 0.3420526385307312, 0.36415672302246094, 0.38626083731651306, 0.4083649516105652, 0.4304690361022949, 0.45257315039634705, 0.47467726469039917, 0.4967813491821289, 0.5188854336738586, 0.5409895777702332, 0.5630936622619629, 0.5851977467536926, 0.6073018312454224, 0.6294059753417969, 0.6515100598335266, 0.6736142039299011, 0.6957182884216309, 0.7178223729133606, 0.7399264574050903, 0.7620306015014648, 0.7841346859931946, 0.8062387704849243]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 13.0, 23.0, 25.0, 46.0, 79.0, 115.0, 216.0, 330.0, 709.0, 1566.0, 3354.0, 7958.0, 22533.0, 72567.0, 296024.0, 462914.0, 124421.0, 34686.0, 11878.0, 4866.0, 2135.0, 954.0, 504.0, 262.0, 139.0, 89.0, 44.0, 25.0, 29.0, 14.0, 8.0, 7.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16357421875, -0.1577739715576172, -0.15197372436523438, -0.14617347717285156, -0.14037322998046875, -0.13457298278808594, -0.12877273559570312, -0.12297248840332031, -0.1171722412109375, -0.11137199401855469, -0.10557174682617188, -0.09977149963378906, -0.09397125244140625, -0.08817100524902344, -0.08237075805664062, -0.07657051086425781, -0.070770263671875, -0.06497001647949219, -0.059169769287109375, -0.05336952209472656, -0.04756927490234375, -0.04176902770996094, -0.035968780517578125, -0.030168533325195312, -0.0243682861328125, -0.018568038940429688, -0.012767791748046875, -0.0069675445556640625, -0.00116729736328125, 0.0046329498291015625, 0.010433197021484375, 0.016233444213867188, 0.02203369140625, 0.027833938598632812, 0.033634185791015625, 0.03943443298339844, 0.04523468017578125, 0.05103492736816406, 0.056835174560546875, 0.06263542175292969, 0.0684356689453125, 0.07423591613769531, 0.08003616333007812, 0.08583641052246094, 0.09163665771484375, 0.09743690490722656, 0.10323715209960938, 0.10903739929199219, 0.114837646484375, 0.12063789367675781, 0.12643814086914062, 0.13223838806152344, 0.13803863525390625, 0.14383888244628906, 0.14963912963867188, 0.1554393768310547, 0.1612396240234375, 0.1670398712158203, 0.17284011840820312, 0.17864036560058594, 0.18444061279296875, 0.19024085998535156, 0.19604110717773438, 0.2018413543701172, 0.2076416015625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 1.0, 5.0, 2.0, 4.0, 13.0, 16.0, 10.0, 19.0, 22.0, 28.0, 48.0, 48.0, 55.0, 67.0, 87.0, 77.0, 71.0, 69.0, 72.0, 73.0, 51.0, 48.0, 28.0, 17.0, 15.0, 14.0, 11.0, 10.0, 2.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48046875, -0.46120452880859375, -0.4419403076171875, -0.42267608642578125, -0.403411865234375, -0.38414764404296875, -0.3648834228515625, -0.34561920166015625, -0.32635498046875, -0.30709075927734375, -0.2878265380859375, -0.26856231689453125, -0.249298095703125, -0.23003387451171875, -0.2107696533203125, -0.19150543212890625, -0.1722412109375, -0.15297698974609375, -0.1337127685546875, -0.11444854736328125, -0.095184326171875, -0.07592010498046875, -0.0566558837890625, -0.03739166259765625, -0.01812744140625, 0.00113677978515625, 0.0204010009765625, 0.03966522216796875, 0.058929443359375, 0.07819366455078125, 0.0974578857421875, 0.11672210693359375, 0.135986328125, 0.15525054931640625, 0.1745147705078125, 0.19377899169921875, 0.213043212890625, 0.23230743408203125, 0.2515716552734375, 0.27083587646484375, 0.29010009765625, 0.30936431884765625, 0.3286285400390625, 0.34789276123046875, 0.367156982421875, 0.38642120361328125, 0.4056854248046875, 0.42494964599609375, 0.4442138671875, 0.46347808837890625, 0.4827423095703125, 0.5020065307617188, 0.521270751953125, 0.5405349731445312, 0.5597991943359375, 0.5790634155273438, 0.59832763671875, 0.6175918579101562, 0.6368560791015625, 0.6561203002929688, 0.675384521484375, 0.6946487426757812, 0.7139129638671875, 0.7331771850585938, 0.75244140625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0, 3.0, 5.0, 10.0, 14.0, 20.0, 20.0, 35.0, 56.0, 78.0, 130.0, 187.0, 367.0, 669.0, 1501.0, 3642.0, 11155.0, 44158.0, 233856.0, 571010.0, 139780.0, 28753.0, 7798.0, 2773.0, 1165.0, 569.0, 291.0, 177.0, 106.0, 69.0, 54.0, 46.0, 31.0, 12.0, 7.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2052001953125, -0.19939613342285156, -0.19359207153320312, -0.1877880096435547, -0.18198394775390625, -0.1761798858642578, -0.17037582397460938, -0.16457176208496094, -0.1587677001953125, -0.15296363830566406, -0.14715957641601562, -0.1413555145263672, -0.13555145263671875, -0.1297473907470703, -0.12394332885742188, -0.11813926696777344, -0.112335205078125, -0.10653114318847656, -0.10072708129882812, -0.09492301940917969, -0.08911895751953125, -0.08331489562988281, -0.07751083374023438, -0.07170677185058594, -0.0659027099609375, -0.06009864807128906, -0.054294586181640625, -0.04849052429199219, -0.04268646240234375, -0.03688240051269531, -0.031078338623046875, -0.025274276733398438, -0.01947021484375, -0.013666152954101562, -0.007862091064453125, -0.0020580291748046875, 0.00374603271484375, 0.009550094604492188, 0.015354156494140625, 0.021158218383789062, 0.0269622802734375, 0.03276634216308594, 0.038570404052734375, 0.04437446594238281, 0.05017852783203125, 0.05598258972167969, 0.061786651611328125, 0.06759071350097656, 0.073394775390625, 0.07919883728027344, 0.08500289916992188, 0.09080696105957031, 0.09661102294921875, 0.10241508483886719, 0.10821914672851562, 0.11402320861816406, 0.1198272705078125, 0.12563133239746094, 0.13143539428710938, 0.1372394561767578, 0.14304351806640625, 0.1488475799560547, 0.15465164184570312, 0.16045570373535156, 0.166259765625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 4.0, 11.0, 5.0, 13.0, 14.0, 6.0, 13.0, 22.0, 21.0, 17.0, 32.0, 25.0, 30.0, 47.0, 34.0, 52.0, 32.0, 44.0, 61.0, 45.0, 49.0, 48.0, 47.0, 38.0, 43.0, 39.0, 28.0, 38.0, 19.0, 20.0, 25.0, 18.0, 13.0, 12.0, 8.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7607421875, -0.73699951171875, -0.7132568359375, -0.68951416015625, -0.665771484375, -0.64202880859375, -0.6182861328125, -0.59454345703125, -0.57080078125, -0.54705810546875, -0.5233154296875, -0.49957275390625, -0.475830078125, -0.45208740234375, -0.4283447265625, -0.40460205078125, -0.380859375, -0.35711669921875, -0.3333740234375, -0.30963134765625, -0.285888671875, -0.26214599609375, -0.2384033203125, -0.21466064453125, -0.19091796875, -0.16717529296875, -0.1434326171875, -0.11968994140625, -0.095947265625, -0.07220458984375, -0.0484619140625, -0.02471923828125, -0.0009765625, 0.02276611328125, 0.0465087890625, 0.07025146484375, 0.093994140625, 0.11773681640625, 0.1414794921875, 0.16522216796875, 0.18896484375, 0.21270751953125, 0.2364501953125, 0.26019287109375, 0.283935546875, 0.30767822265625, 0.3314208984375, 0.35516357421875, 0.37890625, 0.40264892578125, 0.4263916015625, 0.45013427734375, 0.473876953125, 0.49761962890625, 0.5213623046875, 0.54510498046875, 0.56884765625, 0.59259033203125, 0.6163330078125, 0.64007568359375, 0.663818359375, 0.68756103515625, 0.7113037109375, 0.73504638671875, 0.7587890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 5.0, 5.0, 18.0, 14.0, 19.0, 27.0, 52.0, 88.0, 125.0, 218.0, 359.0, 644.0, 1219.0, 2385.0, 5109.0, 12823.0, 36920.0, 135936.0, 493904.0, 262111.0, 62660.0, 19763.0, 7445.0, 3241.0, 1467.0, 786.0, 469.0, 220.0, 197.0, 111.0, 57.0, 45.0, 32.0, 26.0, 14.0, 12.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06683349609375, -0.06485128402709961, -0.06286907196044922, -0.06088685989379883, -0.05890464782714844, -0.05692243576049805, -0.054940223693847656, -0.052958011627197266, -0.050975799560546875, -0.048993587493896484, -0.047011375427246094, -0.0450291633605957, -0.04304695129394531, -0.04106473922729492, -0.03908252716064453, -0.03710031509399414, -0.03511810302734375, -0.03313589096069336, -0.03115367889404297, -0.029171466827392578, -0.027189254760742188, -0.025207042694091797, -0.023224830627441406, -0.021242618560791016, -0.019260406494140625, -0.017278194427490234, -0.015295982360839844, -0.013313770294189453, -0.011331558227539062, -0.009349346160888672, -0.007367134094238281, -0.005384922027587891, -0.0034027099609375, -0.0014204978942871094, 0.0005617141723632812, 0.002543926239013672, 0.0045261383056640625, 0.006508350372314453, 0.008490562438964844, 0.010472774505615234, 0.012454986572265625, 0.014437198638916016, 0.016419410705566406, 0.018401622772216797, 0.020383834838867188, 0.022366046905517578, 0.02434825897216797, 0.02633047103881836, 0.02831268310546875, 0.03029489517211914, 0.03227710723876953, 0.03425931930541992, 0.03624153137207031, 0.0382237434387207, 0.040205955505371094, 0.042188167572021484, 0.044170379638671875, 0.046152591705322266, 0.048134803771972656, 0.05011701583862305, 0.05209922790527344, 0.05408143997192383, 0.05606365203857422, 0.05804586410522461, 0.060028076171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 8.0, 8.0, 11.0, 12.0, 24.0, 20.0, 43.0, 46.0, 58.0, 87.0, 113.0, 134.0, 128.0, 85.0, 68.0, 34.0, 43.0, 18.0, 16.0, 11.0, 9.0, 5.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17692756652832e-05, -3.0279159545898438e-05, -2.8789043426513672e-05, -2.7298927307128906e-05, -2.580881118774414e-05, -2.4318695068359375e-05, -2.282857894897461e-05, -2.1338462829589844e-05, -1.9848346710205078e-05, -1.8358230590820312e-05, -1.6868114471435547e-05, -1.537799835205078e-05, -1.3887882232666016e-05, -1.239776611328125e-05, -1.0907649993896484e-05, -9.417533874511719e-06, -7.927417755126953e-06, -6.4373016357421875e-06, -4.947185516357422e-06, -3.4570693969726562e-06, -1.9669532775878906e-06, -4.76837158203125e-07, 1.0132789611816406e-06, 2.5033950805664062e-06, 3.993511199951172e-06, 5.4836273193359375e-06, 6.973743438720703e-06, 8.463859558105469e-06, 9.953975677490234e-06, 1.1444091796875e-05, 1.2934207916259766e-05, 1.4424324035644531e-05, 1.5914440155029297e-05, 1.7404556274414062e-05, 1.8894672393798828e-05, 2.0384788513183594e-05, 2.187490463256836e-05, 2.3365020751953125e-05, 2.485513687133789e-05, 2.6345252990722656e-05, 2.7835369110107422e-05, 2.9325485229492188e-05, 3.081560134887695e-05, 3.230571746826172e-05, 3.3795833587646484e-05, 3.528594970703125e-05, 3.6776065826416016e-05, 3.826618194580078e-05, 3.975629806518555e-05, 4.124641418457031e-05, 4.273653030395508e-05, 4.4226646423339844e-05, 4.571676254272461e-05, 4.7206878662109375e-05, 4.869699478149414e-05, 5.0187110900878906e-05, 5.167722702026367e-05, 5.316734313964844e-05, 5.46574592590332e-05, 5.614757537841797e-05, 5.7637691497802734e-05, 5.91278076171875e-05, 6.0617923736572266e-05, 6.210803985595703e-05, 6.35981559753418e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 6.0, 3.0, 5.0, 10.0, 16.0, 31.0, 33.0, 59.0, 90.0, 143.0, 232.0, 457.0, 869.0, 1929.0, 4378.0, 11090.0, 31345.0, 100134.0, 354506.0, 378828.0, 109563.0, 34002.0, 12042.0, 4793.0, 1957.0, 944.0, 469.0, 239.0, 144.0, 83.0, 47.0, 29.0, 23.0, 16.0, 15.0, 10.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061309814453125, -0.05933427810668945, -0.057358741760253906, -0.05538320541381836, -0.05340766906738281, -0.051432132720947266, -0.04945659637451172, -0.04748106002807617, -0.045505523681640625, -0.04352998733520508, -0.04155445098876953, -0.039578914642333984, -0.03760337829589844, -0.03562784194946289, -0.033652305603027344, -0.0316767692565918, -0.02970123291015625, -0.027725696563720703, -0.025750160217285156, -0.02377462387084961, -0.021799087524414062, -0.019823551177978516, -0.01784801483154297, -0.015872478485107422, -0.013896942138671875, -0.011921405792236328, -0.009945869445800781, -0.007970333099365234, -0.0059947967529296875, -0.004019260406494141, -0.0020437240600585938, -6.818771362304688e-05, 0.0019073486328125, 0.003882884979248047, 0.005858421325683594, 0.00783395767211914, 0.009809494018554688, 0.011785030364990234, 0.013760566711425781, 0.015736103057861328, 0.017711639404296875, 0.019687175750732422, 0.02166271209716797, 0.023638248443603516, 0.025613784790039062, 0.02758932113647461, 0.029564857482910156, 0.0315403938293457, 0.03351593017578125, 0.0354914665222168, 0.037467002868652344, 0.03944253921508789, 0.04141807556152344, 0.043393611907958984, 0.04536914825439453, 0.04734468460083008, 0.049320220947265625, 0.05129575729370117, 0.05327129364013672, 0.055246829986572266, 0.05722236633300781, 0.05919790267944336, 0.061173439025878906, 0.06314897537231445, 0.06512451171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 2.0, 3.0, 4.0, 9.0, 4.0, 10.0, 9.0, 14.0, 11.0, 22.0, 12.0, 26.0, 35.0, 31.0, 33.0, 40.0, 46.0, 57.0, 71.0, 72.0, 60.0, 47.0, 58.0, 45.0, 40.0, 43.0, 31.0, 32.0, 23.0, 23.0, 13.0, 10.0, 13.0, 14.0, 11.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.013397216796875, -0.012999773025512695, -0.01260232925415039, -0.012204885482788086, -0.011807441711425781, -0.011409997940063477, -0.011012554168701172, -0.010615110397338867, -0.010217666625976562, -0.009820222854614258, -0.009422779083251953, -0.009025335311889648, -0.008627891540527344, -0.008230447769165039, -0.007833003997802734, -0.00743556022644043, -0.007038116455078125, -0.00664067268371582, -0.006243228912353516, -0.005845785140991211, -0.005448341369628906, -0.0050508975982666016, -0.004653453826904297, -0.004256010055541992, -0.0038585662841796875, -0.003461122512817383, -0.003063678741455078, -0.0026662349700927734, -0.0022687911987304688, -0.001871347427368164, -0.0014739036560058594, -0.0010764598846435547, -0.00067901611328125, -0.0002815723419189453, 0.00011587142944335938, 0.0005133152008056641, 0.0009107589721679688, 0.0013082027435302734, 0.0017056465148925781, 0.002103090286254883, 0.0025005340576171875, 0.002897977828979492, 0.003295421600341797, 0.0036928653717041016, 0.004090309143066406, 0.004487752914428711, 0.004885196685791016, 0.00528264045715332, 0.005680084228515625, 0.00607752799987793, 0.006474971771240234, 0.006872415542602539, 0.007269859313964844, 0.0076673030853271484, 0.008064746856689453, 0.008462190628051758, 0.008859634399414062, 0.009257078170776367, 0.009654521942138672, 0.010051965713500977, 0.010449409484863281, 0.010846853256225586, 0.01124429702758789, 0.011641740798950195, 0.0120391845703125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 11.0, 15.0, 36.0, 73.0, 114.0, 190.0, 210.0, 143.0, 93.0, 39.0, 21.0, 22.0, 9.0, 3.0, 2.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5127205848693848, -1.4721118211746216, -1.4315029382705688, -1.3908941745758057, -1.350285291671753, -1.3096765279769897, -1.2690677642822266, -1.2284588813781738, -1.1878501176834106, -1.1472413539886475, -1.1066324710845947, -1.0660237073898315, -1.0254149436950684, -0.9848060607910156, -0.9441972970962524, -0.9035884737968445, -0.8629796504974365, -0.8223708271980286, -0.7817620038986206, -0.7411532402038574, -0.7005444169044495, -0.6599355936050415, -0.6193268299102783, -0.5787180066108704, -0.5381091833114624, -0.49750036001205444, -0.45689156651496887, -0.4162827730178833, -0.37567394971847534, -0.3350651264190674, -0.2944563329219818, -0.25384753942489624, -0.21323871612548828, -0.17262990772724152, -0.13202109932899475, -0.09141229093074799, -0.05080348253250122, -0.010194674134254456, 0.03041413426399231, 0.07102292776107788, 0.11163175106048584, 0.1522405594587326, 0.19284936785697937, 0.23345817625522614, 0.2740669846534729, 0.31467580795288086, 0.35528460144996643, 0.395893394947052, 0.43650221824645996, 0.4771110415458679, 0.5177198648452759, 0.5583286285400391, 0.598937451839447, 0.639546275138855, 0.6801550388336182, 0.7207638621330261, 0.7613726854324341, 0.801981508731842, 0.84259033203125, 0.8831990957260132, 0.9238079190254211, 0.9644167423248291, 1.0050255060195923, 1.0456342697143555, 1.0862431526184082]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 8.0, 12.0, 16.0, 19.0, 34.0, 39.0, 53.0, 84.0, 61.0, 81.0, 88.0, 86.0, 80.0, 79.0, 68.0, 54.0, 32.0, 26.0, 17.0, 18.0, 12.0, 6.0, 7.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4622107148170471, -0.4412214159965515, -0.4202321171760559, -0.3992428183555603, -0.3782535195350647, -0.3572642207145691, -0.3362749218940735, -0.3152856230735779, -0.2942963242530823, -0.27330702543258667, -0.25231772661209106, -0.23132842779159546, -0.21033912897109985, -0.18934983015060425, -0.16836051642894745, -0.14737121760845184, -0.12638190388679504, -0.10539260506629944, -0.08440330624580383, -0.06341399997472763, -0.042424701154232025, -0.02143540233373642, -0.0004460960626602173, 0.020543202757835388, 0.041532501578330994, 0.0625218003988266, 0.0835110992193222, 0.10450040549039841, 0.1254897117614746, 0.14647901058197021, 0.16746830940246582, 0.18845760822296143, 0.20944690704345703, 0.23043620586395264, 0.25142550468444824, 0.27241480350494385, 0.29340410232543945, 0.31439340114593506, 0.33538269996643066, 0.35637199878692627, 0.3773612976074219, 0.3983505964279175, 0.4193398952484131, 0.4403291940689087, 0.4613184928894043, 0.4823077917098999, 0.5032970905303955, 0.5242863893508911, 0.5452756881713867, 0.5662649869918823, 0.5872542858123779, 0.6082435846328735, 0.6292328834533691, 0.6502221822738647, 0.6712114810943604, 0.692200779914856, 0.7131901383399963, 0.7341794371604919, 0.7551687359809875, 0.7761580348014832, 0.7971473336219788, 0.8181366324424744, 0.83912593126297, 0.8601152300834656, 0.8811045289039612]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 1.0, 5.0, 12.0, 21.0, 26.0, 51.0, 71.0, 170.0, 346.0, 1022.0, 4003.0, 29785.0, 756761.0, 239546.0, 13249.0, 2246.0, 658.0, 266.0, 110.0, 64.0, 34.0, 22.0, 16.0, 18.0, 12.0, 7.0, 6.0, 6.0, 8.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.373046875, -1.3336181640625, -1.294189453125, -1.2547607421875, -1.21533203125, -1.1759033203125, -1.136474609375, -1.0970458984375, -1.0576171875, -1.0181884765625, -0.978759765625, -0.9393310546875, -0.89990234375, -0.8604736328125, -0.821044921875, -0.7816162109375, -0.7421875, -0.7027587890625, -0.663330078125, -0.6239013671875, -0.58447265625, -0.5450439453125, -0.505615234375, -0.4661865234375, -0.4267578125, -0.3873291015625, -0.347900390625, -0.3084716796875, -0.26904296875, -0.2296142578125, -0.190185546875, -0.1507568359375, -0.111328125, -0.0718994140625, -0.032470703125, 0.0069580078125, 0.04638671875, 0.0858154296875, 0.125244140625, 0.1646728515625, 0.2041015625, 0.2435302734375, 0.282958984375, 0.3223876953125, 0.36181640625, 0.4012451171875, 0.440673828125, 0.4801025390625, 0.51953125, 0.5589599609375, 0.598388671875, 0.6378173828125, 0.67724609375, 0.7166748046875, 0.756103515625, 0.7955322265625, 0.8349609375, 0.8743896484375, 0.913818359375, 0.9532470703125, 0.99267578125, 1.0321044921875, 1.071533203125, 1.1109619140625, 1.150390625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 25.0, 34.0, 58.0, 90.0, 93.0, 154.0, 121.0, 120.0, 118.0, 61.0, 35.0, 23.0, 19.0, 16.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95947265625, -0.8924484252929688, -0.8254241943359375, -0.7583999633789062, -0.691375732421875, -0.6243515014648438, -0.5573272705078125, -0.49030303955078125, -0.42327880859375, -0.35625457763671875, -0.2892303466796875, -0.22220611572265625, -0.155181884765625, -0.08815765380859375, -0.0211334228515625, 0.04589080810546875, 0.1129150390625, 0.17993927001953125, 0.2469635009765625, 0.31398773193359375, 0.381011962890625, 0.44803619384765625, 0.5150604248046875, 0.5820846557617188, 0.64910888671875, 0.7161331176757812, 0.7831573486328125, 0.8501815795898438, 0.917205810546875, 0.9842300415039062, 1.0512542724609375, 1.1182785034179688, 1.185302734375, 1.2523269653320312, 1.3193511962890625, 1.3863754272460938, 1.453399658203125, 1.5204238891601562, 1.5874481201171875, 1.6544723510742188, 1.72149658203125, 1.7885208129882812, 1.8555450439453125, 1.9225692749023438, 1.989593505859375, 2.0566177368164062, 2.1236419677734375, 2.1906661987304688, 2.2576904296875, 2.3247146606445312, 2.3917388916015625, 2.4587631225585938, 2.525787353515625, 2.5928115844726562, 2.6598358154296875, 2.7268600463867188, 2.79388427734375, 2.8609085083007812, 2.9279327392578125, 2.9949569702148438, 3.061981201171875, 3.1290054321289062, 3.1960296630859375, 3.2630538940429688, 3.330078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 10.0, 18.0, 9.0, 25.0, 12.0, 22.0, 28.0, 29.0, 48.0, 61.0, 67.0, 97.0, 132.0, 227.0, 500.0, 1553.0, 7529.0, 146891.0, 857348.0, 28591.0, 3382.0, 917.0, 351.0, 180.0, 122.0, 83.0, 77.0, 49.0, 31.0, 27.0, 27.0, 21.0, 14.0, 20.0, 5.0, 8.0, 4.0, 5.0, 6.0, 4.0, 0.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.072265625, -1.0356292724609375, -0.998992919921875, -0.9623565673828125, -0.92572021484375, -0.8890838623046875, -0.852447509765625, -0.8158111572265625, -0.7791748046875, -0.7425384521484375, -0.705902099609375, -0.6692657470703125, -0.63262939453125, -0.5959930419921875, -0.559356689453125, -0.5227203369140625, -0.486083984375, -0.4494476318359375, -0.412811279296875, -0.3761749267578125, -0.33953857421875, -0.3029022216796875, -0.266265869140625, -0.2296295166015625, -0.1929931640625, -0.1563568115234375, -0.119720458984375, -0.0830841064453125, -0.04644775390625, -0.0098114013671875, 0.026824951171875, 0.0634613037109375, 0.10009765625, 0.1367340087890625, 0.173370361328125, 0.2100067138671875, 0.24664306640625, 0.2832794189453125, 0.319915771484375, 0.3565521240234375, 0.3931884765625, 0.4298248291015625, 0.466461181640625, 0.5030975341796875, 0.53973388671875, 0.5763702392578125, 0.613006591796875, 0.6496429443359375, 0.686279296875, 0.7229156494140625, 0.759552001953125, 0.7961883544921875, 0.83282470703125, 0.8694610595703125, 0.906097412109375, 0.9427337646484375, 0.9793701171875, 1.0160064697265625, 1.052642822265625, 1.0892791748046875, 1.12591552734375, 1.1625518798828125, 1.199188232421875, 1.2358245849609375, 1.2724609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 9.0, 7.0, 10.0, 17.0, 12.0, 14.0, 16.0, 20.0, 28.0, 18.0, 39.0, 27.0, 32.0, 25.0, 35.0, 45.0, 37.0, 44.0, 44.0, 38.0, 51.0, 44.0, 47.0, 45.0, 38.0, 29.0, 38.0, 29.0, 24.0, 17.0, 20.0, 15.0, 21.0, 7.0, 12.0, 6.0, 3.0, 8.0, 6.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.767578125, -0.7418060302734375, -0.716033935546875, -0.6902618408203125, -0.66448974609375, -0.6387176513671875, -0.612945556640625, -0.5871734619140625, -0.5614013671875, -0.5356292724609375, -0.509857177734375, -0.4840850830078125, -0.45831298828125, -0.4325408935546875, -0.406768798828125, -0.3809967041015625, -0.355224609375, -0.3294525146484375, -0.303680419921875, -0.2779083251953125, -0.25213623046875, -0.2263641357421875, -0.200592041015625, -0.1748199462890625, -0.1490478515625, -0.1232757568359375, -0.097503662109375, -0.0717315673828125, -0.04595947265625, -0.0201873779296875, 0.005584716796875, 0.0313568115234375, 0.05712890625, 0.0829010009765625, 0.108673095703125, 0.1344451904296875, 0.16021728515625, 0.1859893798828125, 0.211761474609375, 0.2375335693359375, 0.2633056640625, 0.2890777587890625, 0.314849853515625, 0.3406219482421875, 0.36639404296875, 0.3921661376953125, 0.417938232421875, 0.4437103271484375, 0.469482421875, 0.4952545166015625, 0.521026611328125, 0.5467987060546875, 0.57257080078125, 0.5983428955078125, 0.624114990234375, 0.6498870849609375, 0.6756591796875, 0.7014312744140625, 0.727203369140625, 0.7529754638671875, 0.77874755859375, 0.8045196533203125, 0.830291748046875, 0.8560638427734375, 0.8818359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 2.0, 10.0, 14.0, 23.0, 35.0, 41.0, 72.0, 103.0, 167.0, 252.0, 443.0, 813.0, 1649.0, 3227.0, 7235.0, 18422.0, 53551.0, 194502.0, 504200.0, 181999.0, 50500.0, 17720.0, 6955.0, 3092.0, 1498.0, 828.0, 413.0, 297.0, 153.0, 98.0, 75.0, 43.0, 44.0, 19.0, 12.0, 8.0, 9.0, 6.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1246337890625, -0.12067413330078125, -0.1167144775390625, -0.11275482177734375, -0.108795166015625, -0.10483551025390625, -0.1008758544921875, -0.09691619873046875, -0.09295654296875, -0.08899688720703125, -0.0850372314453125, -0.08107757568359375, -0.077117919921875, -0.07315826416015625, -0.0691986083984375, -0.06523895263671875, -0.061279296875, -0.05731964111328125, -0.0533599853515625, -0.04940032958984375, -0.045440673828125, -0.04148101806640625, -0.0375213623046875, -0.03356170654296875, -0.02960205078125, -0.02564239501953125, -0.0216827392578125, -0.01772308349609375, -0.013763427734375, -0.00980377197265625, -0.0058441162109375, -0.00188446044921875, 0.0020751953125, 0.00603485107421875, 0.0099945068359375, 0.01395416259765625, 0.017913818359375, 0.02187347412109375, 0.0258331298828125, 0.02979278564453125, 0.03375244140625, 0.03771209716796875, 0.0416717529296875, 0.04563140869140625, 0.049591064453125, 0.05355072021484375, 0.0575103759765625, 0.06147003173828125, 0.0654296875, 0.06938934326171875, 0.0733489990234375, 0.07730865478515625, 0.081268310546875, 0.08522796630859375, 0.0891876220703125, 0.09314727783203125, 0.09710693359375, 0.10106658935546875, 0.1050262451171875, 0.10898590087890625, 0.112945556640625, 0.11690521240234375, 0.1208648681640625, 0.12482452392578125, 0.1287841796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 11.0, 6.0, 12.0, 14.0, 20.0, 26.0, 38.0, 29.0, 49.0, 59.0, 94.0, 83.0, 109.0, 104.0, 79.0, 59.0, 51.0, 41.0, 30.0, 26.0, 14.0, 7.0, 5.0, 7.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.300739288330078e-05, -2.2224150598049164e-05, -2.1440908312797546e-05, -2.065766602754593e-05, -1.987442374229431e-05, -1.9091181457042694e-05, -1.8307939171791077e-05, -1.752469688653946e-05, -1.6741454601287842e-05, -1.5958212316036224e-05, -1.5174970030784607e-05, -1.439172774553299e-05, -1.3608485460281372e-05, -1.2825243175029755e-05, -1.2042000889778137e-05, -1.125875860452652e-05, -1.0475516319274902e-05, -9.692274034023285e-06, -8.909031748771667e-06, -8.12578946352005e-06, -7.342547178268433e-06, -6.559304893016815e-06, -5.776062607765198e-06, -4.99282032251358e-06, -4.209578037261963e-06, -3.4263357520103455e-06, -2.643093466758728e-06, -1.8598511815071106e-06, -1.0766088962554932e-06, -2.9336661100387573e-07, 4.898756742477417e-07, 1.2731179594993591e-06, 2.0563602447509766e-06, 2.839602530002594e-06, 3.6228448152542114e-06, 4.406087100505829e-06, 5.189329385757446e-06, 5.972571671009064e-06, 6.755813956260681e-06, 7.539056241512299e-06, 8.322298526763916e-06, 9.105540812015533e-06, 9.888783097267151e-06, 1.0672025382518768e-05, 1.1455267667770386e-05, 1.2238509953022003e-05, 1.302175223827362e-05, 1.3804994523525238e-05, 1.4588236808776855e-05, 1.5371479094028473e-05, 1.615472137928009e-05, 1.6937963664531708e-05, 1.7721205949783325e-05, 1.8504448235034943e-05, 1.928769052028656e-05, 2.0070932805538177e-05, 2.0854175090789795e-05, 2.1637417376041412e-05, 2.242065966129303e-05, 2.3203901946544647e-05, 2.3987144231796265e-05, 2.4770386517047882e-05, 2.55536288022995e-05, 2.6336871087551117e-05, 2.7120113372802734e-05]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 8.0, 7.0, 15.0, 13.0, 31.0, 32.0, 44.0, 59.0, 118.0, 189.0, 272.0, 416.0, 746.0, 1470.0, 2739.0, 5830.0, 13833.0, 36685.0, 118906.0, 426771.0, 311079.0, 81902.0, 26790.0, 10637.0, 4692.0, 2338.0, 1199.0, 668.0, 380.0, 243.0, 138.0, 99.0, 72.0, 42.0, 32.0, 21.0, 13.0, 7.0, 11.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1302490234375, -0.12615966796875, -0.1220703125, -0.11798095703125, -0.1138916015625, -0.10980224609375, -0.105712890625, -0.10162353515625, -0.0975341796875, -0.09344482421875, -0.08935546875, -0.08526611328125, -0.0811767578125, -0.07708740234375, -0.072998046875, -0.06890869140625, -0.0648193359375, -0.06072998046875, -0.056640625, -0.05255126953125, -0.0484619140625, -0.04437255859375, -0.040283203125, -0.03619384765625, -0.0321044921875, -0.02801513671875, -0.02392578125, -0.01983642578125, -0.0157470703125, -0.01165771484375, -0.007568359375, -0.00347900390625, 0.0006103515625, 0.00469970703125, 0.0087890625, 0.01287841796875, 0.0169677734375, 0.02105712890625, 0.025146484375, 0.02923583984375, 0.0333251953125, 0.03741455078125, 0.04150390625, 0.04559326171875, 0.0496826171875, 0.05377197265625, 0.057861328125, 0.06195068359375, 0.0660400390625, 0.07012939453125, 0.07421875, 0.07830810546875, 0.0823974609375, 0.08648681640625, 0.090576171875, 0.09466552734375, 0.0987548828125, 0.10284423828125, 0.10693359375, 0.11102294921875, 0.1151123046875, 0.11920166015625, 0.123291015625, 0.12738037109375, 0.1314697265625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 7.0, 9.0, 13.0, 7.0, 16.0, 11.0, 15.0, 27.0, 34.0, 36.0, 39.0, 58.0, 54.0, 82.0, 73.0, 66.0, 58.0, 62.0, 55.0, 42.0, 33.0, 27.0, 22.0, 32.0, 18.0, 22.0, 12.0, 9.0, 9.0, 10.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.050384521484375, -0.048601627349853516, -0.04681873321533203, -0.04503583908081055, -0.04325294494628906, -0.04147005081176758, -0.039687156677246094, -0.03790426254272461, -0.036121368408203125, -0.03433847427368164, -0.032555580139160156, -0.030772686004638672, -0.028989791870117188, -0.027206897735595703, -0.02542400360107422, -0.023641109466552734, -0.02185821533203125, -0.020075321197509766, -0.01829242706298828, -0.016509532928466797, -0.014726638793945312, -0.012943744659423828, -0.011160850524902344, -0.00937795639038086, -0.007595062255859375, -0.005812168121337891, -0.004029273986816406, -0.002246379852294922, -0.0004634857177734375, 0.0013194084167480469, 0.0031023025512695312, 0.004885196685791016, 0.0066680908203125, 0.008450984954833984, 0.010233879089355469, 0.012016773223876953, 0.013799667358398438, 0.015582561492919922, 0.017365455627441406, 0.01914834976196289, 0.020931243896484375, 0.02271413803100586, 0.024497032165527344, 0.026279926300048828, 0.028062820434570312, 0.029845714569091797, 0.03162860870361328, 0.033411502838134766, 0.03519439697265625, 0.036977291107177734, 0.03876018524169922, 0.0405430793762207, 0.04232597351074219, 0.04410886764526367, 0.045891761779785156, 0.04767465591430664, 0.049457550048828125, 0.05124044418334961, 0.053023338317871094, 0.05480623245239258, 0.05658912658691406, 0.05837202072143555, 0.06015491485595703, 0.061937808990478516, 0.063720703125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 6.0, 5.0, 13.0, 16.0, 37.0, 67.0, 102.0, 164.0, 185.0, 150.0, 99.0, 62.0, 40.0, 21.0, 10.0, 4.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5216164588928223, -2.448578357696533, -2.375540256500244, -2.302502155303955, -2.229464054107666, -2.156425952911377, -2.083387851715088, -2.010349750518799, -1.9373116493225098, -1.8642735481262207, -1.7912354469299316, -1.7181973457336426, -1.6451592445373535, -1.5721211433410645, -1.4990830421447754, -1.4260449409484863, -1.3530068397521973, -1.2799687385559082, -1.2069306373596191, -1.13389253616333, -1.060854434967041, -0.987816333770752, -0.9147782325744629, -0.8417401313781738, -0.7687020301818848, -0.6956639289855957, -0.6226258277893066, -0.5495877265930176, -0.4765496253967285, -0.40351152420043945, -0.3304734230041504, -0.25743532180786133, -0.18439698219299316, -0.1113588809967041, -0.03832077980041504, 0.03471732139587402, 0.10775542259216309, 0.18079352378845215, 0.2538316249847412, 0.3268697261810303, 0.39990782737731934, 0.4729459285736084, 0.5459840297698975, 0.6190221309661865, 0.6920602321624756, 0.7650983333587646, 0.8381364345550537, 0.9111745357513428, 0.9842126369476318, 1.057250738143921, 1.13028883934021, 1.203326940536499, 1.276365041732788, 1.3494031429290771, 1.4224412441253662, 1.4954793453216553, 1.5685174465179443, 1.6415555477142334, 1.7145936489105225, 1.7876317501068115, 1.8606698513031006, 1.9337079524993896, 2.0067460536956787, 2.0797841548919678, 2.152822256088257]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 10.0, 10.0, 25.0, 34.0, 42.0, 71.0, 77.0, 83.0, 89.0, 83.0, 78.0, 73.0, 82.0, 68.0, 60.0, 36.0, 26.0, 19.0, 16.0, 7.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8335562944412231, -1.7361416816711426, -1.6387271881103516, -1.541312575340271, -1.4438979625701904, -1.3464834690093994, -1.2490688562393188, -1.1516542434692383, -1.0542397499084473, -0.9568251967430115, -0.8594105839729309, -0.7619960308074951, -0.6645814180374146, -0.5671668648719788, -0.46975231170654297, -0.3723376989364624, -0.27492308616638184, -0.17750850319862366, -0.08009393513202667, 0.017320632934570312, 0.11473521590232849, 0.21214979887008667, 0.30956435203552246, 0.406978964805603, 0.5043935179710388, 0.6018080711364746, 0.6992226839065552, 0.796637237071991, 0.8940517902374268, 0.9914664030075073, 1.088881015777588, 1.186295509338379, 1.283710241317749, 1.3811248540878296, 1.4785393476486206, 1.5759539604187012, 1.6733685731887817, 1.7707831859588623, 1.8681976795196533, 1.9656122922897339, 2.0630269050598145, 2.1604413986206055, 2.2578561305999756, 2.3552706241607666, 2.4526851177215576, 2.5500998497009277, 2.6475143432617188, 2.7449288368225098, 2.842343330383301, 2.939757823944092, 3.037172555923462, 3.134587049484253, 3.232001543045044, 3.329416275024414, 3.426830768585205, 3.524245262145996, 3.621659994125366, 3.7190744876861572, 3.8164892196655273, 3.9139037132263184, 4.011318206787109, 4.1087327003479, 4.206147193908691, 4.303562164306641, 4.400976657867432]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 3.0, 9.0, 11.0, 19.0, 11.0, 25.0, 38.0, 57.0, 72.0, 98.0, 163.0, 226.0, 369.0, 572.0, 900.0, 1699.0, 3198.0, 7241.0, 19009.0, 67912.0, 404439.0, 2884403.0, 668016.0, 93994.0, 24540.0, 8678.0, 3796.0, 1898.0, 1091.0, 652.0, 378.0, 246.0, 182.0, 90.0, 85.0, 56.0, 30.0, 22.0, 20.0, 16.0, 7.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.76513671875, -0.74237060546875, -0.7196044921875, -0.69683837890625, -0.674072265625, -0.65130615234375, -0.6285400390625, -0.60577392578125, -0.5830078125, -0.56024169921875, -0.5374755859375, -0.51470947265625, -0.491943359375, -0.46917724609375, -0.4464111328125, -0.42364501953125, -0.40087890625, -0.37811279296875, -0.3553466796875, -0.33258056640625, -0.309814453125, -0.28704833984375, -0.2642822265625, -0.24151611328125, -0.21875, -0.19598388671875, -0.1732177734375, -0.15045166015625, -0.127685546875, -0.10491943359375, -0.0821533203125, -0.05938720703125, -0.03662109375, -0.01385498046875, 0.0089111328125, 0.03167724609375, 0.054443359375, 0.07720947265625, 0.0999755859375, 0.12274169921875, 0.1455078125, 0.16827392578125, 0.1910400390625, 0.21380615234375, 0.236572265625, 0.25933837890625, 0.2821044921875, 0.30487060546875, 0.32763671875, 0.35040283203125, 0.3731689453125, 0.39593505859375, 0.418701171875, 0.44146728515625, 0.4642333984375, 0.48699951171875, 0.509765625, 0.53253173828125, 0.5552978515625, 0.57806396484375, 0.600830078125, 0.62359619140625, 0.6463623046875, 0.66912841796875, 0.69189453125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 8.0, 11.0, 7.0, 16.0, 13.0, 23.0, 40.0, 41.0, 42.0, 59.0, 52.0, 63.0, 69.0, 70.0, 67.0, 66.0, 56.0, 61.0, 46.0, 41.0, 33.0, 22.0, 17.0, 18.0, 10.0, 10.0, 6.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.77294921875, -0.7512664794921875, -0.729583740234375, -0.7079010009765625, -0.68621826171875, -0.6645355224609375, -0.642852783203125, -0.6211700439453125, -0.5994873046875, -0.5778045654296875, -0.556121826171875, -0.5344390869140625, -0.51275634765625, -0.4910736083984375, -0.469390869140625, -0.4477081298828125, -0.426025390625, -0.4043426513671875, -0.382659912109375, -0.3609771728515625, -0.33929443359375, -0.3176116943359375, -0.295928955078125, -0.2742462158203125, -0.2525634765625, -0.2308807373046875, -0.209197998046875, -0.1875152587890625, -0.16583251953125, -0.1441497802734375, -0.122467041015625, -0.1007843017578125, -0.0791015625, -0.0574188232421875, -0.035736083984375, -0.0140533447265625, 0.00762939453125, 0.0293121337890625, 0.050994873046875, 0.0726776123046875, 0.0943603515625, 0.1160430908203125, 0.137725830078125, 0.1594085693359375, 0.18109130859375, 0.2027740478515625, 0.224456787109375, 0.2461395263671875, 0.267822265625, 0.2895050048828125, 0.311187744140625, 0.3328704833984375, 0.35455322265625, 0.3762359619140625, 0.397918701171875, 0.4196014404296875, 0.4412841796875, 0.4629669189453125, 0.484649658203125, 0.5063323974609375, 0.52801513671875, 0.5496978759765625, 0.571380615234375, 0.5930633544921875, 0.61474609375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 8.0, 16.0, 17.0, 38.0, 54.0, 121.0, 264.0, 871.0, 5237.0, 108795.0, 4022005.0, 52155.0, 3563.0, 664.0, 217.0, 98.0, 62.0, 26.0, 18.0, 10.0, 12.0, 9.0, 7.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.2282257080078125, -2.161529541015625, -2.0948333740234375, -2.02813720703125, -1.9614410400390625, -1.894744873046875, -1.8280487060546875, -1.7613525390625, -1.6946563720703125, -1.627960205078125, -1.5612640380859375, -1.49456787109375, -1.4278717041015625, -1.361175537109375, -1.2944793701171875, -1.227783203125, -1.1610870361328125, -1.094390869140625, -1.0276947021484375, -0.96099853515625, -0.8943023681640625, -0.827606201171875, -0.7609100341796875, -0.6942138671875, -0.6275177001953125, -0.560821533203125, -0.4941253662109375, -0.42742919921875, -0.3607330322265625, -0.294036865234375, -0.2273406982421875, -0.16064453125, -0.0939483642578125, -0.027252197265625, 0.0394439697265625, 0.10614013671875, 0.1728363037109375, 0.239532470703125, 0.3062286376953125, 0.3729248046875, 0.4396209716796875, 0.506317138671875, 0.5730133056640625, 0.63970947265625, 0.7064056396484375, 0.773101806640625, 0.8397979736328125, 0.906494140625, 0.9731903076171875, 1.039886474609375, 1.1065826416015625, 1.17327880859375, 1.2399749755859375, 1.306671142578125, 1.3733673095703125, 1.4400634765625, 1.5067596435546875, 1.573455810546875, 1.6401519775390625, 1.70684814453125, 1.7735443115234375, 1.840240478515625, 1.9069366455078125, 1.9736328125]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 11.0, 9.0, 12.0, 11.0, 19.0, 25.0, 35.0, 52.0, 71.0, 117.0, 169.0, 317.0, 607.0, 1023.0, 651.0, 363.0, 184.0, 132.0, 79.0, 48.0, 40.0, 31.0, 12.0, 14.0, 11.0, 10.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.303466796875, -0.2956066131591797, -0.2877464294433594, -0.27988624572753906, -0.27202606201171875, -0.26416587829589844, -0.2563056945800781, -0.2484455108642578, -0.2405853271484375, -0.2327251434326172, -0.22486495971679688, -0.21700477600097656, -0.20914459228515625, -0.20128440856933594, -0.19342422485351562, -0.1855640411376953, -0.177703857421875, -0.1698436737060547, -0.16198348999023438, -0.15412330627441406, -0.14626312255859375, -0.13840293884277344, -0.13054275512695312, -0.12268257141113281, -0.1148223876953125, -0.10696220397949219, -0.09910202026367188, -0.09124183654785156, -0.08338165283203125, -0.07552146911621094, -0.06766128540039062, -0.05980110168457031, -0.05194091796875, -0.04408073425292969, -0.036220550537109375, -0.028360366821289062, -0.02050018310546875, -0.012639999389648438, -0.004779815673828125, 0.0030803680419921875, 0.0109405517578125, 0.018800735473632812, 0.026660919189453125, 0.03452110290527344, 0.04238128662109375, 0.05024147033691406, 0.058101654052734375, 0.06596183776855469, 0.073822021484375, 0.08168220520019531, 0.08954238891601562, 0.09740257263183594, 0.10526275634765625, 0.11312294006347656, 0.12098312377929688, 0.1288433074951172, 0.1367034912109375, 0.1445636749267578, 0.15242385864257812, 0.16028404235839844, 0.16814422607421875, 0.17600440979003906, 0.18386459350585938, 0.1917247772216797, 0.1995849609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 8.0, 10.0, 16.0, 20.0, 37.0, 49.0, 76.0, 128.0, 144.0, 115.0, 119.0, 89.0, 64.0, 39.0, 21.0, 15.0, 16.0, 9.0, 8.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9965784549713135, -0.9553521871566772, -0.914125919342041, -0.8728996515274048, -0.8316733837127686, -0.7904471158981323, -0.7492208480834961, -0.7079945802688599, -0.6667683124542236, -0.6255420446395874, -0.5843157768249512, -0.5430895090103149, -0.5018632411956787, -0.4606369733810425, -0.41941070556640625, -0.37818443775177, -0.3369581699371338, -0.29573190212249756, -0.25450563430786133, -0.2132793664932251, -0.17205309867858887, -0.13082683086395264, -0.0896005630493164, -0.048374295234680176, -0.007148027420043945, 0.034078240394592285, 0.07530450820922852, 0.11653077602386475, 0.15775704383850098, 0.1989833116531372, 0.24020957946777344, 0.28143584728240967, 0.3226621150970459, 0.36388838291168213, 0.40511465072631836, 0.4463409185409546, 0.4875671863555908, 0.528793454170227, 0.5700197219848633, 0.6112459897994995, 0.6524722576141357, 0.693698525428772, 0.7349247932434082, 0.7761510610580444, 0.8173773288726807, 0.8586035966873169, 0.8998298645019531, 0.9410561323165894, 0.9822824001312256, 1.0235086679458618, 1.064734935760498, 1.1059612035751343, 1.1471874713897705, 1.1884137392044067, 1.229640007019043, 1.2708662748336792, 1.3120925426483154, 1.3533188104629517, 1.394545078277588, 1.4357713460922241, 1.4769976139068604, 1.5182238817214966, 1.5594501495361328, 1.600676417350769, 1.6419026851654053]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 6.0, 3.0, 7.0, 5.0, 3.0, 9.0, 9.0, 17.0, 16.0, 17.0, 30.0, 37.0, 31.0, 29.0, 42.0, 33.0, 49.0, 68.0, 56.0, 56.0, 50.0, 52.0, 35.0, 43.0, 38.0, 44.0, 34.0, 28.0, 18.0, 29.0, 22.0, 12.0, 14.0, 7.0, 8.0, 11.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.6031824946403503, -0.5844428539276123, -0.5657031536102295, -0.5469635128974915, -0.5282238721847534, -0.5094842314720154, -0.49074456095695496, -0.47200489044189453, -0.4532652497291565, -0.43452560901641846, -0.41578593850135803, -0.3970462679862976, -0.37830662727355957, -0.35956698656082153, -0.3408273160457611, -0.3220876455307007, -0.30334800481796265, -0.2846083641052246, -0.2658686935901642, -0.24712903797626495, -0.22838938236236572, -0.2096497267484665, -0.19091007113456726, -0.17217041552066803, -0.1534307599067688, -0.13469110429286957, -0.11595144867897034, -0.0972117930650711, -0.07847213745117188, -0.059732481837272644, -0.04099282622337341, -0.022253170609474182, -0.0035134553909301758, 0.015226200222969055, 0.033965855836868286, 0.05270551145076752, 0.07144516706466675, 0.09018482267856598, 0.10892447829246521, 0.12766413390636444, 0.14640378952026367, 0.1651434451341629, 0.18388310074806213, 0.20262275636196136, 0.2213624119758606, 0.24010206758975983, 0.25884172320365906, 0.2775813937187195, 0.2963210344314575, 0.31506067514419556, 0.333800345659256, 0.3525400161743164, 0.37127965688705444, 0.3900192975997925, 0.4087589681148529, 0.42749863862991333, 0.44623827934265137, 0.4649779200553894, 0.48371759057044983, 0.5024572610855103, 0.5211969017982483, 0.5399365425109863, 0.5586762428283691, 0.5774158835411072, 0.5961555242538452]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 3.0, 10.0, 24.0, 22.0, 28.0, 52.0, 60.0, 104.0, 172.0, 262.0, 393.0, 682.0, 1094.0, 1848.0, 3374.0, 6428.0, 13543.0, 32840.0, 123183.0, 615980.0, 175779.0, 40603.0, 15528.0, 7441.0, 3790.0, 2072.0, 1225.0, 724.0, 433.0, 288.0, 172.0, 116.0, 92.0, 37.0, 43.0, 27.0, 23.0, 17.0, 11.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2105712890625, -0.20411109924316406, -0.19765090942382812, -0.1911907196044922, -0.18473052978515625, -0.1782703399658203, -0.17181015014648438, -0.16534996032714844, -0.1588897705078125, -0.15242958068847656, -0.14596939086914062, -0.1395092010498047, -0.13304901123046875, -0.1265888214111328, -0.12012863159179688, -0.11366844177246094, -0.107208251953125, -0.10074806213378906, -0.09428787231445312, -0.08782768249511719, -0.08136749267578125, -0.07490730285644531, -0.06844711303710938, -0.06198692321777344, -0.0555267333984375, -0.04906654357910156, -0.042606353759765625, -0.03614616394042969, -0.02968597412109375, -0.023225784301757812, -0.016765594482421875, -0.010305404663085938, -0.00384521484375, 0.0026149749755859375, 0.009075164794921875, 0.015535354614257812, 0.02199554443359375, 0.028455734252929688, 0.034915924072265625, 0.04137611389160156, 0.0478363037109375, 0.05429649353027344, 0.060756683349609375, 0.06721687316894531, 0.07367706298828125, 0.08013725280761719, 0.08659744262695312, 0.09305763244628906, 0.099517822265625, 0.10597801208496094, 0.11243820190429688, 0.11889839172363281, 0.12535858154296875, 0.1318187713623047, 0.13827896118164062, 0.14473915100097656, 0.1511993408203125, 0.15765953063964844, 0.16411972045898438, 0.1705799102783203, 0.17704010009765625, 0.1835002899169922, 0.18996047973632812, 0.19642066955566406, 0.202880859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 9.0, 7.0, 9.0, 8.0, 7.0, 21.0, 18.0, 32.0, 37.0, 54.0, 39.0, 68.0, 66.0, 86.0, 63.0, 70.0, 72.0, 50.0, 61.0, 48.0, 40.0, 30.0, 22.0, 19.0, 20.0, 8.0, 8.0, 11.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.481689453125, -0.4642295837402344, -0.44676971435546875, -0.4293098449707031, -0.4118499755859375, -0.3943901062011719, -0.37693023681640625, -0.3594703674316406, -0.342010498046875, -0.3245506286621094, -0.30709075927734375, -0.2896308898925781, -0.2721710205078125, -0.2547111511230469, -0.23725128173828125, -0.21979141235351562, -0.20233154296875, -0.18487167358398438, -0.16741180419921875, -0.14995193481445312, -0.1324920654296875, -0.11503219604492188, -0.09757232666015625, -0.08011245727539062, -0.062652587890625, -0.045192718505859375, -0.02773284912109375, -0.010272979736328125, 0.0071868896484375, 0.024646759033203125, 0.04210662841796875, 0.059566497802734375, 0.0770263671875, 0.09448623657226562, 0.11194610595703125, 0.12940597534179688, 0.1468658447265625, 0.16432571411132812, 0.18178558349609375, 0.19924545288085938, 0.216705322265625, 0.23416519165039062, 0.25162506103515625, 0.2690849304199219, 0.2865447998046875, 0.3040046691894531, 0.32146453857421875, 0.3389244079589844, 0.35638427734375, 0.3738441467285156, 0.39130401611328125, 0.4087638854980469, 0.4262237548828125, 0.4436836242675781, 0.46114349365234375, 0.4786033630371094, 0.496063232421875, 0.5135231018066406, 0.5309829711914062, 0.5484428405761719, 0.5659027099609375, 0.5833625793457031, 0.6008224487304688, 0.6182823181152344, 0.6357421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 5.0, 7.0, 8.0, 5.0, 4.0, 14.0, 9.0, 9.0, 20.0, 30.0, 35.0, 52.0, 69.0, 127.0, 184.0, 320.0, 625.0, 1163.0, 2484.0, 6066.0, 18653.0, 93241.0, 682731.0, 198798.0, 28933.0, 8511.0, 3231.0, 1461.0, 711.0, 358.0, 222.0, 149.0, 105.0, 64.0, 38.0, 31.0, 16.0, 18.0, 13.0, 10.0, 7.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1756591796875, -0.16881370544433594, -0.16196823120117188, -0.1551227569580078, -0.14827728271484375, -0.1414318084716797, -0.13458633422851562, -0.12774085998535156, -0.1208953857421875, -0.11404991149902344, -0.10720443725585938, -0.10035896301269531, -0.09351348876953125, -0.08666801452636719, -0.07982254028320312, -0.07297706604003906, -0.066131591796875, -0.05928611755371094, -0.052440643310546875, -0.04559516906738281, -0.03874969482421875, -0.03190422058105469, -0.025058746337890625, -0.018213272094726562, -0.0113677978515625, -0.0045223236083984375, 0.002323150634765625, 0.009168624877929688, 0.01601409912109375, 0.022859573364257812, 0.029705047607421875, 0.03655052185058594, 0.04339599609375, 0.05024147033691406, 0.057086944580078125, 0.06393241882324219, 0.07077789306640625, 0.07762336730957031, 0.08446884155273438, 0.09131431579589844, 0.0981597900390625, 0.10500526428222656, 0.11185073852539062, 0.11869621276855469, 0.12554168701171875, 0.1323871612548828, 0.13923263549804688, 0.14607810974121094, 0.152923583984375, 0.15976905822753906, 0.16661453247070312, 0.1734600067138672, 0.18030548095703125, 0.1871509552001953, 0.19399642944335938, 0.20084190368652344, 0.2076873779296875, 0.21453285217285156, 0.22137832641601562, 0.2282238006591797, 0.23506927490234375, 0.2419147491455078, 0.24876022338867188, 0.25560569763183594, 0.262451171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 10.0, 8.0, 3.0, 7.0, 14.0, 12.0, 7.0, 23.0, 17.0, 26.0, 26.0, 28.0, 47.0, 36.0, 52.0, 54.0, 58.0, 44.0, 49.0, 49.0, 35.0, 49.0, 45.0, 47.0, 46.0, 44.0, 36.0, 21.0, 27.0, 10.0, 19.0, 11.0, 8.0, 11.0, 8.0, 4.0, 4.0, 2.0, 3.0, 6.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84814453125, -0.8212203979492188, -0.7942962646484375, -0.7673721313476562, -0.740447998046875, -0.7135238647460938, -0.6865997314453125, -0.6596755981445312, -0.63275146484375, -0.6058273315429688, -0.5789031982421875, -0.5519790649414062, -0.525054931640625, -0.49813079833984375, -0.4712066650390625, -0.44428253173828125, -0.4173583984375, -0.39043426513671875, -0.3635101318359375, -0.33658599853515625, -0.309661865234375, -0.28273773193359375, -0.2558135986328125, -0.22888946533203125, -0.20196533203125, -0.17504119873046875, -0.1481170654296875, -0.12119293212890625, -0.094268798828125, -0.06734466552734375, -0.0404205322265625, -0.01349639892578125, 0.013427734375, 0.04035186767578125, 0.0672760009765625, 0.09420013427734375, 0.121124267578125, 0.14804840087890625, 0.1749725341796875, 0.20189666748046875, 0.22882080078125, 0.25574493408203125, 0.2826690673828125, 0.30959320068359375, 0.336517333984375, 0.36344146728515625, 0.3903656005859375, 0.41728973388671875, 0.4442138671875, 0.47113800048828125, 0.4980621337890625, 0.5249862670898438, 0.551910400390625, 0.5788345336914062, 0.6057586669921875, 0.6326828002929688, 0.65960693359375, 0.6865310668945312, 0.7134552001953125, 0.7403793334960938, 0.767303466796875, 0.7942276000976562, 0.8211517333984375, 0.8480758666992188, 0.875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 0.0, 5.0, 8.0, 8.0, 19.0, 21.0, 22.0, 64.0, 84.0, 158.0, 247.0, 450.0, 880.0, 1886.0, 4508.0, 13778.0, 81713.0, 830321.0, 90887.0, 14715.0, 4735.0, 2021.0, 934.0, 447.0, 250.0, 139.0, 98.0, 56.0, 31.0, 20.0, 12.0, 13.0, 12.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1717529296875, -0.16717529296875, -0.16259765625, -0.15802001953125, -0.1534423828125, -0.14886474609375, -0.144287109375, -0.13970947265625, -0.1351318359375, -0.13055419921875, -0.1259765625, -0.12139892578125, -0.1168212890625, -0.11224365234375, -0.107666015625, -0.10308837890625, -0.0985107421875, -0.09393310546875, -0.08935546875, -0.08477783203125, -0.0802001953125, -0.07562255859375, -0.071044921875, -0.06646728515625, -0.0618896484375, -0.05731201171875, -0.052734375, -0.04815673828125, -0.0435791015625, -0.03900146484375, -0.034423828125, -0.02984619140625, -0.0252685546875, -0.02069091796875, -0.01611328125, -0.01153564453125, -0.0069580078125, -0.00238037109375, 0.002197265625, 0.00677490234375, 0.0113525390625, 0.01593017578125, 0.0205078125, 0.02508544921875, 0.0296630859375, 0.03424072265625, 0.038818359375, 0.04339599609375, 0.0479736328125, 0.05255126953125, 0.05712890625, 0.06170654296875, 0.0662841796875, 0.07086181640625, 0.075439453125, 0.08001708984375, 0.0845947265625, 0.08917236328125, 0.09375, 0.09832763671875, 0.1029052734375, 0.10748291015625, 0.112060546875, 0.11663818359375, 0.1212158203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 3.0, 11.0, 4.0, 16.0, 27.0, 37.0, 68.0, 87.0, 153.0, 205.0, 151.0, 88.0, 57.0, 25.0, 21.0, 14.0, 1.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.511543273925781e-05, -8.277781307697296e-05, -8.044019341468811e-05, -7.810257375240326e-05, -7.576495409011841e-05, -7.342733442783356e-05, -7.10897147655487e-05, -6.875209510326385e-05, -6.6414475440979e-05, -6.407685577869415e-05, -6.17392361164093e-05, -5.940161645412445e-05, -5.70639967918396e-05, -5.472637712955475e-05, -5.23887574672699e-05, -5.0051137804985046e-05, -4.7713518142700195e-05, -4.5375898480415344e-05, -4.303827881813049e-05, -4.070065915584564e-05, -3.836303949356079e-05, -3.602541983127594e-05, -3.368780016899109e-05, -3.135018050670624e-05, -2.9012560844421387e-05, -2.6674941182136536e-05, -2.4337321519851685e-05, -2.1999701857566833e-05, -1.9662082195281982e-05, -1.732446253299713e-05, -1.498684287071228e-05, -1.264922320842743e-05, -1.0311603546142578e-05, -7.973983883857727e-06, -5.636364221572876e-06, -3.298744559288025e-06, -9.611248970031738e-07, 1.3764947652816772e-06, 3.7141144275665283e-06, 6.051734089851379e-06, 8.38935375213623e-06, 1.0726973414421082e-05, 1.3064593076705933e-05, 1.5402212738990784e-05, 1.7739832401275635e-05, 2.0077452063560486e-05, 2.2415071725845337e-05, 2.4752691388130188e-05, 2.709031105041504e-05, 2.942793071269989e-05, 3.176555037498474e-05, 3.410317003726959e-05, 3.644078969955444e-05, 3.8778409361839294e-05, 4.1116029024124146e-05, 4.3453648686408997e-05, 4.579126834869385e-05, 4.81288880109787e-05, 5.046650767326355e-05, 5.28041273355484e-05, 5.514174699783325e-05, 5.74793666601181e-05, 5.9816986322402954e-05, 6.21546059846878e-05, 6.449222564697266e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 0.0, 6.0, 7.0, 8.0, 12.0, 22.0, 40.0, 51.0, 95.0, 143.0, 238.0, 447.0, 817.0, 1711.0, 3899.0, 9490.0, 32878.0, 345629.0, 587621.0, 44746.0, 11823.0, 4593.0, 2105.0, 973.0, 510.0, 263.0, 143.0, 96.0, 73.0, 23.0, 22.0, 13.0, 11.0, 9.0, 16.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.14306640625, -0.13898944854736328, -0.13491249084472656, -0.13083553314208984, -0.12675857543945312, -0.1226816177368164, -0.11860466003417969, -0.11452770233154297, -0.11045074462890625, -0.10637378692626953, -0.10229682922363281, -0.0982198715209961, -0.09414291381835938, -0.09006595611572266, -0.08598899841308594, -0.08191204071044922, -0.0778350830078125, -0.07375812530517578, -0.06968116760253906, -0.06560420989990234, -0.061527252197265625, -0.057450294494628906, -0.05337333679199219, -0.04929637908935547, -0.04521942138671875, -0.04114246368408203, -0.03706550598144531, -0.032988548278808594, -0.028911590576171875, -0.024834632873535156, -0.020757675170898438, -0.01668071746826172, -0.012603759765625, -0.008526802062988281, -0.0044498443603515625, -0.00037288665771484375, 0.003704071044921875, 0.007781028747558594, 0.011857986450195312, 0.01593494415283203, 0.02001190185546875, 0.02408885955810547, 0.028165817260742188, 0.032242774963378906, 0.036319732666015625, 0.040396690368652344, 0.04447364807128906, 0.04855060577392578, 0.0526275634765625, 0.05670452117919922, 0.06078147888183594, 0.06485843658447266, 0.06893539428710938, 0.0730123519897461, 0.07708930969238281, 0.08116626739501953, 0.08524322509765625, 0.08932018280029297, 0.09339714050292969, 0.0974740982055664, 0.10155105590820312, 0.10562801361083984, 0.10970497131347656, 0.11378192901611328, 0.11785888671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 3.0, 9.0, 10.0, 14.0, 16.0, 34.0, 40.0, 79.0, 111.0, 156.0, 154.0, 110.0, 71.0, 57.0, 33.0, 24.0, 12.0, 15.0, 10.0, 6.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023895263671875, -0.022979259490966797, -0.022063255310058594, -0.02114725112915039, -0.020231246948242188, -0.019315242767333984, -0.01839923858642578, -0.017483234405517578, -0.016567230224609375, -0.015651226043701172, -0.014735221862792969, -0.013819217681884766, -0.012903213500976562, -0.01198720932006836, -0.011071205139160156, -0.010155200958251953, -0.00923919677734375, -0.008323192596435547, -0.007407188415527344, -0.006491184234619141, -0.0055751800537109375, -0.004659175872802734, -0.0037431716918945312, -0.002827167510986328, -0.001911163330078125, -0.0009951591491699219, -7.915496826171875e-05, 0.0008368492126464844, 0.0017528533935546875, 0.0026688575744628906, 0.0035848617553710938, 0.004500865936279297, 0.0054168701171875, 0.006332874298095703, 0.007248878479003906, 0.00816488265991211, 0.009080886840820312, 0.009996891021728516, 0.010912895202636719, 0.011828899383544922, 0.012744903564453125, 0.013660907745361328, 0.014576911926269531, 0.015492916107177734, 0.016408920288085938, 0.01732492446899414, 0.018240928649902344, 0.019156932830810547, 0.02007293701171875, 0.020988941192626953, 0.021904945373535156, 0.02282094955444336, 0.023736953735351562, 0.024652957916259766, 0.02556896209716797, 0.026484966278076172, 0.027400970458984375, 0.028316974639892578, 0.02923297882080078, 0.030148983001708984, 0.031064987182617188, 0.03198099136352539, 0.032896995544433594, 0.0338129997253418, 0.03472900390625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 7.0, 11.0, 13.0, 22.0, 48.0, 71.0, 119.0, 163.0, 183.0, 142.0, 90.0, 42.0, 25.0, 14.0, 17.0, 10.0, 7.0, 7.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8666658401489258, -0.8335991501808167, -0.8005324602127075, -0.7674657702445984, -0.7343990802764893, -0.7013323307037354, -0.6682656407356262, -0.6351989507675171, -0.602132260799408, -0.5690655708312988, -0.5359988808631897, -0.5029321908950806, -0.46986547112464905, -0.4367987811565399, -0.4037320613861084, -0.37066537141799927, -0.33759868144989014, -0.304531991481781, -0.2714653015136719, -0.23839858174324036, -0.20533189177513123, -0.1722652018070221, -0.13919849693775177, -0.10613179206848145, -0.07306510210037231, -0.03999840468168259, -0.006931707262992859, 0.02613499015569687, 0.0592016875743866, 0.09226837754249573, 0.12533508241176605, 0.15840178728103638, 0.1914684772491455, 0.22453516721725464, 0.25760185718536377, 0.2906685769557953, 0.3237352669239044, 0.35680195689201355, 0.38986867666244507, 0.4229353666305542, 0.45600205659866333, 0.48906874656677246, 0.5221354365348816, 0.5552021265029907, 0.5882688760757446, 0.621335506439209, 0.6544022560119629, 0.687468945980072, 0.7205356359481812, 0.7536023259162903, 0.7866690158843994, 0.8197357058525085, 0.8528023958206177, 0.8858691453933716, 0.9189358353614807, 0.9520025253295898, 0.985069215297699, 1.018135905265808, 1.051202654838562, 1.0842692852020264, 1.1173360347747803, 1.1504026651382446, 1.1834694147109985, 1.216536045074463, 1.2496027946472168]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 6.0, 3.0, 8.0, 7.0, 13.0, 16.0, 25.0, 26.0, 27.0, 47.0, 40.0, 55.0, 54.0, 60.0, 72.0, 80.0, 57.0, 49.0, 57.0, 49.0, 41.0, 32.0, 33.0, 25.0, 26.0, 14.0, 12.0, 13.0, 14.0, 3.0, 7.0, 7.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4369208514690399, -0.42228955030441284, -0.4076582193374634, -0.3930269181728363, -0.37839561700820923, -0.36376428604125977, -0.3491329848766327, -0.3345016837120056, -0.31987035274505615, -0.3052390515804291, -0.2906077206134796, -0.27597641944885254, -0.2613450884819031, -0.246713787317276, -0.23208248615264893, -0.21745117008686066, -0.2028198540210724, -0.18818853795528412, -0.17355722188949585, -0.15892592072486877, -0.1442946046590805, -0.12966328859329224, -0.11503197997808456, -0.10040067136287689, -0.08576935529708862, -0.07113803923130035, -0.05650673061609268, -0.04187541827559471, -0.02724410593509674, -0.012612789869308472, 0.0020185187458992004, 0.016649827361106873, 0.031281113624572754, 0.045912425965070724, 0.060543738305568695, 0.07517504692077637, 0.08980636298656464, 0.1044376790523529, 0.11906898766756058, 0.13370029628276825, 0.14833161234855652, 0.1629629284143448, 0.17759424448013306, 0.19222554564476013, 0.2068568617105484, 0.22148817777633667, 0.23611947894096375, 0.2507507801055908, 0.2653821110725403, 0.28001341223716736, 0.2946447432041168, 0.3092760443687439, 0.32390737533569336, 0.33853867650032043, 0.3531699776649475, 0.367801308631897, 0.38243260979652405, 0.3970639109611511, 0.4116952419281006, 0.42632654309272766, 0.44095784425735474, 0.4555891752243042, 0.4702204763889313, 0.48485177755355835, 0.4994831085205078]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 9.0, 11.0, 24.0, 41.0, 72.0, 167.0, 477.0, 1439.0, 5063.0, 21775.0, 153691.0, 751909.0, 92917.0, 15365.0, 3699.0, 1180.0, 377.0, 142.0, 70.0, 33.0, 22.0, 11.0, 9.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.80859375, -0.78363037109375, -0.7586669921875, -0.73370361328125, -0.708740234375, -0.68377685546875, -0.6588134765625, -0.63385009765625, -0.60888671875, -0.58392333984375, -0.5589599609375, -0.53399658203125, -0.509033203125, -0.48406982421875, -0.4591064453125, -0.43414306640625, -0.4091796875, -0.38421630859375, -0.3592529296875, -0.33428955078125, -0.309326171875, -0.28436279296875, -0.2593994140625, -0.23443603515625, -0.20947265625, -0.18450927734375, -0.1595458984375, -0.13458251953125, -0.109619140625, -0.08465576171875, -0.0596923828125, -0.03472900390625, -0.009765625, 0.01519775390625, 0.0401611328125, 0.06512451171875, 0.090087890625, 0.11505126953125, 0.1400146484375, 0.16497802734375, 0.18994140625, 0.21490478515625, 0.2398681640625, 0.26483154296875, 0.289794921875, 0.31475830078125, 0.3397216796875, 0.36468505859375, 0.3896484375, 0.41461181640625, 0.4395751953125, 0.46453857421875, 0.489501953125, 0.51446533203125, 0.5394287109375, 0.56439208984375, 0.58935546875, 0.61431884765625, 0.6392822265625, 0.66424560546875, 0.689208984375, 0.71417236328125, 0.7391357421875, 0.76409912109375, 0.7890625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 17.0, 23.0, 41.0, 74.0, 101.0, 126.0, 167.0, 136.0, 118.0, 65.0, 43.0, 28.0, 24.0, 12.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -0.9563446044921875, -0.880462646484375, -0.8045806884765625, -0.72869873046875, -0.6528167724609375, -0.576934814453125, -0.5010528564453125, -0.4251708984375, -0.3492889404296875, -0.273406982421875, -0.1975250244140625, -0.12164306640625, -0.0457611083984375, 0.030120849609375, 0.1060028076171875, 0.181884765625, 0.2577667236328125, 0.333648681640625, 0.4095306396484375, 0.48541259765625, 0.5612945556640625, 0.637176513671875, 0.7130584716796875, 0.7889404296875, 0.8648223876953125, 0.940704345703125, 1.0165863037109375, 1.09246826171875, 1.1683502197265625, 1.244232177734375, 1.3201141357421875, 1.39599609375, 1.4718780517578125, 1.547760009765625, 1.6236419677734375, 1.69952392578125, 1.7754058837890625, 1.851287841796875, 1.9271697998046875, 2.0030517578125, 2.0789337158203125, 2.154815673828125, 2.2306976318359375, 2.30657958984375, 2.3824615478515625, 2.458343505859375, 2.5342254638671875, 2.610107421875, 2.6859893798828125, 2.761871337890625, 2.8377532958984375, 2.91363525390625, 2.9895172119140625, 3.065399169921875, 3.1412811279296875, 3.2171630859375, 3.2930450439453125, 3.368927001953125, 3.4448089599609375, 3.52069091796875, 3.5965728759765625, 3.672454833984375, 3.7483367919921875, 3.82421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 9.0, 8.0, 14.0, 11.0, 20.0, 27.0, 25.0, 54.0, 58.0, 70.0, 111.0, 150.0, 266.0, 508.0, 990.0, 2578.0, 7229.0, 26607.0, 141281.0, 681608.0, 146684.0, 27633.0, 7589.0, 2573.0, 1065.0, 506.0, 313.0, 159.0, 98.0, 80.0, 67.0, 32.0, 34.0, 19.0, 17.0, 10.0, 9.0, 8.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.49169921875, -0.4770240783691406, -0.46234893798828125, -0.4476737976074219, -0.4329986572265625, -0.4183235168457031, -0.40364837646484375, -0.3889732360839844, -0.374298095703125, -0.3596229553222656, -0.34494781494140625, -0.3302726745605469, -0.3155975341796875, -0.3009223937988281, -0.28624725341796875, -0.2715721130371094, -0.25689697265625, -0.24222183227539062, -0.22754669189453125, -0.21287155151367188, -0.1981964111328125, -0.18352127075195312, -0.16884613037109375, -0.15417098999023438, -0.139495849609375, -0.12482070922851562, -0.11014556884765625, -0.09547042846679688, -0.0807952880859375, -0.06612014770507812, -0.05144500732421875, -0.036769866943359375, -0.0220947265625, -0.007419586181640625, 0.00725555419921875, 0.021930694580078125, 0.0366058349609375, 0.051280975341796875, 0.06595611572265625, 0.08063125610351562, 0.095306396484375, 0.10998153686523438, 0.12465667724609375, 0.13933181762695312, 0.1540069580078125, 0.16868209838867188, 0.18335723876953125, 0.19803237915039062, 0.21270751953125, 0.22738265991210938, 0.24205780029296875, 0.2567329406738281, 0.2714080810546875, 0.2860832214355469, 0.30075836181640625, 0.3154335021972656, 0.330108642578125, 0.3447837829589844, 0.35945892333984375, 0.3741340637207031, 0.3888092041015625, 0.4034843444824219, 0.41815948486328125, 0.4328346252441406, 0.447509765625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 8.0, 10.0, 5.0, 4.0, 8.0, 20.0, 11.0, 11.0, 21.0, 15.0, 29.0, 29.0, 32.0, 35.0, 27.0, 39.0, 41.0, 45.0, 48.0, 47.0, 49.0, 53.0, 41.0, 43.0, 28.0, 28.0, 35.0, 42.0, 32.0, 31.0, 20.0, 16.0, 19.0, 14.0, 14.0, 11.0, 11.0, 5.0, 7.0, 3.0, 8.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -1.0006637573242188, -0.9691009521484375, -0.9375381469726562, -0.905975341796875, -0.8744125366210938, -0.8428497314453125, -0.8112869262695312, -0.77972412109375, -0.7481613159179688, -0.7165985107421875, -0.6850357055664062, -0.653472900390625, -0.6219100952148438, -0.5903472900390625, -0.5587844848632812, -0.5272216796875, -0.49565887451171875, -0.4640960693359375, -0.43253326416015625, -0.400970458984375, -0.36940765380859375, -0.3378448486328125, -0.30628204345703125, -0.27471923828125, -0.24315643310546875, -0.2115936279296875, -0.18003082275390625, -0.148468017578125, -0.11690521240234375, -0.0853424072265625, -0.05377960205078125, -0.022216796875, 0.00934600830078125, 0.0409088134765625, 0.07247161865234375, 0.104034423828125, 0.13559722900390625, 0.1671600341796875, 0.19872283935546875, 0.23028564453125, 0.26184844970703125, 0.2934112548828125, 0.32497406005859375, 0.356536865234375, 0.38809967041015625, 0.4196624755859375, 0.45122528076171875, 0.4827880859375, 0.5143508911132812, 0.5459136962890625, 0.5774765014648438, 0.609039306640625, 0.6406021118164062, 0.6721649169921875, 0.7037277221679688, 0.73529052734375, 0.7668533325195312, 0.7984161376953125, 0.8299789428710938, 0.861541748046875, 0.8931045532226562, 0.9246673583984375, 0.9562301635742188, 0.98779296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 3.0, 4.0, 4.0, 10.0, 18.0, 22.0, 40.0, 62.0, 101.0, 179.0, 341.0, 684.0, 1568.0, 4593.0, 15899.0, 92898.0, 765449.0, 137357.0, 20337.0, 5413.0, 1913.0, 776.0, 398.0, 207.0, 118.0, 51.0, 29.0, 34.0, 15.0, 13.0, 12.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2017822265625, -0.19446754455566406, -0.18715286254882812, -0.1798381805419922, -0.17252349853515625, -0.1652088165283203, -0.15789413452148438, -0.15057945251464844, -0.1432647705078125, -0.13595008850097656, -0.12863540649414062, -0.12132072448730469, -0.11400604248046875, -0.10669136047363281, -0.09937667846679688, -0.09206199645996094, -0.084747314453125, -0.07743263244628906, -0.07011795043945312, -0.06280326843261719, -0.05548858642578125, -0.04817390441894531, -0.040859222412109375, -0.03354454040527344, -0.0262298583984375, -0.018915176391601562, -0.011600494384765625, -0.0042858123779296875, 0.00302886962890625, 0.010343551635742188, 0.017658233642578125, 0.024972915649414062, 0.03228759765625, 0.03960227966308594, 0.046916961669921875, 0.05423164367675781, 0.06154632568359375, 0.06886100769042969, 0.07617568969726562, 0.08349037170410156, 0.0908050537109375, 0.09811973571777344, 0.10543441772460938, 0.11274909973144531, 0.12006378173828125, 0.1273784637451172, 0.13469314575195312, 0.14200782775878906, 0.149322509765625, 0.15663719177246094, 0.16395187377929688, 0.1712665557861328, 0.17858123779296875, 0.1858959197998047, 0.19321060180664062, 0.20052528381347656, 0.2078399658203125, 0.21515464782714844, 0.22246932983398438, 0.2297840118408203, 0.23709869384765625, 0.2444133758544922, 0.2517280578613281, 0.25904273986816406, 0.266357421875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 9.0, 17.0, 19.0, 22.0, 52.0, 64.0, 108.0, 185.0, 174.0, 100.0, 66.0, 55.0, 35.0, 21.0, 15.0, 11.0, 11.0, 2.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.14984130859375e-05, -5.0212256610393524e-05, -4.892610013484955e-05, -4.763994365930557e-05, -4.63537871837616e-05, -4.506763070821762e-05, -4.3781474232673645e-05, -4.249531775712967e-05, -4.120916128158569e-05, -3.992300480604172e-05, -3.863684833049774e-05, -3.7350691854953766e-05, -3.606453537940979e-05, -3.4778378903865814e-05, -3.349222242832184e-05, -3.220606595277786e-05, -3.091990947723389e-05, -2.963375300168991e-05, -2.8347596526145935e-05, -2.706144005060196e-05, -2.5775283575057983e-05, -2.4489127099514008e-05, -2.3202970623970032e-05, -2.1916814148426056e-05, -2.063065767288208e-05, -1.9344501197338104e-05, -1.805834472179413e-05, -1.6772188246250153e-05, -1.5486031770706177e-05, -1.4199875295162201e-05, -1.2913718819618225e-05, -1.162756234407425e-05, -1.0341405868530273e-05, -9.055249392986298e-06, -7.769092917442322e-06, -6.482936441898346e-06, -5.19677996635437e-06, -3.910623490810394e-06, -2.6244670152664185e-06, -1.3383105397224426e-06, -5.21540641784668e-08, 1.234002411365509e-06, 2.520158886909485e-06, 3.8063153624534607e-06, 5.0924718379974365e-06, 6.378628313541412e-06, 7.664784789085388e-06, 8.950941264629364e-06, 1.023709774017334e-05, 1.1523254215717316e-05, 1.2809410691261292e-05, 1.4095567166805267e-05, 1.5381723642349243e-05, 1.666788011789322e-05, 1.7954036593437195e-05, 1.924019306898117e-05, 2.0526349544525146e-05, 2.1812506020069122e-05, 2.3098662495613098e-05, 2.4384818971157074e-05, 2.567097544670105e-05, 2.6957131922245026e-05, 2.8243288397789e-05, 2.9529444873332977e-05, 3.081560134887695e-05]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 4.0, 15.0, 20.0, 21.0, 36.0, 45.0, 61.0, 90.0, 135.0, 233.0, 382.0, 732.0, 1360.0, 2654.0, 5972.0, 16109.0, 55539.0, 421764.0, 455298.0, 58688.0, 16824.0, 6452.0, 2797.0, 1440.0, 703.0, 387.0, 280.0, 169.0, 109.0, 71.0, 42.0, 28.0, 26.0, 17.0, 10.0, 7.0, 4.0, 2.0, 4.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.2064208984375, -0.20068931579589844, -0.19495773315429688, -0.1892261505126953, -0.18349456787109375, -0.1777629852294922, -0.17203140258789062, -0.16629981994628906, -0.1605682373046875, -0.15483665466308594, -0.14910507202148438, -0.1433734893798828, -0.13764190673828125, -0.1319103240966797, -0.12617874145507812, -0.12044715881347656, -0.114715576171875, -0.10898399353027344, -0.10325241088867188, -0.09752082824707031, -0.09178924560546875, -0.08605766296386719, -0.08032608032226562, -0.07459449768066406, -0.0688629150390625, -0.06313133239746094, -0.057399749755859375, -0.05166816711425781, -0.04593658447265625, -0.04020500183105469, -0.034473419189453125, -0.028741836547851562, -0.02301025390625, -0.017278671264648438, -0.011547088623046875, -0.0058155059814453125, -8.392333984375e-05, 0.0056476593017578125, 0.011379241943359375, 0.017110824584960938, 0.0228424072265625, 0.028573989868164062, 0.034305572509765625, 0.04003715515136719, 0.04576873779296875, 0.05150032043457031, 0.057231903076171875, 0.06296348571777344, 0.068695068359375, 0.07442665100097656, 0.08015823364257812, 0.08588981628417969, 0.09162139892578125, 0.09735298156738281, 0.10308456420898438, 0.10881614685058594, 0.1145477294921875, 0.12027931213378906, 0.12601089477539062, 0.1317424774169922, 0.13747406005859375, 0.1432056427001953, 0.14893722534179688, 0.15466880798339844, 0.160400390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 9.0, 14.0, 20.0, 19.0, 30.0, 44.0, 64.0, 104.0, 170.0, 165.0, 111.0, 61.0, 41.0, 42.0, 24.0, 19.0, 11.0, 10.0, 10.0, 5.0, 5.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09783935546875, -0.09422016143798828, -0.09060096740722656, -0.08698177337646484, -0.08336257934570312, -0.0797433853149414, -0.07612419128417969, -0.07250499725341797, -0.06888580322265625, -0.06526660919189453, -0.06164741516113281, -0.058028221130371094, -0.054409027099609375, -0.050789833068847656, -0.04717063903808594, -0.04355144500732422, -0.0399322509765625, -0.03631305694580078, -0.03269386291503906, -0.029074668884277344, -0.025455474853515625, -0.021836280822753906, -0.018217086791992188, -0.014597892761230469, -0.01097869873046875, -0.007359504699707031, -0.0037403106689453125, -0.00012111663818359375, 0.003498077392578125, 0.007117271423339844, 0.010736465454101562, 0.014355659484863281, 0.017974853515625, 0.02159404754638672, 0.025213241577148438, 0.028832435607910156, 0.032451629638671875, 0.036070823669433594, 0.03969001770019531, 0.04330921173095703, 0.04692840576171875, 0.05054759979248047, 0.05416679382324219, 0.057785987854003906, 0.061405181884765625, 0.06502437591552734, 0.06864356994628906, 0.07226276397705078, 0.0758819580078125, 0.07950115203857422, 0.08312034606933594, 0.08673954010009766, 0.09035873413085938, 0.0939779281616211, 0.09759712219238281, 0.10121631622314453, 0.10483551025390625, 0.10845470428466797, 0.11207389831542969, 0.1156930923461914, 0.11931228637695312, 0.12293148040771484, 0.12655067443847656, 0.13016986846923828, 0.1337890625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 16.0, 20.0, 54.0, 149.0, 277.0, 260.0, 127.0, 40.0, 30.0, 17.0, 3.0, 7.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.733736276626587, -2.619910478591919, -2.506084680557251, -2.392258882522583, -2.278433084487915, -2.164607286453247, -2.05078125, -1.9369555711746216, -1.8231297731399536, -1.7093039751052856, -1.5954781770706177, -1.4816522598266602, -1.3678264617919922, -1.2540006637573242, -1.1401748657226562, -1.0263490676879883, -0.9125232696533203, -0.7986974716186523, -0.6848716735839844, -0.5710458159446716, -0.45722001791000366, -0.3433942198753357, -0.22956836223602295, -0.11574256420135498, -0.0019167661666870117, 0.11190904676914215, 0.2257348597049713, 0.33956068754196167, 0.45338648557662964, 0.5672122836112976, 0.6810381412506104, 0.7948639392852783, 0.9086899757385254, 1.0225157737731934, 1.1363415718078613, 1.2501673698425293, 1.3639931678771973, 1.4778189659118652, 1.5916448831558228, 1.7054706811904907, 1.8192964792251587, 1.9331222772598267, 2.046948194503784, 2.160773992538452, 2.27459979057312, 2.388425588607788, 2.502251386642456, 2.616077184677124, 2.729902982711792, 2.84372878074646, 2.957554578781128, 3.071380376815796, 3.185206174850464, 3.299031972885132, 3.412858009338379, 3.526683807373047, 3.640509605407715, 3.754335403442383, 3.868161201477051, 3.9819869995117188, 4.095812797546387, 4.209638595581055, 4.323464393615723, 4.437290191650391, 4.551115989685059]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 8.0, 4.0, 8.0, 9.0, 22.0, 24.0, 21.0, 25.0, 39.0, 43.0, 50.0, 58.0, 50.0, 60.0, 69.0, 71.0, 66.0, 58.0, 45.0, 53.0, 43.0, 24.0, 35.0, 27.0, 24.0, 18.0, 9.0, 15.0, 5.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9182522296905518, -1.840989112854004, -1.7637261152267456, -1.6864629983901978, -1.60919988155365, -1.5319368839263916, -1.4546737670898438, -1.377410650253296, -1.300147533416748, -1.2228844165802002, -1.145621418952942, -1.068358302116394, -0.9910951852798462, -0.9138321280479431, -0.83656907081604, -0.7593059539794922, -0.6820429563522339, -0.6047798991203308, -0.527516782283783, -0.4502537250518799, -0.3729906380176544, -0.29572755098342896, -0.21846449375152588, -0.14120137691497803, -0.06393831968307495, 0.013324759900569916, 0.09058783948421478, 0.16785091161727905, 0.24511399865150452, 0.32237708568573, 0.39964014291763306, 0.4769032597541809, 0.554166316986084, 0.6314293742179871, 0.7086924910545349, 0.785955548286438, 0.8632186651229858, 0.9404817223548889, 1.017744779586792, 1.0950078964233398, 1.1722710132598877, 1.2495341300964355, 1.3267971277236938, 1.4040602445602417, 1.4813233613967896, 1.5585863590240479, 1.6358494758605957, 1.7131125926971436, 1.7903755903244019, 1.8676387071609497, 1.944901704788208, 2.022164821624756, 2.0994279384613037, 2.1766910552978516, 2.2539539337158203, 2.3312172889709473, 2.408480167388916, 2.485743284225464, 2.5630064010620117, 2.6402692794799805, 2.7175323963165283, 2.794795513153076, 2.872058629989624, 2.949321746826172, 3.0265848636627197]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 6.0, 3.0, 2.0, 9.0, 19.0, 16.0, 17.0, 41.0, 35.0, 62.0, 119.0, 199.0, 291.0, 501.0, 917.0, 1849.0, 4175.0, 11469.0, 45690.0, 338695.0, 3172135.0, 530992.0, 62498.0, 14934.0, 5159.0, 2139.0, 1004.0, 538.0, 295.0, 174.0, 105.0, 68.0, 48.0, 30.0, 17.0, 11.0, 10.0, 10.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64794921875, -0.6215896606445312, -0.5952301025390625, -0.5688705444335938, -0.542510986328125, -0.5161514282226562, -0.4897918701171875, -0.46343231201171875, -0.43707275390625, -0.41071319580078125, -0.3843536376953125, -0.35799407958984375, -0.331634521484375, -0.30527496337890625, -0.2789154052734375, -0.25255584716796875, -0.2261962890625, -0.19983673095703125, -0.1734771728515625, -0.14711761474609375, -0.120758056640625, -0.09439849853515625, -0.0680389404296875, -0.04167938232421875, -0.01531982421875, 0.01103973388671875, 0.0373992919921875, 0.06375885009765625, 0.090118408203125, 0.11647796630859375, 0.1428375244140625, 0.16919708251953125, 0.195556640625, 0.22191619873046875, 0.2482757568359375, 0.27463531494140625, 0.300994873046875, 0.32735443115234375, 0.3537139892578125, 0.38007354736328125, 0.40643310546875, 0.43279266357421875, 0.4591522216796875, 0.48551177978515625, 0.511871337890625, 0.5382308959960938, 0.5645904541015625, 0.5909500122070312, 0.6173095703125, 0.6436691284179688, 0.6700286865234375, 0.6963882446289062, 0.722747802734375, 0.7491073608398438, 0.7754669189453125, 0.8018264770507812, 0.82818603515625, 0.8545455932617188, 0.8809051513671875, 0.9072647094726562, 0.933624267578125, 0.9599838256835938, 0.9863433837890625, 1.0127029418945312, 1.0390625]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 6.0, 8.0, 5.0, 17.0, 16.0, 29.0, 25.0, 34.0, 28.0, 55.0, 56.0, 65.0, 62.0, 85.0, 81.0, 66.0, 59.0, 52.0, 50.0, 43.0, 26.0, 21.0, 25.0, 16.0, 8.0, 12.0, 4.0, 4.0, 9.0, 8.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64404296875, -0.6239471435546875, -0.603851318359375, -0.5837554931640625, -0.56365966796875, -0.5435638427734375, -0.523468017578125, -0.5033721923828125, -0.4832763671875, -0.4631805419921875, -0.443084716796875, -0.4229888916015625, -0.40289306640625, -0.3827972412109375, -0.362701416015625, -0.3426055908203125, -0.322509765625, -0.3024139404296875, -0.282318115234375, -0.2622222900390625, -0.24212646484375, -0.2220306396484375, -0.201934814453125, -0.1818389892578125, -0.1617431640625, -0.1416473388671875, -0.121551513671875, -0.1014556884765625, -0.08135986328125, -0.0612640380859375, -0.041168212890625, -0.0210723876953125, -0.0009765625, 0.0191192626953125, 0.039215087890625, 0.0593109130859375, 0.07940673828125, 0.0995025634765625, 0.119598388671875, 0.1396942138671875, 0.1597900390625, 0.1798858642578125, 0.199981689453125, 0.2200775146484375, 0.24017333984375, 0.2602691650390625, 0.280364990234375, 0.3004608154296875, 0.320556640625, 0.3406524658203125, 0.360748291015625, 0.3808441162109375, 0.40093994140625, 0.4210357666015625, 0.441131591796875, 0.4612274169921875, 0.4813232421875, 0.5014190673828125, 0.521514892578125, 0.5416107177734375, 0.56170654296875, 0.5818023681640625, 0.601898193359375, 0.6219940185546875, 0.64208984375]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 9.0, 14.0, 27.0, 31.0, 55.0, 112.0, 228.0, 398.0, 964.0, 2900.0, 10511.0, 69673.0, 3268452.0, 794746.0, 35887.0, 6767.0, 2042.0, 745.0, 314.0, 171.0, 94.0, 44.0, 36.0, 20.0, 11.0, 6.0, 9.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.388671875, -1.3529281616210938, -1.3171844482421875, -1.2814407348632812, -1.245697021484375, -1.2099533081054688, -1.1742095947265625, -1.1384658813476562, -1.10272216796875, -1.0669784545898438, -1.0312347412109375, -0.9954910278320312, -0.959747314453125, -0.9240036010742188, -0.8882598876953125, -0.8525161743164062, -0.8167724609375, -0.7810287475585938, -0.7452850341796875, -0.7095413208007812, -0.673797607421875, -0.6380538940429688, -0.6023101806640625, -0.5665664672851562, -0.53082275390625, -0.49507904052734375, -0.4593353271484375, -0.42359161376953125, -0.387847900390625, -0.35210418701171875, -0.3163604736328125, -0.28061676025390625, -0.244873046875, -0.20912933349609375, -0.1733856201171875, -0.13764190673828125, -0.101898193359375, -0.06615447998046875, -0.0304107666015625, 0.00533294677734375, 0.04107666015625, 0.07682037353515625, 0.1125640869140625, 0.14830780029296875, 0.184051513671875, 0.21979522705078125, 0.2555389404296875, 0.29128265380859375, 0.3270263671875, 0.36277008056640625, 0.3985137939453125, 0.43425750732421875, 0.470001220703125, 0.5057449340820312, 0.5414886474609375, 0.5772323608398438, 0.61297607421875, 0.6487197875976562, 0.6844635009765625, 0.7202072143554688, 0.755950927734375, 0.7916946411132812, 0.8274383544921875, 0.8631820678710938, 0.89892578125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 7.0, 15.0, 21.0, 20.0, 32.0, 56.0, 89.0, 146.0, 274.0, 546.0, 986.0, 887.0, 438.0, 201.0, 116.0, 83.0, 33.0, 30.0, 24.0, 16.0, 13.0, 14.0, 5.0, 2.0, 2.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.234375, -0.22564315795898438, -0.21691131591796875, -0.20817947387695312, -0.1994476318359375, -0.19071578979492188, -0.18198394775390625, -0.17325210571289062, -0.164520263671875, -0.15578842163085938, -0.14705657958984375, -0.13832473754882812, -0.1295928955078125, -0.12086105346679688, -0.11212921142578125, -0.10339736938476562, -0.09466552734375, -0.08593368530273438, -0.07720184326171875, -0.06847000122070312, -0.0597381591796875, -0.051006317138671875, -0.04227447509765625, -0.033542633056640625, -0.024810791015625, -0.016078948974609375, -0.00734710693359375, 0.001384735107421875, 0.0101165771484375, 0.018848419189453125, 0.02758026123046875, 0.036312103271484375, 0.0450439453125, 0.053775787353515625, 0.06250762939453125, 0.07123947143554688, 0.0799713134765625, 0.08870315551757812, 0.09743499755859375, 0.10616683959960938, 0.114898681640625, 0.12363052368164062, 0.13236236572265625, 0.14109420776367188, 0.1498260498046875, 0.15855789184570312, 0.16728973388671875, 0.17602157592773438, 0.18475341796875, 0.19348526000976562, 0.20221710205078125, 0.21094894409179688, 0.2196807861328125, 0.22841262817382812, 0.23714447021484375, 0.24587631225585938, 0.254608154296875, 0.2633399963378906, 0.27207183837890625, 0.2808036804199219, 0.2895355224609375, 0.2982673645019531, 0.30699920654296875, 0.3157310485839844, 0.324462890625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 10.0, 8.0, 14.0, 19.0, 34.0, 37.0, 70.0, 107.0, 121.0, 148.0, 111.0, 89.0, 73.0, 48.0, 35.0, 19.0, 11.0, 8.0, 7.0, 3.0, 9.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3823992013931274, -1.3455817699432373, -1.3087643384933472, -1.271946907043457, -1.235129475593567, -1.1983120441436768, -1.161494493484497, -1.124677062034607, -1.0878596305847168, -1.0510421991348267, -1.0142247676849365, -0.9774073362350464, -0.9405898451805115, -0.9037724137306213, -0.8669549822807312, -0.8301374912261963, -0.7933201193809509, -0.7565026879310608, -0.7196852564811707, -0.6828677654266357, -0.6460503339767456, -0.6092329025268555, -0.5724154710769653, -0.5355980396270752, -0.49878057837486267, -0.46196314692497253, -0.42514568567276, -0.3883282542228699, -0.35151082277297974, -0.3146933615207672, -0.2778759300708771, -0.24105846881866455, -0.20424097776412964, -0.1674235314130783, -0.13060608506202698, -0.09378865361213684, -0.05697120726108551, -0.02015376091003418, 0.016663670539855957, 0.05348113179206848, 0.09029856324195862, 0.12711600959300995, 0.16393345594406128, 0.20075088739395142, 0.23756833374500275, 0.2743857800960541, 0.3112032115459442, 0.34802067279815674, 0.3848381042480469, 0.421655535697937, 0.45847299695014954, 0.4952904284000397, 0.5321078896522522, 0.5689253211021423, 0.6057427525520325, 0.6425602436065674, 0.6793776750564575, 0.7161951065063477, 0.7530125379562378, 0.7898299694061279, 0.8266474604606628, 0.863464891910553, 0.9002823233604431, 0.937099814414978, 0.9739171862602234]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 8.0, 5.0, 6.0, 8.0, 13.0, 3.0, 16.0, 14.0, 21.0, 28.0, 32.0, 35.0, 53.0, 56.0, 60.0, 54.0, 56.0, 59.0, 65.0, 66.0, 45.0, 42.0, 40.0, 44.0, 25.0, 25.0, 26.0, 26.0, 17.0, 8.0, 6.0, 10.0, 8.0, 2.0, 5.0, 3.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.631807267665863, -0.612474262714386, -0.5931412577629089, -0.5738082528114319, -0.5544752478599548, -0.5351423025131226, -0.5158092975616455, -0.49647629261016846, -0.4771432876586914, -0.45781028270721436, -0.4384772777557373, -0.41914427280426025, -0.3998112976551056, -0.38047829270362854, -0.3611452877521515, -0.3418123126029968, -0.3224792778491974, -0.30314627289772034, -0.2838132679462433, -0.2644802927970886, -0.24514728784561157, -0.22581428289413452, -0.20648127794265747, -0.1871482878923416, -0.16781528294086456, -0.1484822779893875, -0.12914928793907166, -0.1098162829875946, -0.09048328548669815, -0.0711502879858017, -0.051817283034324646, -0.03248429298400879, -0.013151288032531738, 0.006181711331009865, 0.025514710694551468, 0.04484771192073822, 0.06418070942163467, 0.08351370692253113, 0.10284671187400818, 0.12217970192432404, 0.1415127068758011, 0.16084571182727814, 0.180178701877594, 0.19951170682907104, 0.2188447117805481, 0.23817770183086395, 0.2575107216835022, 0.27684369683265686, 0.2961767017841339, 0.31550970673561096, 0.334842711687088, 0.3541756868362427, 0.3735086917877197, 0.3928416967391968, 0.41217470169067383, 0.4315077066421509, 0.45084071159362793, 0.470173716545105, 0.48950672149658203, 0.5088397264480591, 0.5281727313995361, 0.5475057363510132, 0.5668387413024902, 0.5861716866493225, 0.6055046916007996]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 8.0, 4.0, 8.0, 10.0, 17.0, 33.0, 26.0, 50.0, 54.0, 89.0, 134.0, 174.0, 278.0, 413.0, 673.0, 995.0, 1754.0, 3150.0, 5881.0, 12147.0, 27211.0, 71436.0, 230319.0, 415436.0, 176507.0, 56894.0, 22633.0, 10192.0, 5104.0, 2697.0, 1510.0, 923.0, 606.0, 362.0, 265.0, 150.0, 125.0, 78.0, 57.0, 45.0, 37.0, 16.0, 17.0, 8.0, 5.0, 7.0, 9.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.09930419921875, -0.09641647338867188, -0.09352874755859375, -0.09064102172851562, -0.0877532958984375, -0.08486557006835938, -0.08197784423828125, -0.07909011840820312, -0.076202392578125, -0.07331466674804688, -0.07042694091796875, -0.06753921508789062, -0.0646514892578125, -0.061763763427734375, -0.05887603759765625, -0.055988311767578125, -0.0531005859375, -0.050212860107421875, -0.04732513427734375, -0.044437408447265625, -0.0415496826171875, -0.038661956787109375, -0.03577423095703125, -0.032886505126953125, -0.029998779296875, -0.027111053466796875, -0.02422332763671875, -0.021335601806640625, -0.0184478759765625, -0.015560150146484375, -0.01267242431640625, -0.009784698486328125, -0.00689697265625, -0.004009246826171875, -0.00112152099609375, 0.001766204833984375, 0.0046539306640625, 0.007541656494140625, 0.01042938232421875, 0.013317108154296875, 0.016204833984375, 0.019092559814453125, 0.02198028564453125, 0.024868011474609375, 0.0277557373046875, 0.030643463134765625, 0.03353118896484375, 0.036418914794921875, 0.039306640625, 0.042194366455078125, 0.04508209228515625, 0.047969818115234375, 0.0508575439453125, 0.053745269775390625, 0.05663299560546875, 0.059520721435546875, 0.062408447265625, 0.06529617309570312, 0.06818389892578125, 0.07107162475585938, 0.0739593505859375, 0.07684707641601562, 0.07973480224609375, 0.08262252807617188, 0.08551025390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 8.0, 14.0, 9.0, 17.0, 17.0, 28.0, 21.0, 41.0, 52.0, 59.0, 53.0, 67.0, 59.0, 54.0, 73.0, 64.0, 53.0, 43.0, 43.0, 38.0, 32.0, 27.0, 27.0, 21.0, 15.0, 10.0, 7.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.416259765625, -0.4026756286621094, -0.38909149169921875, -0.3755073547363281, -0.3619232177734375, -0.3483390808105469, -0.33475494384765625, -0.3211708068847656, -0.307586669921875, -0.2940025329589844, -0.28041839599609375, -0.2668342590332031, -0.2532501220703125, -0.23966598510742188, -0.22608184814453125, -0.21249771118164062, -0.19891357421875, -0.18532943725585938, -0.17174530029296875, -0.15816116333007812, -0.1445770263671875, -0.13099288940429688, -0.11740875244140625, -0.10382461547851562, -0.090240478515625, -0.07665634155273438, -0.06307220458984375, -0.049488067626953125, -0.0359039306640625, -0.022319793701171875, -0.00873565673828125, 0.004848480224609375, 0.0184326171875, 0.032016754150390625, 0.04560089111328125, 0.059185028076171875, 0.0727691650390625, 0.08635330200195312, 0.09993743896484375, 0.11352157592773438, 0.127105712890625, 0.14068984985351562, 0.15427398681640625, 0.16785812377929688, 0.1814422607421875, 0.19502639770507812, 0.20861053466796875, 0.22219467163085938, 0.23577880859375, 0.24936294555664062, 0.26294708251953125, 0.2765312194824219, 0.2901153564453125, 0.3036994934082031, 0.31728363037109375, 0.3308677673339844, 0.344451904296875, 0.3580360412597656, 0.37162017822265625, 0.3852043151855469, 0.3987884521484375, 0.4123725891113281, 0.42595672607421875, 0.4395408630371094, 0.453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 2.0, 4.0, 9.0, 13.0, 17.0, 18.0, 19.0, 27.0, 64.0, 106.0, 210.0, 377.0, 760.0, 2228.0, 8085.0, 52065.0, 598575.0, 348275.0, 29578.0, 5297.0, 1585.0, 570.0, 263.0, 151.0, 83.0, 54.0, 37.0, 21.0, 19.0, 8.0, 5.0, 5.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1773681640625, -0.17162132263183594, -0.16587448120117188, -0.1601276397705078, -0.15438079833984375, -0.1486339569091797, -0.14288711547851562, -0.13714027404785156, -0.1313934326171875, -0.12564659118652344, -0.11989974975585938, -0.11415290832519531, -0.10840606689453125, -0.10265922546386719, -0.09691238403320312, -0.09116554260253906, -0.085418701171875, -0.07967185974121094, -0.07392501831054688, -0.06817817687988281, -0.06243133544921875, -0.05668449401855469, -0.050937652587890625, -0.04519081115722656, -0.0394439697265625, -0.03369712829589844, -0.027950286865234375, -0.022203445434570312, -0.01645660400390625, -0.010709762573242188, -0.004962921142578125, 0.0007839202880859375, 0.00653076171875, 0.012277603149414062, 0.018024444580078125, 0.023771286010742188, 0.02951812744140625, 0.03526496887207031, 0.041011810302734375, 0.04675865173339844, 0.0525054931640625, 0.05825233459472656, 0.06399917602539062, 0.06974601745605469, 0.07549285888671875, 0.08123970031738281, 0.08698654174804688, 0.09273338317871094, 0.098480224609375, 0.10422706604003906, 0.10997390747070312, 0.11572074890136719, 0.12146759033203125, 0.1272144317626953, 0.13296127319335938, 0.13870811462402344, 0.1444549560546875, 0.15020179748535156, 0.15594863891601562, 0.1616954803466797, 0.16744232177734375, 0.1731891632080078, 0.17893600463867188, 0.18468284606933594, 0.1904296875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 5.0, 10.0, 5.0, 13.0, 19.0, 20.0, 21.0, 26.0, 38.0, 35.0, 45.0, 41.0, 44.0, 55.0, 49.0, 43.0, 50.0, 62.0, 46.0, 38.0, 49.0, 47.0, 45.0, 26.0, 33.0, 30.0, 29.0, 11.0, 16.0, 13.0, 9.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87548828125, -0.8513031005859375, -0.827117919921875, -0.8029327392578125, -0.77874755859375, -0.7545623779296875, -0.730377197265625, -0.7061920166015625, -0.6820068359375, -0.6578216552734375, -0.633636474609375, -0.6094512939453125, -0.58526611328125, -0.5610809326171875, -0.536895751953125, -0.5127105712890625, -0.488525390625, -0.4643402099609375, -0.440155029296875, -0.4159698486328125, -0.39178466796875, -0.3675994873046875, -0.343414306640625, -0.3192291259765625, -0.2950439453125, -0.2708587646484375, -0.246673583984375, -0.2224884033203125, -0.19830322265625, -0.1741180419921875, -0.149932861328125, -0.1257476806640625, -0.1015625, -0.0773773193359375, -0.053192138671875, -0.0290069580078125, -0.00482177734375, 0.0193634033203125, 0.043548583984375, 0.0677337646484375, 0.0919189453125, 0.1161041259765625, 0.140289306640625, 0.1644744873046875, 0.18865966796875, 0.2128448486328125, 0.237030029296875, 0.2612152099609375, 0.285400390625, 0.3095855712890625, 0.333770751953125, 0.3579559326171875, 0.38214111328125, 0.4063262939453125, 0.430511474609375, 0.4546966552734375, 0.4788818359375, 0.5030670166015625, 0.527252197265625, 0.5514373779296875, 0.57562255859375, 0.5998077392578125, 0.623992919921875, 0.6481781005859375, 0.67236328125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 6.0, 14.0, 22.0, 26.0, 55.0, 71.0, 158.0, 314.0, 615.0, 1652.0, 5985.0, 35530.0, 561015.0, 408028.0, 27236.0, 5156.0, 1455.0, 597.0, 265.0, 137.0, 82.0, 45.0, 21.0, 18.0, 12.0, 6.0, 3.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.09014892578125, -0.0877084732055664, -0.08526802062988281, -0.08282756805419922, -0.08038711547851562, -0.07794666290283203, -0.07550621032714844, -0.07306575775146484, -0.07062530517578125, -0.06818485260009766, -0.06574440002441406, -0.06330394744873047, -0.060863494873046875, -0.05842304229736328, -0.05598258972167969, -0.053542137145996094, -0.0511016845703125, -0.048661231994628906, -0.04622077941894531, -0.04378032684326172, -0.041339874267578125, -0.03889942169189453, -0.03645896911621094, -0.034018516540527344, -0.03157806396484375, -0.029137611389160156, -0.026697158813476562, -0.02425670623779297, -0.021816253662109375, -0.01937580108642578, -0.016935348510742188, -0.014494895935058594, -0.012054443359375, -0.009613990783691406, -0.0071735382080078125, -0.004733085632324219, -0.002292633056640625, 0.00014781951904296875, 0.0025882720947265625, 0.005028724670410156, 0.00746917724609375, 0.009909629821777344, 0.012350082397460938, 0.014790534973144531, 0.017230987548828125, 0.01967144012451172, 0.022111892700195312, 0.024552345275878906, 0.0269927978515625, 0.029433250427246094, 0.03187370300292969, 0.03431415557861328, 0.036754608154296875, 0.03919506072998047, 0.04163551330566406, 0.044075965881347656, 0.04651641845703125, 0.048956871032714844, 0.05139732360839844, 0.05383777618408203, 0.056278228759765625, 0.05871868133544922, 0.06115913391113281, 0.0635995864868164, 0.0660400390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 8.0, 8.0, 25.0, 35.0, 40.0, 62.0, 73.0, 96.0, 85.0, 118.0, 102.0, 92.0, 70.0, 48.0, 28.0, 22.0, 19.0, 16.0, 8.0, 4.0, 5.0, 7.0, 9.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2232532501220703e-05, -2.1447427570819855e-05, -2.0662322640419006e-05, -1.9877217710018158e-05, -1.909211277961731e-05, -1.830700784921646e-05, -1.7521902918815613e-05, -1.6736797988414764e-05, -1.5951693058013916e-05, -1.5166588127613068e-05, -1.438148319721222e-05, -1.3596378266811371e-05, -1.2811273336410522e-05, -1.2026168406009674e-05, -1.1241063475608826e-05, -1.0455958545207977e-05, -9.670853614807129e-06, -8.88574868440628e-06, -8.100643754005432e-06, -7.315538823604584e-06, -6.530433893203735e-06, -5.745328962802887e-06, -4.9602240324020386e-06, -4.17511910200119e-06, -3.390014171600342e-06, -2.6049092411994934e-06, -1.819804310798645e-06, -1.0346993803977966e-06, -2.4959444999694824e-07, 5.355104804039001e-07, 1.3206154108047485e-06, 2.105720341205597e-06, 2.8908252716064453e-06, 3.6759302020072937e-06, 4.461035132408142e-06, 5.2461400628089905e-06, 6.031244993209839e-06, 6.816349923610687e-06, 7.601454854011536e-06, 8.386559784412384e-06, 9.171664714813232e-06, 9.95676964521408e-06, 1.074187457561493e-05, 1.1526979506015778e-05, 1.2312084436416626e-05, 1.3097189366817474e-05, 1.3882294297218323e-05, 1.4667399227619171e-05, 1.545250415802002e-05, 1.6237609088420868e-05, 1.7022714018821716e-05, 1.7807818949222565e-05, 1.8592923879623413e-05, 1.937802881002426e-05, 2.016313374042511e-05, 2.0948238670825958e-05, 2.1733343601226807e-05, 2.2518448531627655e-05, 2.3303553462028503e-05, 2.4088658392429352e-05, 2.48737633228302e-05, 2.565886825323105e-05, 2.6443973183631897e-05, 2.7229078114032745e-05, 2.8014183044433594e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 12.0, 12.0, 13.0, 12.0, 32.0, 37.0, 71.0, 91.0, 155.0, 213.0, 399.0, 723.0, 1404.0, 3170.0, 7749.0, 21102.0, 69984.0, 286146.0, 463992.0, 135503.0, 36359.0, 12181.0, 4718.0, 2077.0, 1006.0, 534.0, 296.0, 184.0, 123.0, 73.0, 44.0, 26.0, 19.0, 20.0, 18.0, 11.0, 8.0, 10.0, 4.0, 5.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04132080078125, -0.03999805450439453, -0.03867530822753906, -0.037352561950683594, -0.036029815673828125, -0.034707069396972656, -0.03338432312011719, -0.03206157684326172, -0.03073883056640625, -0.02941608428955078, -0.028093338012695312, -0.026770591735839844, -0.025447845458984375, -0.024125099182128906, -0.022802352905273438, -0.02147960662841797, -0.0201568603515625, -0.01883411407470703, -0.017511367797851562, -0.016188621520996094, -0.014865875244140625, -0.013543128967285156, -0.012220382690429688, -0.010897636413574219, -0.00957489013671875, -0.008252143859863281, -0.0069293975830078125, -0.005606651306152344, -0.004283905029296875, -0.0029611587524414062, -0.0016384124755859375, -0.00031566619873046875, 0.001007080078125, 0.0023298263549804688, 0.0036525726318359375, 0.004975318908691406, 0.006298065185546875, 0.007620811462402344, 0.008943557739257812, 0.010266304016113281, 0.01158905029296875, 0.012911796569824219, 0.014234542846679688, 0.015557289123535156, 0.016880035400390625, 0.018202781677246094, 0.019525527954101562, 0.02084827423095703, 0.0221710205078125, 0.02349376678466797, 0.024816513061523438, 0.026139259338378906, 0.027462005615234375, 0.028784751892089844, 0.030107498168945312, 0.03143024444580078, 0.03275299072265625, 0.03407573699951172, 0.03539848327636719, 0.036721229553222656, 0.038043975830078125, 0.039366722106933594, 0.04068946838378906, 0.04201221466064453, 0.0433349609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 12.0, 12.0, 10.0, 21.0, 23.0, 30.0, 40.0, 61.0, 71.0, 122.0, 110.0, 98.0, 104.0, 70.0, 53.0, 41.0, 27.0, 16.0, 20.0, 18.0, 14.0, 7.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01129913330078125, -0.01082456111907959, -0.01034998893737793, -0.00987541675567627, -0.00940084457397461, -0.00892627239227295, -0.008451700210571289, -0.007977128028869629, -0.007502555847167969, -0.007027983665466309, -0.0065534114837646484, -0.006078839302062988, -0.005604267120361328, -0.005129694938659668, -0.004655122756958008, -0.004180550575256348, -0.0037059783935546875, -0.0032314062118530273, -0.002756834030151367, -0.002282261848449707, -0.0018076896667480469, -0.0013331174850463867, -0.0008585453033447266, -0.0003839731216430664, 9.059906005859375e-05, 0.0005651712417602539, 0.001039743423461914, 0.0015143156051635742, 0.0019888877868652344, 0.0024634599685668945, 0.0029380321502685547, 0.003412604331970215, 0.003887176513671875, 0.004361748695373535, 0.004836320877075195, 0.0053108930587768555, 0.005785465240478516, 0.006260037422180176, 0.006734609603881836, 0.007209181785583496, 0.007683753967285156, 0.008158326148986816, 0.008632898330688477, 0.009107470512390137, 0.009582042694091797, 0.010056614875793457, 0.010531187057495117, 0.011005759239196777, 0.011480331420898438, 0.011954903602600098, 0.012429475784301758, 0.012904047966003418, 0.013378620147705078, 0.013853192329406738, 0.014327764511108398, 0.014802336692810059, 0.015276908874511719, 0.01575148105621338, 0.01622605323791504, 0.0167006254196167, 0.01717519760131836, 0.01764976978302002, 0.01812434196472168, 0.01859891414642334, 0.019073486328125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 11.0, 12.0, 23.0, 29.0, 70.0, 132.0, 177.0, 215.0, 124.0, 87.0, 42.0, 23.0, 19.0, 9.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0850715637207031, -1.052314043045044, -1.0195565223693848, -0.9867991209030151, -0.954041600227356, -0.9212840795516968, -0.8885266184806824, -0.855769157409668, -0.8230116367340088, -0.7902541160583496, -0.7574966549873352, -0.7247391939163208, -0.6919816732406616, -0.6592241525650024, -0.626466691493988, -0.5937092304229736, -0.5609517097473145, -0.5281941890716553, -0.49543672800064087, -0.4626792371273041, -0.4299217462539673, -0.3971642553806305, -0.3644067645072937, -0.3316492736339569, -0.2988917827606201, -0.2661342918872833, -0.23337680101394653, -0.20061931014060974, -0.16786181926727295, -0.13510432839393616, -0.10234683752059937, -0.06958934664726257, -0.03683185577392578, -0.004074364900588989, 0.028683125972747803, 0.061440616846084595, 0.09419810771942139, 0.12695559859275818, 0.15971308946609497, 0.19247058033943176, 0.22522807121276855, 0.25798556208610535, 0.29074305295944214, 0.32350054383277893, 0.3562580347061157, 0.3890155255794525, 0.4217730164527893, 0.4545305073261261, 0.4872879981994629, 0.5200455188751221, 0.5528029799461365, 0.5855604410171509, 0.6183179616928101, 0.6510754823684692, 0.6838329434394836, 0.716590404510498, 0.7493479251861572, 0.7821054458618164, 0.8148629069328308, 0.8476203680038452, 0.8803778886795044, 0.9131354093551636, 0.945892870426178, 0.9786503314971924, 1.0114078521728516]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 6.0, 5.0, 10.0, 5.0, 8.0, 17.0, 8.0, 20.0, 36.0, 34.0, 39.0, 63.0, 67.0, 69.0, 73.0, 62.0, 67.0, 71.0, 52.0, 53.0, 53.0, 34.0, 20.0, 28.0, 29.0, 18.0, 8.0, 6.0, 11.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.4573909044265747, -0.44344955682754517, -0.429508239030838, -0.41556689143180847, -0.40162554383277893, -0.3876842260360718, -0.37374287843704224, -0.3598015308380127, -0.34586021304130554, -0.331918865442276, -0.31797754764556885, -0.3040362000465393, -0.29009485244750977, -0.2761535346508026, -0.26221218705177307, -0.24827085435390472, -0.23432950675487518, -0.22038817405700684, -0.2064468264579773, -0.19250549376010895, -0.1785641610622406, -0.16462281346321106, -0.1506814807653427, -0.13674014806747437, -0.12279880791902542, -0.10885746777057648, -0.09491613507270813, -0.08097479492425919, -0.06703345477581024, -0.053092122077941895, -0.03915078192949295, -0.025209449231624603, -0.01126810908317566, 0.002673228271305561, 0.01661456562578678, 0.030555903911590576, 0.04449724033474922, 0.05843857675790787, 0.07237991690635681, 0.08632124960422516, 0.1002625897526741, 0.11420392990112305, 0.1281452625989914, 0.14208659529685974, 0.15602794289588928, 0.16996927559375763, 0.18391060829162598, 0.19785195589065552, 0.21179328858852386, 0.2257346212863922, 0.23967596888542175, 0.2536172866821289, 0.26755863428115845, 0.281499981880188, 0.29544132947921753, 0.3093826472759247, 0.3233239948749542, 0.33726534247398376, 0.3512066602706909, 0.36514800786972046, 0.37908935546875, 0.39303067326545715, 0.4069720208644867, 0.42091333866119385, 0.4348546862602234]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 5.0, 7.0, 9.0, 24.0, 23.0, 41.0, 62.0, 96.0, 177.0, 320.0, 537.0, 1203.0, 2500.0, 5946.0, 15385.0, 47213.0, 210176.0, 575753.0, 133941.0, 34315.0, 11868.0, 4718.0, 2114.0, 987.0, 477.0, 259.0, 145.0, 83.0, 57.0, 36.0, 22.0, 15.0, 10.0, 19.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.50244140625, -0.4873847961425781, -0.47232818603515625, -0.4572715759277344, -0.4422149658203125, -0.4271583557128906, -0.41210174560546875, -0.3970451354980469, -0.381988525390625, -0.3669319152832031, -0.35187530517578125, -0.3368186950683594, -0.3217620849609375, -0.3067054748535156, -0.29164886474609375, -0.2765922546386719, -0.26153564453125, -0.24647903442382812, -0.23142242431640625, -0.21636581420898438, -0.2013092041015625, -0.18625259399414062, -0.17119598388671875, -0.15613937377929688, -0.141082763671875, -0.12602615356445312, -0.11096954345703125, -0.09591293334960938, -0.0808563232421875, -0.06579971313476562, -0.05074310302734375, -0.035686492919921875, -0.0206298828125, -0.005573272705078125, 0.00948333740234375, 0.024539947509765625, 0.0395965576171875, 0.054653167724609375, 0.06970977783203125, 0.08476638793945312, 0.099822998046875, 0.11487960815429688, 0.12993621826171875, 0.14499282836914062, 0.1600494384765625, 0.17510604858398438, 0.19016265869140625, 0.20521926879882812, 0.22027587890625, 0.23533248901367188, 0.25038909912109375, 0.2654457092285156, 0.2805023193359375, 0.2955589294433594, 0.31061553955078125, 0.3256721496582031, 0.340728759765625, 0.3557853698730469, 0.37084197998046875, 0.3858985900878906, 0.4009552001953125, 0.4160118103027344, 0.43106842041015625, 0.4461250305175781, 0.461181640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 6.0, 8.0, 9.0, 5.0, 11.0, 24.0, 20.0, 31.0, 42.0, 40.0, 43.0, 52.0, 56.0, 55.0, 69.0, 67.0, 62.0, 62.0, 47.0, 45.0, 36.0, 42.0, 34.0, 24.0, 24.0, 14.0, 15.0, 9.0, 6.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.97119140625, -0.94097900390625, -0.9107666015625, -0.88055419921875, -0.850341796875, -0.82012939453125, -0.7899169921875, -0.75970458984375, -0.7294921875, -0.69927978515625, -0.6690673828125, -0.63885498046875, -0.608642578125, -0.57843017578125, -0.5482177734375, -0.51800537109375, -0.48779296875, -0.45758056640625, -0.4273681640625, -0.39715576171875, -0.366943359375, -0.33673095703125, -0.3065185546875, -0.27630615234375, -0.24609375, -0.21588134765625, -0.1856689453125, -0.15545654296875, -0.125244140625, -0.09503173828125, -0.0648193359375, -0.03460693359375, -0.00439453125, 0.02581787109375, 0.0560302734375, 0.08624267578125, 0.116455078125, 0.14666748046875, 0.1768798828125, 0.20709228515625, 0.2373046875, 0.26751708984375, 0.2977294921875, 0.32794189453125, 0.358154296875, 0.38836669921875, 0.4185791015625, 0.44879150390625, 0.47900390625, 0.50921630859375, 0.5394287109375, 0.56964111328125, 0.599853515625, 0.63006591796875, 0.6602783203125, 0.69049072265625, 0.720703125, 0.75091552734375, 0.7811279296875, 0.81134033203125, 0.841552734375, 0.87176513671875, 0.9019775390625, 0.93218994140625, 0.96240234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 6.0, 9.0, 17.0, 19.0, 29.0, 27.0, 23.0, 32.0, 59.0, 66.0, 98.0, 177.0, 230.0, 401.0, 629.0, 1235.0, 2748.0, 7066.0, 22403.0, 98055.0, 588388.0, 261147.0, 44751.0, 12539.0, 4301.0, 1798.0, 877.0, 443.0, 285.0, 196.0, 131.0, 108.0, 52.0, 56.0, 44.0, 35.0, 18.0, 14.0, 9.0, 4.0, 8.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40869140625, -0.39582061767578125, -0.3829498291015625, -0.37007904052734375, -0.357208251953125, -0.34433746337890625, -0.3314666748046875, -0.31859588623046875, -0.30572509765625, -0.29285430908203125, -0.2799835205078125, -0.26711273193359375, -0.254241943359375, -0.24137115478515625, -0.2285003662109375, -0.21562957763671875, -0.2027587890625, -0.18988800048828125, -0.1770172119140625, -0.16414642333984375, -0.151275634765625, -0.13840484619140625, -0.1255340576171875, -0.11266326904296875, -0.09979248046875, -0.08692169189453125, -0.0740509033203125, -0.06118011474609375, -0.048309326171875, -0.03543853759765625, -0.0225677490234375, -0.00969696044921875, 0.003173828125, 0.01604461669921875, 0.0289154052734375, 0.04178619384765625, 0.054656982421875, 0.06752777099609375, 0.0803985595703125, 0.09326934814453125, 0.10614013671875, 0.11901092529296875, 0.1318817138671875, 0.14475250244140625, 0.157623291015625, 0.17049407958984375, 0.1833648681640625, 0.19623565673828125, 0.2091064453125, 0.22197723388671875, 0.2348480224609375, 0.24771881103515625, 0.260589599609375, 0.27346038818359375, 0.2863311767578125, 0.29920196533203125, 0.31207275390625, 0.32494354248046875, 0.3378143310546875, 0.35068511962890625, 0.363555908203125, 0.37642669677734375, 0.3892974853515625, 0.40216827392578125, 0.4150390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 6.0, 8.0, 8.0, 6.0, 9.0, 12.0, 27.0, 20.0, 21.0, 30.0, 30.0, 38.0, 33.0, 38.0, 40.0, 45.0, 36.0, 48.0, 56.0, 47.0, 42.0, 45.0, 38.0, 50.0, 46.0, 38.0, 27.0, 19.0, 29.0, 19.0, 11.0, 21.0, 12.0, 10.0, 12.0, 8.0, 7.0, 1.0, 4.0, 4.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0451278686523438, -1.0150604248046875, -0.9849929809570312, -0.954925537109375, -0.9248580932617188, -0.8947906494140625, -0.8647232055664062, -0.83465576171875, -0.8045883178710938, -0.7745208740234375, -0.7444534301757812, -0.714385986328125, -0.6843185424804688, -0.6542510986328125, -0.6241836547851562, -0.5941162109375, -0.5640487670898438, -0.5339813232421875, -0.5039138793945312, -0.473846435546875, -0.44377899169921875, -0.4137115478515625, -0.38364410400390625, -0.35357666015625, -0.32350921630859375, -0.2934417724609375, -0.26337432861328125, -0.233306884765625, -0.20323944091796875, -0.1731719970703125, -0.14310455322265625, -0.113037109375, -0.08296966552734375, -0.0529022216796875, -0.02283477783203125, 0.007232666015625, 0.03730010986328125, 0.0673675537109375, 0.09743499755859375, 0.12750244140625, 0.15756988525390625, 0.1876373291015625, 0.21770477294921875, 0.247772216796875, 0.27783966064453125, 0.3079071044921875, 0.33797454833984375, 0.3680419921875, 0.39810943603515625, 0.4281768798828125, 0.45824432373046875, 0.488311767578125, 0.5183792114257812, 0.5484466552734375, 0.5785140991210938, 0.60858154296875, 0.6386489868164062, 0.6687164306640625, 0.6987838745117188, 0.728851318359375, 0.7589187622070312, 0.7889862060546875, 0.8190536499023438, 0.84912109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 12.0, 9.0, 13.0, 13.0, 33.0, 50.0, 63.0, 90.0, 170.0, 326.0, 600.0, 1349.0, 3766.0, 15681.0, 100572.0, 705225.0, 187045.0, 24805.0, 5418.0, 1765.0, 712.0, 327.0, 190.0, 108.0, 60.0, 49.0, 30.0, 19.0, 19.0, 6.0, 9.0, 7.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1937255859375, -0.18740272521972656, -0.18107986450195312, -0.1747570037841797, -0.16843414306640625, -0.1621112823486328, -0.15578842163085938, -0.14946556091308594, -0.1431427001953125, -0.13681983947753906, -0.13049697875976562, -0.12417411804199219, -0.11785125732421875, -0.11152839660644531, -0.10520553588867188, -0.09888267517089844, -0.092559814453125, -0.08623695373535156, -0.07991409301757812, -0.07359123229980469, -0.06726837158203125, -0.06094551086425781, -0.054622650146484375, -0.04829978942871094, -0.0419769287109375, -0.03565406799316406, -0.029331207275390625, -0.023008346557617188, -0.01668548583984375, -0.010362625122070312, -0.004039764404296875, 0.0022830963134765625, 0.00860595703125, 0.014928817749023438, 0.021251678466796875, 0.027574539184570312, 0.03389739990234375, 0.04022026062011719, 0.046543121337890625, 0.05286598205566406, 0.0591888427734375, 0.06551170349121094, 0.07183456420898438, 0.07815742492675781, 0.08448028564453125, 0.09080314636230469, 0.09712600708007812, 0.10344886779785156, 0.109771728515625, 0.11609458923339844, 0.12241744995117188, 0.1287403106689453, 0.13506317138671875, 0.1413860321044922, 0.14770889282226562, 0.15403175354003906, 0.1603546142578125, 0.16667747497558594, 0.17300033569335938, 0.1793231964111328, 0.18564605712890625, 0.1919689178466797, 0.19829177856445312, 0.20461463928222656, 0.2109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 20.0, 16.0, 27.0, 26.0, 48.0, 78.0, 105.0, 153.0, 148.0, 114.0, 80.0, 51.0, 33.0, 28.0, 11.0, 20.0, 12.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.315376281738281e-05, -4.189833998680115e-05, -4.064291715621948e-05, -3.938749432563782e-05, -3.813207149505615e-05, -3.687664866447449e-05, -3.562122583389282e-05, -3.436580300331116e-05, -3.311038017272949e-05, -3.185495734214783e-05, -3.059953451156616e-05, -2.9344111680984497e-05, -2.8088688850402832e-05, -2.6833266019821167e-05, -2.5577843189239502e-05, -2.4322420358657837e-05, -2.3066997528076172e-05, -2.1811574697494507e-05, -2.0556151866912842e-05, -1.9300729036331177e-05, -1.8045306205749512e-05, -1.6789883375167847e-05, -1.553446054458618e-05, -1.4279037714004517e-05, -1.3023614883422852e-05, -1.1768192052841187e-05, -1.0512769222259521e-05, -9.257346391677856e-06, -8.001923561096191e-06, -6.746500730514526e-06, -5.491077899932861e-06, -4.235655069351196e-06, -2.9802322387695312e-06, -1.7248094081878662e-06, -4.6938657760620117e-07, 7.860362529754639e-07, 2.041459083557129e-06, 3.296881914138794e-06, 4.552304744720459e-06, 5.807727575302124e-06, 7.063150405883789e-06, 8.318573236465454e-06, 9.573996067047119e-06, 1.0829418897628784e-05, 1.208484172821045e-05, 1.3340264558792114e-05, 1.459568738937378e-05, 1.5851110219955444e-05, 1.710653305053711e-05, 1.8361955881118774e-05, 1.961737871170044e-05, 2.0872801542282104e-05, 2.212822437286377e-05, 2.3383647203445435e-05, 2.46390700340271e-05, 2.5894492864608765e-05, 2.714991569519043e-05, 2.8405338525772095e-05, 2.966076135635376e-05, 3.0916184186935425e-05, 3.217160701751709e-05, 3.3427029848098755e-05, 3.468245267868042e-05, 3.5937875509262085e-05, 3.719329833984375e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 9.0, 10.0, 10.0, 19.0, 17.0, 45.0, 40.0, 73.0, 110.0, 196.0, 299.0, 573.0, 933.0, 2031.0, 4291.0, 10943.0, 32237.0, 124765.0, 556415.0, 235372.0, 52420.0, 16053.0, 6121.0, 2563.0, 1314.0, 673.0, 405.0, 217.0, 116.0, 80.0, 52.0, 39.0, 38.0, 21.0, 14.0, 9.0, 8.0, 6.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.121337890625, -0.11710929870605469, -0.11288070678710938, -0.10865211486816406, -0.10442352294921875, -0.10019493103027344, -0.09596633911132812, -0.09173774719238281, -0.0875091552734375, -0.08328056335449219, -0.07905197143554688, -0.07482337951660156, -0.07059478759765625, -0.06636619567871094, -0.062137603759765625, -0.05790901184082031, -0.053680419921875, -0.04945182800292969, -0.045223236083984375, -0.04099464416503906, -0.03676605224609375, -0.03253746032714844, -0.028308868408203125, -0.024080276489257812, -0.0198516845703125, -0.015623092651367188, -0.011394500732421875, -0.0071659088134765625, -0.00293731689453125, 0.0012912750244140625, 0.005519866943359375, 0.009748458862304688, 0.01397705078125, 0.018205642700195312, 0.022434234619140625, 0.026662826538085938, 0.03089141845703125, 0.03512001037597656, 0.039348602294921875, 0.04357719421386719, 0.0478057861328125, 0.05203437805175781, 0.056262969970703125, 0.06049156188964844, 0.06472015380859375, 0.06894874572753906, 0.07317733764648438, 0.07740592956542969, 0.081634521484375, 0.08586311340332031, 0.09009170532226562, 0.09432029724121094, 0.09854888916015625, 0.10277748107910156, 0.10700607299804688, 0.11123466491699219, 0.1154632568359375, 0.11969184875488281, 0.12392044067382812, 0.12814903259277344, 0.13237762451171875, 0.13660621643066406, 0.14083480834960938, 0.1450634002685547, 0.1492919921875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 6.0, 10.0, 8.0, 7.0, 11.0, 24.0, 24.0, 34.0, 38.0, 44.0, 71.0, 83.0, 112.0, 120.0, 85.0, 61.0, 56.0, 42.0, 44.0, 29.0, 18.0, 19.0, 21.0, 7.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07562255859375, -0.07302379608154297, -0.07042503356933594, -0.0678262710571289, -0.06522750854492188, -0.06262874603271484, -0.06002998352050781, -0.05743122100830078, -0.05483245849609375, -0.05223369598388672, -0.04963493347167969, -0.047036170959472656, -0.044437408447265625, -0.041838645935058594, -0.03923988342285156, -0.03664112091064453, -0.0340423583984375, -0.03144359588623047, -0.028844833374023438, -0.026246070861816406, -0.023647308349609375, -0.021048545837402344, -0.018449783325195312, -0.01585102081298828, -0.01325225830078125, -0.010653495788574219, -0.008054733276367188, -0.005455970764160156, -0.002857208251953125, -0.00025844573974609375, 0.0023403167724609375, 0.004939079284667969, 0.007537841796875, 0.010136604309082031, 0.012735366821289062, 0.015334129333496094, 0.017932891845703125, 0.020531654357910156, 0.023130416870117188, 0.02572917938232422, 0.02832794189453125, 0.03092670440673828, 0.03352546691894531, 0.036124229431152344, 0.038722991943359375, 0.041321754455566406, 0.04392051696777344, 0.04651927947998047, 0.0491180419921875, 0.05171680450439453, 0.05431556701660156, 0.056914329528808594, 0.059513092041015625, 0.062111854553222656, 0.06471061706542969, 0.06730937957763672, 0.06990814208984375, 0.07250690460205078, 0.07510566711425781, 0.07770442962646484, 0.08030319213867188, 0.0829019546508789, 0.08550071716308594, 0.08809947967529297, 0.0906982421875]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 12.0, 22.0, 36.0, 78.0, 196.0, 278.0, 192.0, 101.0, 35.0, 27.0, 7.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8401881456375122, -1.7460123300552368, -1.6518365144729614, -1.557660698890686, -1.4634848833084106, -1.3693090677261353, -1.2751331329345703, -1.180957317352295, -1.0867815017700195, -0.9926056861877441, -0.8984298706054688, -0.8042540550231934, -0.710078239440918, -0.6159024238586426, -0.5217265486717224, -0.427550733089447, -0.3333749771118164, -0.23919916152954102, -0.14502333104610443, -0.05084750056266785, 0.043328315019607544, 0.13750413060188293, 0.2316799759864807, 0.3258557915687561, 0.4200316071510315, 0.5142074227333069, 0.6083832383155823, 0.7025591135025024, 0.7967349290847778, 0.8909107446670532, 0.9850865602493286, 1.079262375831604, 1.173438310623169, 1.2676141262054443, 1.3617899417877197, 1.4559657573699951, 1.5501415729522705, 1.644317388534546, 1.7384932041168213, 1.8326690196990967, 1.926844835281372, 2.0210206508636475, 2.115196466445923, 2.2093722820281982, 2.3035480976104736, 2.397723913192749, 2.4918997287750244, 2.5860755443573, 2.6802515983581543, 2.7744274139404297, 2.868603229522705, 2.9627790451049805, 3.056954860687256, 3.1511306762695312, 3.2453064918518066, 3.339482307434082, 3.4336581230163574, 3.527833938598633, 3.622009754180908, 3.7161855697631836, 3.810361385345459, 3.9045372009277344, 3.9987130165100098, 4.092888832092285, 4.1870646476745605]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 16.0, 16.0, 18.0, 23.0, 14.0, 37.0, 22.0, 23.0, 35.0, 36.0, 43.0, 47.0, 51.0, 51.0, 47.0, 53.0, 60.0, 48.0, 53.0, 39.0, 38.0, 33.0, 32.0, 30.0, 26.0, 27.0, 12.0, 10.0, 15.0, 11.0, 6.0, 7.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1416618824005127, -2.082296848297119, -2.0229318141937256, -1.963566780090332, -1.9042017459869385, -1.844836711883545, -1.7854716777801514, -1.7261066436767578, -1.6667416095733643, -1.6073765754699707, -1.5480115413665771, -1.4886465072631836, -1.42928147315979, -1.3699164390563965, -1.310551404953003, -1.2511863708496094, -1.1918213367462158, -1.1324563026428223, -1.0730912685394287, -1.0137262344360352, -0.9543612003326416, -0.894996166229248, -0.8356311321258545, -0.7762660980224609, -0.7169011831283569, -0.6575361490249634, -0.5981711149215698, -0.5388060808181763, -0.4794410467147827, -0.42007604241371155, -0.360711008310318, -0.30134597420692444, -0.2419809103012085, -0.18261587619781494, -0.12325084954500198, -0.06388582289218903, -0.004520788788795471, 0.05484423041343689, 0.11420926451683044, 0.173574298620224, 0.23293933272361755, 0.2923043668270111, 0.35166940093040466, 0.41103440523147583, 0.4703994393348694, 0.5297644734382629, 0.5891295075416565, 0.64849454164505, 0.7078595757484436, 0.7672246098518372, 0.8265896439552307, 0.8859546780586243, 0.9453197121620178, 1.0046846866607666, 1.0640497207641602, 1.1234147548675537, 1.1827797889709473, 1.2421448230743408, 1.3015098571777344, 1.360874891281128, 1.4202399253845215, 1.479604959487915, 1.5389699935913086, 1.5983350276947021, 1.6577000617980957]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 8.0, 10.0, 28.0, 25.0, 55.0, 82.0, 155.0, 250.0, 466.0, 944.0, 1803.0, 4075.0, 11230.0, 46526.0, 418437.0, 3333933.0, 318048.0, 40709.0, 10204.0, 3697.0, 1714.0, 825.0, 424.0, 250.0, 148.0, 97.0, 59.0, 37.0, 25.0, 12.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6289443969726562, -0.6021270751953125, -0.5753097534179688, -0.548492431640625, -0.5216751098632812, -0.4948577880859375, -0.46804046630859375, -0.44122314453125, -0.41440582275390625, -0.3875885009765625, -0.36077117919921875, -0.333953857421875, -0.30713653564453125, -0.2803192138671875, -0.25350189208984375, -0.2266845703125, -0.19986724853515625, -0.1730499267578125, -0.14623260498046875, -0.119415283203125, -0.09259796142578125, -0.0657806396484375, -0.03896331787109375, -0.01214599609375, 0.01467132568359375, 0.0414886474609375, 0.06830596923828125, 0.095123291015625, 0.12194061279296875, 0.1487579345703125, 0.17557525634765625, 0.202392578125, 0.22920989990234375, 0.2560272216796875, 0.28284454345703125, 0.309661865234375, 0.33647918701171875, 0.3632965087890625, 0.39011383056640625, 0.41693115234375, 0.44374847412109375, 0.4705657958984375, 0.49738311767578125, 0.524200439453125, 0.5510177612304688, 0.5778350830078125, 0.6046524047851562, 0.6314697265625, 0.6582870483398438, 0.6851043701171875, 0.7119216918945312, 0.738739013671875, 0.7655563354492188, 0.7923736572265625, 0.8191909790039062, 0.84600830078125, 0.8728256225585938, 0.8996429443359375, 0.9264602661132812, 0.953277587890625, 0.9800949096679688, 1.0069122314453125, 1.0337295532226562, 1.060546875]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 13.0, 15.0, 10.0, 14.0, 19.0, 37.0, 37.0, 57.0, 64.0, 69.0, 62.0, 97.0, 78.0, 89.0, 62.0, 58.0, 46.0, 34.0, 26.0, 16.0, 15.0, 21.0, 10.0, 9.0, 8.0, 2.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68798828125, -0.6675872802734375, -0.647186279296875, -0.6267852783203125, -0.60638427734375, -0.5859832763671875, -0.565582275390625, -0.5451812744140625, -0.5247802734375, -0.5043792724609375, -0.483978271484375, -0.4635772705078125, -0.44317626953125, -0.4227752685546875, -0.402374267578125, -0.3819732666015625, -0.361572265625, -0.3411712646484375, -0.320770263671875, -0.3003692626953125, -0.27996826171875, -0.2595672607421875, -0.239166259765625, -0.2187652587890625, -0.1983642578125, -0.1779632568359375, -0.157562255859375, -0.1371612548828125, -0.11676025390625, -0.0963592529296875, -0.075958251953125, -0.0555572509765625, -0.03515625, -0.0147552490234375, 0.005645751953125, 0.0260467529296875, 0.04644775390625, 0.0668487548828125, 0.087249755859375, 0.1076507568359375, 0.1280517578125, 0.1484527587890625, 0.168853759765625, 0.1892547607421875, 0.20965576171875, 0.2300567626953125, 0.250457763671875, 0.2708587646484375, 0.291259765625, 0.3116607666015625, 0.332061767578125, 0.3524627685546875, 0.37286376953125, 0.3932647705078125, 0.413665771484375, 0.4340667724609375, 0.4544677734375, 0.4748687744140625, 0.495269775390625, 0.5156707763671875, 0.53607177734375, 0.5564727783203125, 0.576873779296875, 0.5972747802734375, 0.61767578125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 2.0, 0.0, 7.0, 6.0, 6.0, 9.0, 15.0, 21.0, 23.0, 54.0, 60.0, 105.0, 193.0, 425.0, 927.0, 2481.0, 8566.0, 49330.0, 1263304.0, 2784622.0, 68354.0, 10685.0, 2977.0, 1100.0, 455.0, 221.0, 133.0, 68.0, 50.0, 33.0, 21.0, 10.0, 6.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72314453125, -0.6918106079101562, -0.6604766845703125, -0.6291427612304688, -0.597808837890625, -0.5664749145507812, -0.5351409912109375, -0.5038070678710938, -0.47247314453125, -0.44113922119140625, -0.4098052978515625, -0.37847137451171875, -0.347137451171875, -0.31580352783203125, -0.2844696044921875, -0.25313568115234375, -0.2218017578125, -0.19046783447265625, -0.1591339111328125, -0.12779998779296875, -0.096466064453125, -0.06513214111328125, -0.0337982177734375, -0.00246429443359375, 0.02886962890625, 0.06020355224609375, 0.0915374755859375, 0.12287139892578125, 0.154205322265625, 0.18553924560546875, 0.2168731689453125, 0.24820709228515625, 0.279541015625, 0.31087493896484375, 0.3422088623046875, 0.37354278564453125, 0.404876708984375, 0.43621063232421875, 0.4675445556640625, 0.49887847900390625, 0.53021240234375, 0.5615463256835938, 0.5928802490234375, 0.6242141723632812, 0.655548095703125, 0.6868820190429688, 0.7182159423828125, 0.7495498657226562, 0.7808837890625, 0.8122177124023438, 0.8435516357421875, 0.8748855590820312, 0.906219482421875, 0.9375534057617188, 0.9688873291015625, 1.0002212524414062, 1.03155517578125, 1.0628890991210938, 1.0942230224609375, 1.1255569458007812, 1.156890869140625, 1.1882247924804688, 1.2195587158203125, 1.2508926391601562, 1.2822265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 10.0, 5.0, 13.0, 34.0, 40.0, 60.0, 102.0, 130.0, 244.0, 481.0, 922.0, 873.0, 503.0, 234.0, 153.0, 81.0, 50.0, 34.0, 28.0, 17.0, 12.0, 12.0, 12.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259033203125, -0.2511730194091797, -0.24331283569335938, -0.23545265197753906, -0.22759246826171875, -0.21973228454589844, -0.21187210083007812, -0.2040119171142578, -0.1961517333984375, -0.1882915496826172, -0.18043136596679688, -0.17257118225097656, -0.16471099853515625, -0.15685081481933594, -0.14899063110351562, -0.1411304473876953, -0.133270263671875, -0.1254100799560547, -0.11754989624023438, -0.10968971252441406, -0.10182952880859375, -0.09396934509277344, -0.08610916137695312, -0.07824897766113281, -0.0703887939453125, -0.06252861022949219, -0.054668426513671875, -0.04680824279785156, -0.03894805908203125, -0.031087875366210938, -0.023227691650390625, -0.015367507934570312, -0.00750732421875, 0.0003528594970703125, 0.008213043212890625, 0.016073226928710938, 0.02393341064453125, 0.03179359436035156, 0.039653778076171875, 0.04751396179199219, 0.0553741455078125, 0.06323432922363281, 0.07109451293945312, 0.07895469665527344, 0.08681488037109375, 0.09467506408691406, 0.10253524780273438, 0.11039543151855469, 0.118255615234375, 0.1261157989501953, 0.13397598266601562, 0.14183616638183594, 0.14969635009765625, 0.15755653381347656, 0.16541671752929688, 0.1732769012451172, 0.1811370849609375, 0.1889972686767578, 0.19685745239257812, 0.20471763610839844, 0.21257781982421875, 0.22043800354003906, 0.22829818725585938, 0.2361583709716797, 0.2440185546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 11.0, 7.0, 31.0, 29.0, 55.0, 83.0, 126.0, 156.0, 150.0, 135.0, 72.0, 46.0, 33.0, 13.0, 13.0, 9.0, 5.0, 5.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4888819456100464, -1.4494564533233643, -1.4100308418273926, -1.3706053495407104, -1.3311798572540283, -1.2917542457580566, -1.2523287534713745, -1.2129032611846924, -1.1734776496887207, -1.1340521574020386, -1.094626545906067, -1.0552010536193848, -1.0157755613327026, -0.9763500094413757, -0.9369244575500488, -0.8974989652633667, -0.8580734729766846, -0.8186479210853577, -0.7792224287986755, -0.7397968769073486, -0.7003713846206665, -0.6609458327293396, -0.6215202808380127, -0.5820947885513306, -0.5426692366600037, -0.5032436847686768, -0.46381819248199463, -0.4243926405906677, -0.3849671185016632, -0.3455415964126587, -0.3061160445213318, -0.26669052243232727, -0.2272651195526123, -0.1878395974636078, -0.14841406047344208, -0.10898853093385696, -0.06956300139427185, -0.030137479305267334, 0.009288057684898376, 0.04871359467506409, 0.0881391167640686, 0.12756463885307312, 0.16699017584323883, 0.20641571283340454, 0.24584123492240906, 0.2852667570114136, 0.3246923089027405, 0.364117830991745, 0.4035433530807495, 0.44296887516975403, 0.48239439725875854, 0.5218199491500854, 0.5612454414367676, 0.6006709933280945, 0.6400965452194214, 0.6795220375061035, 0.7189475893974304, 0.7583731412887573, 0.7977986335754395, 0.8372241854667664, 0.8766497373580933, 0.9160752296447754, 0.9555007815361023, 0.9949263334274292, 1.0343518257141113]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 2.0, 8.0, 10.0, 12.0, 11.0, 16.0, 30.0, 25.0, 31.0, 41.0, 38.0, 54.0, 64.0, 61.0, 63.0, 74.0, 66.0, 59.0, 57.0, 42.0, 41.0, 38.0, 34.0, 28.0, 17.0, 17.0, 12.0, 7.0, 10.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6819748282432556, -0.6619782447814941, -0.6419816017150879, -0.6219850182533264, -0.6019884347915649, -0.5819917917251587, -0.5619952082633972, -0.5419986248016357, -0.5220019817352295, -0.502005398273468, -0.48200878500938416, -0.4620121717453003, -0.4420155882835388, -0.42201897501945496, -0.4020223617553711, -0.3820257782936096, -0.36202919483184814, -0.3420325815677643, -0.3220359981060028, -0.30203938484191895, -0.28204280138015747, -0.2620461881160736, -0.24204957485198975, -0.22205297648906708, -0.2020563781261444, -0.18205977976322174, -0.16206318140029907, -0.1420665681362152, -0.12206996977329254, -0.10207337141036987, -0.08207676559686661, -0.06208015978336334, -0.04208362102508545, -0.022087018936872482, -0.0020904168486595154, 0.01790618523955345, 0.03790278732776642, 0.05789938569068909, 0.07789599150419235, 0.09789259731769562, 0.11788919568061829, 0.13788579404354095, 0.15788239240646362, 0.17787900567054749, 0.19787560403347015, 0.21787220239639282, 0.23786881566047668, 0.25786542892456055, 0.277862012386322, 0.2978586256504059, 0.31785520911216736, 0.3378518223762512, 0.3578484058380127, 0.37784501910209656, 0.3978416323661804, 0.4178382158279419, 0.43783482909202576, 0.4578314423561096, 0.4778280258178711, 0.49782463908195496, 0.5178212523460388, 0.5378178358078003, 0.5578144192695618, 0.577811062335968, 0.5978076457977295]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 11.0, 10.0, 16.0, 27.0, 62.0, 79.0, 131.0, 172.0, 318.0, 499.0, 871.0, 1604.0, 3170.0, 6411.0, 15378.0, 39835.0, 125077.0, 369207.0, 324075.0, 102771.0, 33806.0, 13221.0, 5653.0, 2627.0, 1463.0, 832.0, 497.0, 265.0, 139.0, 94.0, 67.0, 51.0, 26.0, 16.0, 18.0, 11.0, 12.0, 8.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.1009521484375, -0.0979757308959961, -0.09499931335449219, -0.09202289581298828, -0.08904647827148438, -0.08607006072998047, -0.08309364318847656, -0.08011722564697266, -0.07714080810546875, -0.07416439056396484, -0.07118797302246094, -0.06821155548095703, -0.06523513793945312, -0.06225872039794922, -0.05928230285644531, -0.056305885314941406, -0.0533294677734375, -0.050353050231933594, -0.04737663269042969, -0.04440021514892578, -0.041423797607421875, -0.03844738006591797, -0.03547096252441406, -0.032494544982910156, -0.02951812744140625, -0.026541709899902344, -0.023565292358398438, -0.02058887481689453, -0.017612457275390625, -0.014636039733886719, -0.011659622192382812, -0.008683204650878906, -0.005706787109375, -0.0027303695678710938, 0.0002460479736328125, 0.0032224655151367188, 0.006198883056640625, 0.009175300598144531, 0.012151718139648438, 0.015128135681152344, 0.01810455322265625, 0.021080970764160156, 0.024057388305664062, 0.02703380584716797, 0.030010223388671875, 0.03298664093017578, 0.03596305847167969, 0.038939476013183594, 0.0419158935546875, 0.044892311096191406, 0.04786872863769531, 0.05084514617919922, 0.053821563720703125, 0.05679798126220703, 0.05977439880371094, 0.06275081634521484, 0.06572723388671875, 0.06870365142822266, 0.07168006896972656, 0.07465648651123047, 0.07763290405273438, 0.08060932159423828, 0.08358573913574219, 0.0865621566772461, 0.08953857421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 6.0, 9.0, 11.0, 10.0, 12.0, 11.0, 30.0, 40.0, 39.0, 53.0, 63.0, 84.0, 89.0, 78.0, 78.0, 77.0, 77.0, 52.0, 52.0, 29.0, 32.0, 20.0, 13.0, 10.0, 5.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6181640625, -0.6002120971679688, -0.5822601318359375, -0.5643081665039062, -0.546356201171875, -0.5284042358398438, -0.5104522705078125, -0.49250030517578125, -0.47454833984375, -0.45659637451171875, -0.4386444091796875, -0.42069244384765625, -0.402740478515625, -0.38478851318359375, -0.3668365478515625, -0.34888458251953125, -0.3309326171875, -0.31298065185546875, -0.2950286865234375, -0.27707672119140625, -0.259124755859375, -0.24117279052734375, -0.2232208251953125, -0.20526885986328125, -0.18731689453125, -0.16936492919921875, -0.1514129638671875, -0.13346099853515625, -0.115509033203125, -0.09755706787109375, -0.0796051025390625, -0.06165313720703125, -0.043701171875, -0.02574920654296875, -0.0077972412109375, 0.01015472412109375, 0.028106689453125, 0.04605865478515625, 0.0640106201171875, 0.08196258544921875, 0.09991455078125, 0.11786651611328125, 0.1358184814453125, 0.15377044677734375, 0.171722412109375, 0.18967437744140625, 0.2076263427734375, 0.22557830810546875, 0.2435302734375, 0.26148223876953125, 0.2794342041015625, 0.29738616943359375, 0.315338134765625, 0.33329010009765625, 0.3512420654296875, 0.36919403076171875, 0.38714599609375, 0.40509796142578125, 0.4230499267578125, 0.44100189208984375, 0.458953857421875, 0.47690582275390625, 0.4948577880859375, 0.5128097534179688, 0.53076171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 5.0, 7.0, 10.0, 3.0, 16.0, 9.0, 10.0, 14.0, 30.0, 40.0, 43.0, 67.0, 71.0, 120.0, 187.0, 239.0, 423.0, 741.0, 1355.0, 2850.0, 7076.0, 20028.0, 70396.0, 284454.0, 450341.0, 151772.0, 37681.0, 11554.0, 4429.0, 1956.0, 1001.0, 514.0, 360.0, 229.0, 135.0, 107.0, 61.0, 38.0, 33.0, 26.0, 18.0, 15.0, 15.0, 12.0, 13.0, 6.0, 11.0, 9.0, 4.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.088623046875, -0.08587646484375, -0.0831298828125, -0.08038330078125, -0.07763671875, -0.07489013671875, -0.0721435546875, -0.06939697265625, -0.066650390625, -0.06390380859375, -0.0611572265625, -0.05841064453125, -0.0556640625, -0.05291748046875, -0.0501708984375, -0.04742431640625, -0.044677734375, -0.04193115234375, -0.0391845703125, -0.03643798828125, -0.03369140625, -0.03094482421875, -0.0281982421875, -0.02545166015625, -0.022705078125, -0.01995849609375, -0.0172119140625, -0.01446533203125, -0.01171875, -0.00897216796875, -0.0062255859375, -0.00347900390625, -0.000732421875, 0.00201416015625, 0.0047607421875, 0.00750732421875, 0.01025390625, 0.01300048828125, 0.0157470703125, 0.01849365234375, 0.021240234375, 0.02398681640625, 0.0267333984375, 0.02947998046875, 0.0322265625, 0.03497314453125, 0.0377197265625, 0.04046630859375, 0.043212890625, 0.04595947265625, 0.0487060546875, 0.05145263671875, 0.05419921875, 0.05694580078125, 0.0596923828125, 0.06243896484375, 0.065185546875, 0.06793212890625, 0.0706787109375, 0.07342529296875, 0.076171875, 0.07891845703125, 0.0816650390625, 0.08441162109375, 0.087158203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 4.0, 2.0, 6.0, 9.0, 7.0, 5.0, 10.0, 12.0, 4.0, 10.0, 21.0, 23.0, 29.0, 27.0, 22.0, 32.0, 35.0, 31.0, 43.0, 35.0, 45.0, 43.0, 53.0, 58.0, 42.0, 35.0, 36.0, 40.0, 30.0, 34.0, 33.0, 29.0, 25.0, 25.0, 13.0, 23.0, 11.0, 10.0, 17.0, 8.0, 7.0, 3.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.71240234375, -0.6925582885742188, -0.6727142333984375, -0.6528701782226562, -0.633026123046875, -0.6131820678710938, -0.5933380126953125, -0.5734939575195312, -0.55364990234375, -0.5338058471679688, -0.5139617919921875, -0.49411773681640625, -0.474273681640625, -0.45442962646484375, -0.4345855712890625, -0.41474151611328125, -0.3948974609375, -0.37505340576171875, -0.3552093505859375, -0.33536529541015625, -0.315521240234375, -0.29567718505859375, -0.2758331298828125, -0.25598907470703125, -0.23614501953125, -0.21630096435546875, -0.1964569091796875, -0.17661285400390625, -0.156768798828125, -0.13692474365234375, -0.1170806884765625, -0.09723663330078125, -0.077392578125, -0.05754852294921875, -0.0377044677734375, -0.01786041259765625, 0.001983642578125, 0.02182769775390625, 0.0416717529296875, 0.06151580810546875, 0.08135986328125, 0.10120391845703125, 0.1210479736328125, 0.14089202880859375, 0.160736083984375, 0.18058013916015625, 0.2004241943359375, 0.22026824951171875, 0.2401123046875, 0.25995635986328125, 0.2798004150390625, 0.29964447021484375, 0.319488525390625, 0.33933258056640625, 0.3591766357421875, 0.37902069091796875, 0.39886474609375, 0.41870880126953125, 0.4385528564453125, 0.45839691162109375, 0.478240966796875, 0.49808502197265625, 0.5179290771484375, 0.5377731323242188, 0.5576171875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 6.0, 9.0, 15.0, 14.0, 31.0, 46.0, 57.0, 99.0, 156.0, 218.0, 367.0, 628.0, 1294.0, 2753.0, 6882.0, 23394.0, 118454.0, 599176.0, 238740.0, 38731.0, 10176.0, 3768.0, 1578.0, 814.0, 401.0, 254.0, 156.0, 100.0, 61.0, 51.0, 25.0, 20.0, 26.0, 7.0, 9.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044219970703125, -0.04277849197387695, -0.041337013244628906, -0.03989553451538086, -0.03845405578613281, -0.037012577056884766, -0.03557109832763672, -0.03412961959838867, -0.032688140869140625, -0.031246662139892578, -0.02980518341064453, -0.028363704681396484, -0.026922225952148438, -0.02548074722290039, -0.024039268493652344, -0.022597789764404297, -0.02115631103515625, -0.019714832305908203, -0.018273353576660156, -0.01683187484741211, -0.015390396118164062, -0.013948917388916016, -0.012507438659667969, -0.011065959930419922, -0.009624481201171875, -0.008183002471923828, -0.006741523742675781, -0.005300045013427734, -0.0038585662841796875, -0.0024170875549316406, -0.0009756088256835938, 0.0004658699035644531, 0.0019073486328125, 0.003348827362060547, 0.004790306091308594, 0.006231784820556641, 0.0076732635498046875, 0.009114742279052734, 0.010556221008300781, 0.011997699737548828, 0.013439178466796875, 0.014880657196044922, 0.01632213592529297, 0.017763614654541016, 0.019205093383789062, 0.02064657211303711, 0.022088050842285156, 0.023529529571533203, 0.02497100830078125, 0.026412487030029297, 0.027853965759277344, 0.02929544448852539, 0.030736923217773438, 0.032178401947021484, 0.03361988067626953, 0.03506135940551758, 0.036502838134765625, 0.03794431686401367, 0.03938579559326172, 0.040827274322509766, 0.04226875305175781, 0.04371023178100586, 0.045151710510253906, 0.04659318923950195, 0.04803466796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 4.0, 20.0, 21.0, 48.0, 50.0, 75.0, 81.0, 115.0, 104.0, 106.0, 96.0, 82.0, 49.0, 50.0, 34.0, 16.0, 10.0, 11.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6404857635498047e-05, -2.557411789894104e-05, -2.4743378162384033e-05, -2.3912638425827026e-05, -2.308189868927002e-05, -2.2251158952713013e-05, -2.1420419216156006e-05, -2.0589679479599e-05, -1.9758939743041992e-05, -1.8928200006484985e-05, -1.809746026992798e-05, -1.726672053337097e-05, -1.6435980796813965e-05, -1.5605241060256958e-05, -1.4774501323699951e-05, -1.3943761587142944e-05, -1.3113021850585938e-05, -1.228228211402893e-05, -1.1451542377471924e-05, -1.0620802640914917e-05, -9.79006290435791e-06, -8.959323167800903e-06, -8.128583431243896e-06, -7.29784369468689e-06, -6.467103958129883e-06, -5.636364221572876e-06, -4.805624485015869e-06, -3.974884748458862e-06, -3.1441450119018555e-06, -2.3134052753448486e-06, -1.4826655387878418e-06, -6.51925802230835e-07, 1.7881393432617188e-07, 1.0095536708831787e-06, 1.8402934074401855e-06, 2.6710331439971924e-06, 3.5017728805541992e-06, 4.332512617111206e-06, 5.163252353668213e-06, 5.99399209022522e-06, 6.8247318267822266e-06, 7.655471563339233e-06, 8.48621129989624e-06, 9.316951036453247e-06, 1.0147690773010254e-05, 1.097843050956726e-05, 1.1809170246124268e-05, 1.2639909982681274e-05, 1.3470649719238281e-05, 1.4301389455795288e-05, 1.5132129192352295e-05, 1.5962868928909302e-05, 1.679360866546631e-05, 1.7624348402023315e-05, 1.8455088138580322e-05, 1.928582787513733e-05, 2.0116567611694336e-05, 2.0947307348251343e-05, 2.177804708480835e-05, 2.2608786821365356e-05, 2.3439526557922363e-05, 2.427026629447937e-05, 2.5101006031036377e-05, 2.5931745767593384e-05, 2.676248550415039e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 7.0, 3.0, 5.0, 7.0, 16.0, 19.0, 24.0, 37.0, 54.0, 89.0, 110.0, 198.0, 371.0, 748.0, 1432.0, 3269.0, 8653.0, 26381.0, 97631.0, 372681.0, 388951.0, 103929.0, 27993.0, 9305.0, 3429.0, 1508.0, 695.0, 395.0, 208.0, 133.0, 96.0, 54.0, 32.0, 35.0, 20.0, 8.0, 5.0, 8.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.04296875, -0.041808128356933594, -0.04064750671386719, -0.03948688507080078, -0.038326263427734375, -0.03716564178466797, -0.03600502014160156, -0.034844398498535156, -0.03368377685546875, -0.032523155212402344, -0.03136253356933594, -0.03020191192626953, -0.029041290283203125, -0.02788066864013672, -0.026720046997070312, -0.025559425354003906, -0.0243988037109375, -0.023238182067871094, -0.022077560424804688, -0.02091693878173828, -0.019756317138671875, -0.01859569549560547, -0.017435073852539062, -0.016274452209472656, -0.01511383056640625, -0.013953208923339844, -0.012792587280273438, -0.011631965637207031, -0.010471343994140625, -0.009310722351074219, -0.008150100708007812, -0.006989479064941406, -0.005828857421875, -0.004668235778808594, -0.0035076141357421875, -0.0023469924926757812, -0.001186370849609375, -2.574920654296875e-05, 0.0011348724365234375, 0.0022954940795898438, 0.00345611572265625, 0.004616737365722656, 0.0057773590087890625, 0.006937980651855469, 0.008098602294921875, 0.009259223937988281, 0.010419845581054688, 0.011580467224121094, 0.0127410888671875, 0.013901710510253906, 0.015062332153320312, 0.01622295379638672, 0.017383575439453125, 0.01854419708251953, 0.019704818725585938, 0.020865440368652344, 0.02202606201171875, 0.023186683654785156, 0.024347305297851562, 0.02550792694091797, 0.026668548583984375, 0.02782917022705078, 0.028989791870117188, 0.030150413513183594, 0.03131103515625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 7.0, 8.0, 7.0, 10.0, 12.0, 17.0, 27.0, 23.0, 40.0, 45.0, 63.0, 70.0, 83.0, 87.0, 86.0, 99.0, 62.0, 51.0, 50.0, 35.0, 25.0, 28.0, 12.0, 14.0, 9.0, 9.0, 10.0, 2.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00753021240234375, -0.007199764251708984, -0.006869316101074219, -0.006538867950439453, -0.0062084197998046875, -0.005877971649169922, -0.005547523498535156, -0.005217075347900391, -0.004886627197265625, -0.004556179046630859, -0.004225730895996094, -0.003895282745361328, -0.0035648345947265625, -0.003234386444091797, -0.0029039382934570312, -0.0025734901428222656, -0.0022430419921875, -0.0019125938415527344, -0.0015821456909179688, -0.0012516975402832031, -0.0009212493896484375, -0.0005908012390136719, -0.00026035308837890625, 7.009506225585938e-05, 0.000400543212890625, 0.0007309913635253906, 0.0010614395141601562, 0.0013918876647949219, 0.0017223358154296875, 0.002052783966064453, 0.0023832321166992188, 0.0027136802673339844, 0.00304412841796875, 0.0033745765686035156, 0.0037050247192382812, 0.004035472869873047, 0.0043659210205078125, 0.004696369171142578, 0.005026817321777344, 0.005357265472412109, 0.005687713623046875, 0.006018161773681641, 0.006348609924316406, 0.006679058074951172, 0.0070095062255859375, 0.007339954376220703, 0.007670402526855469, 0.008000850677490234, 0.008331298828125, 0.008661746978759766, 0.008992195129394531, 0.009322643280029297, 0.009653091430664062, 0.009983539581298828, 0.010313987731933594, 0.01064443588256836, 0.010974884033203125, 0.01130533218383789, 0.011635780334472656, 0.011966228485107422, 0.012296676635742188, 0.012627124786376953, 0.012957572937011719, 0.013288021087646484, 0.01361846923828125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 7.0, 15.0, 23.0, 41.0, 73.0, 133.0, 202.0, 218.0, 129.0, 56.0, 42.0, 21.0, 14.0, 5.0, 8.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3471403121948242, -1.3125070333480835, -1.2778738737106323, -1.2432405948638916, -1.2086074352264404, -1.1739741563796997, -1.139340877532959, -1.1047077178955078, -1.070074439048767, -1.0354411602020264, -1.0008080005645752, -0.9661747217178345, -0.9315415024757385, -0.8969082832336426, -0.8622750639915466, -0.8276418447494507, -0.7930086255073547, -0.7583754062652588, -0.7237421870231628, -0.6891089677810669, -0.6544756889343262, -0.6198424696922302, -0.5852092504501343, -0.5505760312080383, -0.5159428119659424, -0.48130959272384644, -0.4466763436794281, -0.41204312443733215, -0.3774098753929138, -0.34277665615081787, -0.3081434369087219, -0.273510217666626, -0.23887693881988525, -0.2042437046766281, -0.16961047053337097, -0.13497725129127502, -0.10034401714801788, -0.06571078300476074, -0.031077563762664795, 0.003555670380592346, 0.03818890452384949, 0.07282213866710663, 0.10745536535978317, 0.14208859205245972, 0.17672182619571686, 0.211355060338974, 0.24598827958106995, 0.2806215286254883, 0.31525474786758423, 0.3498879671096802, 0.3845212161540985, 0.41915443539619446, 0.4537876844406128, 0.48842090368270874, 0.5230541229248047, 0.5576873421669006, 0.5923205614089966, 0.6269537806510925, 0.6615869998931885, 0.6962202787399292, 0.7308534979820251, 0.7654867172241211, 0.800119936466217, 0.834753155708313, 0.8693864345550537]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 0.0, 5.0, 3.0, 4.0, 4.0, 4.0, 15.0, 9.0, 16.0, 13.0, 35.0, 27.0, 33.0, 40.0, 57.0, 67.0, 70.0, 72.0, 72.0, 80.0, 59.0, 66.0, 39.0, 46.0, 41.0, 31.0, 18.0, 19.0, 10.0, 11.0, 11.0, 5.0, 4.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5037251710891724, -0.48898470401763916, -0.47424423694610596, -0.45950376987457275, -0.44476330280303955, -0.43002283573150635, -0.41528236865997314, -0.40054190158843994, -0.38580143451690674, -0.37106096744537354, -0.35632050037384033, -0.34158003330230713, -0.3268395662307739, -0.3120990991592407, -0.2973586320877075, -0.2826181650161743, -0.2678777277469635, -0.2531372606754303, -0.2383967936038971, -0.2236563265323639, -0.2089158594608307, -0.19417539238929749, -0.17943494021892548, -0.16469447314739227, -0.14995400607585907, -0.13521353900432587, -0.12047307193279266, -0.10573261231184006, -0.09099214524030685, -0.07625167816877365, -0.061511218547821045, -0.04677075147628784, -0.032030314207077026, -0.017289848998188972, -0.0025493837893009186, 0.012191079556941986, 0.02693154662847519, 0.04167201370000839, 0.056412473320961, 0.0711529403924942, 0.0858934074640274, 0.10063387453556061, 0.11537434160709381, 0.13011479377746582, 0.14485526084899902, 0.15959572792053223, 0.17433619499206543, 0.18907666206359863, 0.20381712913513184, 0.21855759620666504, 0.23329806327819824, 0.24803853034973145, 0.26277899742126465, 0.27751946449279785, 0.29225993156433105, 0.30700039863586426, 0.32174086570739746, 0.33648133277893066, 0.35122179985046387, 0.36596226692199707, 0.3807027339935303, 0.3954432010650635, 0.4101836681365967, 0.4249241352081299, 0.4396645724773407]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 4.0, 9.0, 11.0, 22.0, 17.0, 33.0, 54.0, 58.0, 100.0, 139.0, 236.0, 394.0, 615.0, 1141.0, 2125.0, 4639.0, 11531.0, 43122.0, 463978.0, 456573.0, 42600.0, 11532.0, 4487.0, 2192.0, 1135.0, 671.0, 421.0, 245.0, 157.0, 119.0, 63.0, 32.0, 31.0, 21.0, 13.0, 15.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.5859375, -0.5687026977539062, -0.5514678955078125, -0.5342330932617188, -0.516998291015625, -0.49976348876953125, -0.4825286865234375, -0.46529388427734375, -0.44805908203125, -0.43082427978515625, -0.4135894775390625, -0.39635467529296875, -0.379119873046875, -0.36188507080078125, -0.3446502685546875, -0.32741546630859375, -0.3101806640625, -0.29294586181640625, -0.2757110595703125, -0.25847625732421875, -0.241241455078125, -0.22400665283203125, -0.2067718505859375, -0.18953704833984375, -0.17230224609375, -0.15506744384765625, -0.1378326416015625, -0.12059783935546875, -0.103363037109375, -0.08612823486328125, -0.0688934326171875, -0.05165863037109375, -0.034423828125, -0.01718902587890625, 4.57763671875e-05, 0.01728057861328125, 0.034515380859375, 0.05175018310546875, 0.0689849853515625, 0.08621978759765625, 0.10345458984375, 0.12068939208984375, 0.1379241943359375, 0.15515899658203125, 0.172393798828125, 0.18962860107421875, 0.2068634033203125, 0.22409820556640625, 0.2413330078125, 0.25856781005859375, 0.2758026123046875, 0.29303741455078125, 0.310272216796875, 0.32750701904296875, 0.3447418212890625, 0.36197662353515625, 0.37921142578125, 0.39644622802734375, 0.4136810302734375, 0.43091583251953125, 0.448150634765625, 0.46538543701171875, 0.4826202392578125, 0.49985504150390625, 0.51708984375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 5.0, 9.0, 19.0, 15.0, 30.0, 16.0, 26.0, 25.0, 50.0, 56.0, 74.0, 77.0, 81.0, 80.0, 77.0, 70.0, 64.0, 45.0, 39.0, 33.0, 26.0, 14.0, 16.0, 8.0, 7.0, 5.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.2021484375, -1.168548583984375, -1.13494873046875, -1.101348876953125, -1.0677490234375, -1.034149169921875, -1.00054931640625, -0.966949462890625, -0.933349609375, -0.899749755859375, -0.86614990234375, -0.832550048828125, -0.7989501953125, -0.765350341796875, -0.73175048828125, -0.698150634765625, -0.66455078125, -0.630950927734375, -0.59735107421875, -0.563751220703125, -0.5301513671875, -0.496551513671875, -0.46295166015625, -0.429351806640625, -0.395751953125, -0.362152099609375, -0.32855224609375, -0.294952392578125, -0.2613525390625, -0.227752685546875, -0.19415283203125, -0.160552978515625, -0.126953125, -0.093353271484375, -0.05975341796875, -0.026153564453125, 0.0074462890625, 0.041046142578125, 0.07464599609375, 0.108245849609375, 0.141845703125, 0.175445556640625, 0.20904541015625, 0.242645263671875, 0.2762451171875, 0.309844970703125, 0.34344482421875, 0.377044677734375, 0.41064453125, 0.444244384765625, 0.47784423828125, 0.511444091796875, 0.5450439453125, 0.578643798828125, 0.61224365234375, 0.645843505859375, 0.679443359375, 0.713043212890625, 0.74664306640625, 0.780242919921875, 0.8138427734375, 0.847442626953125, 0.88104248046875, 0.914642333984375, 0.9482421875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 4.0, 9.0, 27.0, 28.0, 41.0, 39.0, 90.0, 94.0, 190.0, 330.0, 509.0, 1006.0, 1979.0, 4515.0, 12906.0, 67973.0, 761098.0, 164654.0, 21171.0, 6438.0, 2517.0, 1204.0, 623.0, 390.0, 244.0, 171.0, 91.0, 65.0, 37.0, 35.0, 20.0, 11.0, 9.0, 5.0, 5.0, 1.0, 2.0, 6.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.515625, -0.5003128051757812, -0.4850006103515625, -0.46968841552734375, -0.454376220703125, -0.43906402587890625, -0.4237518310546875, -0.40843963623046875, -0.39312744140625, -0.37781524658203125, -0.3625030517578125, -0.34719085693359375, -0.331878662109375, -0.31656646728515625, -0.3012542724609375, -0.28594207763671875, -0.2706298828125, -0.25531768798828125, -0.2400054931640625, -0.22469329833984375, -0.209381103515625, -0.19406890869140625, -0.1787567138671875, -0.16344451904296875, -0.14813232421875, -0.13282012939453125, -0.1175079345703125, -0.10219573974609375, -0.086883544921875, -0.07157135009765625, -0.0562591552734375, -0.04094696044921875, -0.025634765625, -0.01032257080078125, 0.0049896240234375, 0.02030181884765625, 0.035614013671875, 0.05092620849609375, 0.0662384033203125, 0.08155059814453125, 0.09686279296875, 0.11217498779296875, 0.1274871826171875, 0.14279937744140625, 0.158111572265625, 0.17342376708984375, 0.1887359619140625, 0.20404815673828125, 0.2193603515625, 0.23467254638671875, 0.2499847412109375, 0.26529693603515625, 0.280609130859375, 0.29592132568359375, 0.3112335205078125, 0.32654571533203125, 0.34185791015625, 0.35717010498046875, 0.3724822998046875, 0.38779449462890625, 0.403106689453125, 0.41841888427734375, 0.4337310791015625, 0.44904327392578125, 0.46435546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 7.0, 5.0, 2.0, 3.0, 11.0, 7.0, 18.0, 13.0, 11.0, 17.0, 32.0, 30.0, 32.0, 39.0, 45.0, 35.0, 46.0, 54.0, 48.0, 71.0, 43.0, 53.0, 30.0, 46.0, 47.0, 49.0, 32.0, 42.0, 26.0, 22.0, 15.0, 11.0, 9.0, 21.0, 14.0, 6.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1328125, -1.10101318359375, -1.0692138671875, -1.03741455078125, -1.005615234375, -0.97381591796875, -0.9420166015625, -0.91021728515625, -0.87841796875, -0.84661865234375, -0.8148193359375, -0.78302001953125, -0.751220703125, -0.71942138671875, -0.6876220703125, -0.65582275390625, -0.6240234375, -0.59222412109375, -0.5604248046875, -0.52862548828125, -0.496826171875, -0.46502685546875, -0.4332275390625, -0.40142822265625, -0.36962890625, -0.33782958984375, -0.3060302734375, -0.27423095703125, -0.242431640625, -0.21063232421875, -0.1788330078125, -0.14703369140625, -0.115234375, -0.08343505859375, -0.0516357421875, -0.01983642578125, 0.011962890625, 0.04376220703125, 0.0755615234375, 0.10736083984375, 0.13916015625, 0.17095947265625, 0.2027587890625, 0.23455810546875, 0.266357421875, 0.29815673828125, 0.3299560546875, 0.36175537109375, 0.3935546875, 0.42535400390625, 0.4571533203125, 0.48895263671875, 0.520751953125, 0.55255126953125, 0.5843505859375, 0.61614990234375, 0.64794921875, 0.67974853515625, 0.7115478515625, 0.74334716796875, 0.775146484375, 0.80694580078125, 0.8387451171875, 0.87054443359375, 0.90234375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 8.0, 10.0, 2.0, 12.0, 13.0, 24.0, 42.0, 84.0, 110.0, 239.0, 489.0, 1160.0, 3376.0, 15690.0, 150773.0, 803528.0, 60459.0, 8637.0, 2275.0, 796.0, 400.0, 170.0, 120.0, 62.0, 27.0, 14.0, 16.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.192138671875, -0.18558692932128906, -0.17903518676757812, -0.1724834442138672, -0.16593170166015625, -0.1593799591064453, -0.15282821655273438, -0.14627647399902344, -0.1397247314453125, -0.13317298889160156, -0.12662124633789062, -0.12006950378417969, -0.11351776123046875, -0.10696601867675781, -0.10041427612304688, -0.09386253356933594, -0.087310791015625, -0.08075904846191406, -0.07420730590820312, -0.06765556335449219, -0.06110382080078125, -0.05455207824707031, -0.048000335693359375, -0.04144859313964844, -0.0348968505859375, -0.028345108032226562, -0.021793365478515625, -0.015241622924804688, -0.00868988037109375, -0.0021381378173828125, 0.004413604736328125, 0.010965347290039062, 0.01751708984375, 0.024068832397460938, 0.030620574951171875, 0.03717231750488281, 0.04372406005859375, 0.05027580261230469, 0.056827545166015625, 0.06337928771972656, 0.0699310302734375, 0.07648277282714844, 0.08303451538085938, 0.08958625793457031, 0.09613800048828125, 0.10268974304199219, 0.10924148559570312, 0.11579322814941406, 0.122344970703125, 0.12889671325683594, 0.13544845581054688, 0.1420001983642578, 0.14855194091796875, 0.1551036834716797, 0.16165542602539062, 0.16820716857910156, 0.1747589111328125, 0.18131065368652344, 0.18786239624023438, 0.1944141387939453, 0.20096588134765625, 0.2075176239013672, 0.21406936645507812, 0.22062110900878906, 0.2271728515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 4.0, 13.0, 14.0, 8.0, 16.0, 29.0, 40.0, 58.0, 88.0, 126.0, 215.0, 122.0, 96.0, 50.0, 27.0, 24.0, 22.0, 20.0, 6.0, 7.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.165006637573242e-05, -3.082677721977234e-05, -3.0003488063812256e-05, -2.9180198907852173e-05, -2.835690975189209e-05, -2.7533620595932007e-05, -2.6710331439971924e-05, -2.588704228401184e-05, -2.5063753128051758e-05, -2.4240463972091675e-05, -2.3417174816131592e-05, -2.259388566017151e-05, -2.1770596504211426e-05, -2.0947307348251343e-05, -2.012401819229126e-05, -1.9300729036331177e-05, -1.8477439880371094e-05, -1.765415072441101e-05, -1.6830861568450928e-05, -1.6007572412490845e-05, -1.5184283256530762e-05, -1.4360994100570679e-05, -1.3537704944610596e-05, -1.2714415788650513e-05, -1.189112663269043e-05, -1.1067837476730347e-05, -1.0244548320770264e-05, -9.42125916481018e-06, -8.597970008850098e-06, -7.774680852890015e-06, -6.951391696929932e-06, -6.128102540969849e-06, -5.304813385009766e-06, -4.481524229049683e-06, -3.6582350730895996e-06, -2.8349459171295166e-06, -2.0116567611694336e-06, -1.1883676052093506e-06, -3.650784492492676e-07, 4.5821070671081543e-07, 1.2814998626708984e-06, 2.1047890186309814e-06, 2.9280781745910645e-06, 3.7513673305511475e-06, 4.5746564865112305e-06, 5.3979456424713135e-06, 6.2212347984313965e-06, 7.0445239543914795e-06, 7.867813110351562e-06, 8.691102266311646e-06, 9.514391422271729e-06, 1.0337680578231812e-05, 1.1160969734191895e-05, 1.1984258890151978e-05, 1.280754804611206e-05, 1.3630837202072144e-05, 1.4454126358032227e-05, 1.527741551399231e-05, 1.6100704669952393e-05, 1.6923993825912476e-05, 1.774728298187256e-05, 1.857057213783264e-05, 1.9393861293792725e-05, 2.0217150449752808e-05, 2.104043960571289e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 5.0, 6.0, 7.0, 11.0, 22.0, 17.0, 38.0, 53.0, 71.0, 127.0, 229.0, 334.0, 572.0, 1160.0, 2622.0, 6130.0, 17579.0, 65156.0, 461409.0, 402836.0, 61971.0, 17118.0, 6008.0, 2496.0, 1136.0, 550.0, 306.0, 196.0, 146.0, 77.0, 45.0, 30.0, 26.0, 12.0, 21.0, 8.0, 11.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1439208984375, -0.13980674743652344, -0.13569259643554688, -0.1315784454345703, -0.12746429443359375, -0.12335014343261719, -0.11923599243164062, -0.11512184143066406, -0.1110076904296875, -0.10689353942871094, -0.10277938842773438, -0.09866523742675781, -0.09455108642578125, -0.09043693542480469, -0.08632278442382812, -0.08220863342285156, -0.078094482421875, -0.07398033142089844, -0.06986618041992188, -0.06575202941894531, -0.06163787841796875, -0.05752372741699219, -0.053409576416015625, -0.04929542541503906, -0.0451812744140625, -0.04106712341308594, -0.036952972412109375, -0.03283882141113281, -0.02872467041015625, -0.024610519409179688, -0.020496368408203125, -0.016382217407226562, -0.01226806640625, -0.008153915405273438, -0.004039764404296875, 7.43865966796875e-05, 0.00418853759765625, 0.008302688598632812, 0.012416839599609375, 0.016530990600585938, 0.0206451416015625, 0.024759292602539062, 0.028873443603515625, 0.03298759460449219, 0.03710174560546875, 0.04121589660644531, 0.045330047607421875, 0.04944419860839844, 0.053558349609375, 0.05767250061035156, 0.061786651611328125, 0.06590080261230469, 0.07001495361328125, 0.07412910461425781, 0.07824325561523438, 0.08235740661621094, 0.0864715576171875, 0.09058570861816406, 0.09469985961914062, 0.09881401062011719, 0.10292816162109375, 0.10704231262207031, 0.11115646362304688, 0.11527061462402344, 0.119384765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 8.0, 3.0, 7.0, 9.0, 11.0, 16.0, 10.0, 14.0, 18.0, 25.0, 27.0, 35.0, 48.0, 76.0, 139.0, 196.0, 94.0, 76.0, 35.0, 35.0, 19.0, 25.0, 20.0, 10.0, 8.0, 11.0, 6.0, 4.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05780029296875, -0.055675506591796875, -0.05355072021484375, -0.051425933837890625, -0.0493011474609375, -0.047176361083984375, -0.04505157470703125, -0.042926788330078125, -0.040802001953125, -0.038677215576171875, -0.03655242919921875, -0.034427642822265625, -0.0323028564453125, -0.030178070068359375, -0.02805328369140625, -0.025928497314453125, -0.0238037109375, -0.021678924560546875, -0.01955413818359375, -0.017429351806640625, -0.0153045654296875, -0.013179779052734375, -0.01105499267578125, -0.008930206298828125, -0.006805419921875, -0.004680633544921875, -0.00255584716796875, -0.000431060791015625, 0.0016937255859375, 0.003818511962890625, 0.00594329833984375, 0.008068084716796875, 0.01019287109375, 0.012317657470703125, 0.01444244384765625, 0.016567230224609375, 0.0186920166015625, 0.020816802978515625, 0.02294158935546875, 0.025066375732421875, 0.027191162109375, 0.029315948486328125, 0.03144073486328125, 0.033565521240234375, 0.0356903076171875, 0.037815093994140625, 0.03993988037109375, 0.042064666748046875, 0.044189453125, 0.046314239501953125, 0.04843902587890625, 0.050563812255859375, 0.0526885986328125, 0.054813385009765625, 0.05693817138671875, 0.059062957763671875, 0.061187744140625, 0.06331253051757812, 0.06543731689453125, 0.06756210327148438, 0.0696868896484375, 0.07181167602539062, 0.07393646240234375, 0.07606124877929688, 0.07818603515625]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 6.0, 11.0, 41.0, 72.0, 234.0, 335.0, 184.0, 55.0, 27.0, 22.0, 9.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8225148916244507, -1.7111507654190063, -1.599786639213562, -1.4884226322174072, -1.377058506011963, -1.2656943798065186, -1.1543302536010742, -1.0429661273956299, -0.9316020011901855, -0.8202378749847412, -0.7088737487792969, -0.5975096821784973, -0.486145555973053, -0.37478142976760864, -0.2634173631668091, -0.15205323696136475, -0.04068911075592041, 0.07067500054836273, 0.18203911185264587, 0.2934032082557678, 0.40476733446121216, 0.5161314606666565, 0.627495527267456, 0.7388596534729004, 0.8502237796783447, 0.9615879058837891, 1.0729520320892334, 1.1843161582946777, 1.295680284500122, 1.4070444107055664, 1.5184084177017212, 1.6297725439071655, 1.7411365509033203, 1.8525006771087646, 1.963864803314209, 2.0752289295196533, 2.1865930557250977, 2.297957181930542, 2.4093213081359863, 2.5206851959228516, 2.632049560546875, 2.7434136867523193, 2.8547778129577637, 2.966141939163208, 3.0775060653686523, 3.1888701915740967, 3.300234317779541, 3.4115982055664062, 3.5229623317718506, 3.634326457977295, 3.7456905841827393, 3.8570547103881836, 3.968418836593628, 4.079782962799072, 4.1911468505859375, 4.302511215209961, 4.413875102996826, 4.525238990783691, 4.636603355407715, 4.74796724319458, 4.8593316078186035, 4.970695495605469, 5.082059860229492, 5.193423748016357, 5.304788112640381]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 10.0, 10.0, 1.0, 9.0, 20.0, 17.0, 8.0, 24.0, 19.0, 29.0, 37.0, 30.0, 36.0, 29.0, 37.0, 39.0, 52.0, 56.0, 38.0, 56.0, 44.0, 46.0, 51.0, 31.0, 43.0, 27.0, 27.0, 22.0, 27.0, 19.0, 16.0, 19.0, 12.0, 18.0, 14.0, 11.0, 6.0, 6.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5644503831863403, -1.5151917934417725, -1.4659332036972046, -1.4166746139526367, -1.3674159049987793, -1.3181573152542114, -1.2688987255096436, -1.2196401357650757, -1.1703815460205078, -1.12112295627594, -1.071864366531372, -1.0226056575775146, -0.9733470678329468, -0.9240884780883789, -0.874829888343811, -0.8255712985992432, -0.7763125896453857, -0.7270539999008179, -0.6777953505516052, -0.6285367608070374, -0.5792781114578247, -0.5300195217132568, -0.48076093196868896, -0.4315023124217987, -0.38224369287490845, -0.3329850733280182, -0.28372645378112793, -0.23446786403656006, -0.1852092444896698, -0.13595062494277954, -0.08669203519821167, -0.03743341565132141, 0.011825084686279297, 0.06108369678258896, 0.11034230887889862, 0.15960091352462769, 0.20885953307151794, 0.2581181526184082, 0.3073767423629761, 0.35663536190986633, 0.4058939814567566, 0.45515260100364685, 0.5044112205505371, 0.553669810295105, 0.6029284000396729, 0.6521870493888855, 0.7014456391334534, 0.750704288482666, 0.7999628782272339, 0.8492214679718018, 0.8984801173210144, 0.9477387070655823, 0.9969973564147949, 1.0462559461593628, 1.0955145359039307, 1.1447731256484985, 1.1940317153930664, 1.2432903051376343, 1.2925488948822021, 1.3418076038360596, 1.3910661935806274, 1.4403247833251953, 1.4895833730697632, 1.538841962814331, 1.5881006717681885]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 9.0, 5.0, 8.0, 14.0, 21.0, 31.0, 41.0, 58.0, 90.0, 114.0, 181.0, 297.0, 562.0, 1007.0, 2047.0, 5116.0, 17855.0, 110753.0, 2679100.0, 1279506.0, 74409.0, 14292.0, 4563.0, 1954.0, 935.0, 490.0, 292.0, 179.0, 133.0, 71.0, 51.0, 32.0, 30.0, 13.0, 8.0, 8.0, 1.0, 7.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97900390625, -0.9501266479492188, -0.9212493896484375, -0.8923721313476562, -0.863494873046875, -0.8346176147460938, -0.8057403564453125, -0.7768630981445312, -0.74798583984375, -0.7191085815429688, -0.6902313232421875, -0.6613540649414062, -0.632476806640625, -0.6035995483398438, -0.5747222900390625, -0.5458450317382812, -0.5169677734375, -0.48809051513671875, -0.4592132568359375, -0.43033599853515625, -0.401458740234375, -0.37258148193359375, -0.3437042236328125, -0.31482696533203125, -0.28594970703125, -0.25707244873046875, -0.2281951904296875, -0.19931793212890625, -0.170440673828125, -0.14156341552734375, -0.1126861572265625, -0.08380889892578125, -0.054931640625, -0.02605438232421875, 0.0028228759765625, 0.03170013427734375, 0.060577392578125, 0.08945465087890625, 0.1183319091796875, 0.14720916748046875, 0.17608642578125, 0.20496368408203125, 0.2338409423828125, 0.26271820068359375, 0.291595458984375, 0.32047271728515625, 0.3493499755859375, 0.37822723388671875, 0.4071044921875, 0.43598175048828125, 0.4648590087890625, 0.49373626708984375, 0.522613525390625, 0.5514907836914062, 0.5803680419921875, 0.6092453002929688, 0.63812255859375, 0.6669998168945312, 0.6958770751953125, 0.7247543334960938, 0.753631591796875, 0.7825088500976562, 0.8113861083984375, 0.8402633666992188, 0.869140625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 10.0, 19.0, 20.0, 24.0, 35.0, 52.0, 56.0, 86.0, 70.0, 94.0, 76.0, 90.0, 74.0, 57.0, 54.0, 39.0, 37.0, 22.0, 16.0, 19.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81298828125, -0.7915878295898438, -0.7701873779296875, -0.7487869262695312, -0.727386474609375, -0.7059860229492188, -0.6845855712890625, -0.6631851196289062, -0.64178466796875, -0.6203842163085938, -0.5989837646484375, -0.5775833129882812, -0.556182861328125, -0.5347824096679688, -0.5133819580078125, -0.49198150634765625, -0.4705810546875, -0.44918060302734375, -0.4277801513671875, -0.40637969970703125, -0.384979248046875, -0.36357879638671875, -0.3421783447265625, -0.32077789306640625, -0.29937744140625, -0.27797698974609375, -0.2565765380859375, -0.23517608642578125, -0.213775634765625, -0.19237518310546875, -0.1709747314453125, -0.14957427978515625, -0.128173828125, -0.10677337646484375, -0.0853729248046875, -0.06397247314453125, -0.042572021484375, -0.02117156982421875, 0.0002288818359375, 0.02162933349609375, 0.04302978515625, 0.06443023681640625, 0.0858306884765625, 0.10723114013671875, 0.128631591796875, 0.15003204345703125, 0.1714324951171875, 0.19283294677734375, 0.2142333984375, 0.23563385009765625, 0.2570343017578125, 0.27843475341796875, 0.299835205078125, 0.32123565673828125, 0.3426361083984375, 0.36403656005859375, 0.38543701171875, 0.40683746337890625, 0.4282379150390625, 0.44963836669921875, 0.471038818359375, 0.49243927001953125, 0.5138397216796875, 0.5352401733398438, 0.556640625]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 6.0, 10.0, 5.0, 17.0, 18.0, 40.0, 76.0, 138.0, 236.0, 536.0, 1410.0, 4386.0, 21096.0, 233023.0, 3762302.0, 148513.0, 16556.0, 3725.0, 1209.0, 459.0, 217.0, 121.0, 60.0, 35.0, 22.0, 14.0, 14.0, 10.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95361328125, -0.9188461303710938, -0.8840789794921875, -0.8493118286132812, -0.814544677734375, -0.7797775268554688, -0.7450103759765625, -0.7102432250976562, -0.67547607421875, -0.6407089233398438, -0.6059417724609375, -0.5711746215820312, -0.536407470703125, -0.5016403198242188, -0.4668731689453125, -0.43210601806640625, -0.3973388671875, -0.36257171630859375, -0.3278045654296875, -0.29303741455078125, -0.258270263671875, -0.22350311279296875, -0.1887359619140625, -0.15396881103515625, -0.11920166015625, -0.08443450927734375, -0.0496673583984375, -0.01490020751953125, 0.019866943359375, 0.05463409423828125, 0.0894012451171875, 0.12416839599609375, 0.158935546875, 0.19370269775390625, 0.2284698486328125, 0.26323699951171875, 0.298004150390625, 0.33277130126953125, 0.3675384521484375, 0.40230560302734375, 0.43707275390625, 0.47183990478515625, 0.5066070556640625, 0.5413742065429688, 0.576141357421875, 0.6109085083007812, 0.6456756591796875, 0.6804428100585938, 0.7152099609375, 0.7499771118164062, 0.7847442626953125, 0.8195114135742188, 0.854278564453125, 0.8890457153320312, 0.9238128662109375, 0.9585800170898438, 0.99334716796875, 1.0281143188476562, 1.0628814697265625, 1.0976486206054688, 1.132415771484375, 1.1671829223632812, 1.2019500732421875, 1.2367172241210938, 1.271484375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 7.0, 7.0, 15.0, 11.0, 16.0, 20.0, 31.0, 51.0, 83.0, 94.0, 157.0, 269.0, 516.0, 935.0, 778.0, 435.0, 226.0, 139.0, 85.0, 53.0, 35.0, 29.0, 19.0, 13.0, 12.0, 9.0, 8.0, 8.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.276123046875, -0.2688312530517578, -0.2615394592285156, -0.25424766540527344, -0.24695587158203125, -0.23966407775878906, -0.23237228393554688, -0.2250804901123047, -0.2177886962890625, -0.2104969024658203, -0.20320510864257812, -0.19591331481933594, -0.18862152099609375, -0.18132972717285156, -0.17403793334960938, -0.1667461395263672, -0.159454345703125, -0.1521625518798828, -0.14487075805664062, -0.13757896423339844, -0.13028717041015625, -0.12299537658691406, -0.11570358276367188, -0.10841178894042969, -0.1011199951171875, -0.09382820129394531, -0.08653640747070312, -0.07924461364746094, -0.07195281982421875, -0.06466102600097656, -0.057369232177734375, -0.05007743835449219, -0.04278564453125, -0.03549385070800781, -0.028202056884765625, -0.020910263061523438, -0.01361846923828125, -0.0063266754150390625, 0.000965118408203125, 0.008256912231445312, 0.0155487060546875, 0.022840499877929688, 0.030132293701171875, 0.03742408752441406, 0.04471588134765625, 0.05200767517089844, 0.059299468994140625, 0.06659126281738281, 0.073883056640625, 0.08117485046386719, 0.08846664428710938, 0.09575843811035156, 0.10305023193359375, 0.11034202575683594, 0.11763381958007812, 0.12492561340332031, 0.1322174072265625, 0.1395092010498047, 0.14680099487304688, 0.15409278869628906, 0.16138458251953125, 0.16867637634277344, 0.17596817016601562, 0.1832599639892578, 0.1905517578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 10.0, 13.0, 15.0, 35.0, 56.0, 70.0, 94.0, 122.0, 126.0, 154.0, 89.0, 67.0, 49.0, 19.0, 22.0, 9.0, 12.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1374131441116333, -1.1022365093231201, -1.067059874534607, -1.0318832397460938, -0.9967066049575806, -0.9615299701690674, -0.9263532757759094, -0.8911766409873962, -0.8560000061988831, -0.8208233714103699, -0.7856467366218567, -0.7504701018333435, -0.7152934074401855, -0.6801167726516724, -0.6449401378631592, -0.609763503074646, -0.5745868682861328, -0.5394102334976196, -0.5042335987091064, -0.4690569341182709, -0.4338802993297577, -0.3987036645412445, -0.36352699995040894, -0.32835036516189575, -0.29317373037338257, -0.2579970955848694, -0.222820445895195, -0.18764379620552063, -0.15246716141700745, -0.11729052662849426, -0.08211387693881989, -0.04693722724914551, -0.011760711669921875, 0.023415930569171906, 0.058592572808265686, 0.09376921504735947, 0.12894585728645325, 0.16412249207496643, 0.1992991417646408, 0.23447579145431519, 0.26965242624282837, 0.30482906103134155, 0.34000569581985474, 0.3751823604106903, 0.4103589951992035, 0.4455356299877167, 0.48071229457855225, 0.5158889293670654, 0.5510655641555786, 0.5862421989440918, 0.621418833732605, 0.6565954685211182, 0.6917721033096313, 0.7269487380981445, 0.7621254324913025, 0.7973020672798157, 0.8324787020683289, 0.867655336856842, 0.9028319716453552, 0.9380086064338684, 0.9731853008270264, 1.0083619356155396, 1.0435385704040527, 1.078715205192566, 1.113891839981079]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 0.0, 4.0, 6.0, 3.0, 5.0, 9.0, 15.0, 8.0, 30.0, 16.0, 23.0, 39.0, 41.0, 49.0, 53.0, 55.0, 56.0, 51.0, 48.0, 67.0, 62.0, 52.0, 47.0, 47.0, 40.0, 40.0, 31.0, 20.0, 14.0, 13.0, 14.0, 8.0, 8.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6562923192977905, -0.6367194652557373, -0.6171466708183289, -0.5975738167762756, -0.5780009627342224, -0.558428168296814, -0.5388553142547607, -0.5192824602127075, -0.4997096359729767, -0.48013681173324585, -0.4605639576911926, -0.4409911334514618, -0.42141830921173096, -0.40184545516967773, -0.3822726309299469, -0.36269980669021606, -0.34312695264816284, -0.323554128408432, -0.3039812743663788, -0.28440845012664795, -0.2648355960845947, -0.2452627718448639, -0.22568994760513306, -0.20611710846424103, -0.186544269323349, -0.16697143018245697, -0.14739859104156494, -0.1278257668018341, -0.10825292766094208, -0.08868008852005005, -0.06910725682973862, -0.049534425139427185, -0.02996164560317993, -0.010388810187578201, 0.009184025228023529, 0.02875686064362526, 0.04832969605922699, 0.06790253520011902, 0.08747536689043045, 0.10704819858074188, 0.1266210377216339, 0.14619387686252594, 0.16576671600341797, 0.1853395402431488, 0.20491237938404083, 0.22448521852493286, 0.2440580427646637, 0.26363086700439453, 0.28320372104644775, 0.3027765452861786, 0.3223493993282318, 0.34192222356796265, 0.36149507761001587, 0.3810679018497467, 0.40064072608947754, 0.42021358013153076, 0.4397864043712616, 0.45935922861099243, 0.47893208265304565, 0.4985049068927765, 0.5180777311325073, 0.5376505851745605, 0.5572234392166138, 0.5767962336540222, 0.5963690876960754]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 13.0, 7.0, 26.0, 38.0, 57.0, 92.0, 152.0, 277.0, 446.0, 869.0, 1815.0, 3884.0, 10529.0, 37396.0, 227221.0, 595862.0, 130936.0, 24891.0, 7756.0, 3089.0, 1476.0, 733.0, 391.0, 226.0, 142.0, 78.0, 56.0, 27.0, 24.0, 13.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.149169921875, -0.14441299438476562, -0.13965606689453125, -0.13489913940429688, -0.1301422119140625, -0.12538528442382812, -0.12062835693359375, -0.11587142944335938, -0.111114501953125, -0.10635757446289062, -0.10160064697265625, -0.09684371948242188, -0.0920867919921875, -0.08732986450195312, -0.08257293701171875, -0.07781600952148438, -0.07305908203125, -0.06830215454101562, -0.06354522705078125, -0.058788299560546875, -0.0540313720703125, -0.049274444580078125, -0.04451751708984375, -0.039760589599609375, -0.035003662109375, -0.030246734619140625, -0.02548980712890625, -0.020732879638671875, -0.0159759521484375, -0.011219024658203125, -0.00646209716796875, -0.001705169677734375, 0.0030517578125, 0.007808685302734375, 0.01256561279296875, 0.017322540283203125, 0.0220794677734375, 0.026836395263671875, 0.03159332275390625, 0.036350250244140625, 0.041107177734375, 0.045864105224609375, 0.05062103271484375, 0.055377960205078125, 0.0601348876953125, 0.06489181518554688, 0.06964874267578125, 0.07440567016601562, 0.07916259765625, 0.08391952514648438, 0.08867645263671875, 0.09343338012695312, 0.0981903076171875, 0.10294723510742188, 0.10770416259765625, 0.11246109008789062, 0.117218017578125, 0.12197494506835938, 0.12673187255859375, 0.13148880004882812, 0.1362457275390625, 0.14100265502929688, 0.14575958251953125, 0.15051651000976562, 0.1552734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 11.0, 5.0, 7.0, 17.0, 25.0, 18.0, 25.0, 39.0, 34.0, 60.0, 60.0, 53.0, 54.0, 77.0, 65.0, 53.0, 70.0, 55.0, 53.0, 40.0, 30.0, 26.0, 20.0, 27.0, 9.0, 11.0, 7.0, 10.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.4892578125, -0.4752311706542969, -0.46120452880859375, -0.4471778869628906, -0.4331512451171875, -0.4191246032714844, -0.40509796142578125, -0.3910713195800781, -0.377044677734375, -0.3630180358886719, -0.34899139404296875, -0.3349647521972656, -0.3209381103515625, -0.3069114685058594, -0.29288482666015625, -0.2788581848144531, -0.26483154296875, -0.2508049011230469, -0.23677825927734375, -0.22275161743164062, -0.2087249755859375, -0.19469833374023438, -0.18067169189453125, -0.16664505004882812, -0.152618408203125, -0.13859176635742188, -0.12456512451171875, -0.11053848266601562, -0.0965118408203125, -0.08248519897460938, -0.06845855712890625, -0.054431915283203125, -0.0404052734375, -0.026378631591796875, -0.01235198974609375, 0.001674652099609375, 0.0157012939453125, 0.029727935791015625, 0.04375457763671875, 0.057781219482421875, 0.071807861328125, 0.08583450317382812, 0.09986114501953125, 0.11388778686523438, 0.1279144287109375, 0.14194107055664062, 0.15596771240234375, 0.16999435424804688, 0.18402099609375, 0.19804763793945312, 0.21207427978515625, 0.22610092163085938, 0.2401275634765625, 0.2541542053222656, 0.26818084716796875, 0.2822074890136719, 0.296234130859375, 0.3102607727050781, 0.32428741455078125, 0.3383140563964844, 0.3523406982421875, 0.3663673400878906, 0.38039398193359375, 0.3944206237792969, 0.408447265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 2.0, 6.0, 9.0, 8.0, 13.0, 22.0, 30.0, 43.0, 58.0, 83.0, 137.0, 179.0, 318.0, 534.0, 977.0, 1973.0, 4362.0, 12194.0, 49426.0, 335475.0, 527750.0, 86253.0, 17523.0, 5794.0, 2548.0, 1209.0, 651.0, 326.0, 225.0, 125.0, 91.0, 48.0, 35.0, 28.0, 21.0, 13.0, 15.0, 13.0, 5.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11346435546875, -0.10970211029052734, -0.10593986511230469, -0.10217761993408203, -0.09841537475585938, -0.09465312957763672, -0.09089088439941406, -0.0871286392211914, -0.08336639404296875, -0.0796041488647461, -0.07584190368652344, -0.07207965850830078, -0.06831741333007812, -0.06455516815185547, -0.06079292297363281, -0.057030677795410156, -0.0532684326171875, -0.049506187438964844, -0.04574394226074219, -0.04198169708251953, -0.038219451904296875, -0.03445720672607422, -0.030694961547851562, -0.026932716369628906, -0.02317047119140625, -0.019408226013183594, -0.015645980834960938, -0.011883735656738281, -0.008121490478515625, -0.004359245300292969, -0.0005970001220703125, 0.0031652450561523438, 0.006927490234375, 0.010689735412597656, 0.014451980590820312, 0.01821422576904297, 0.021976470947265625, 0.02573871612548828, 0.029500961303710938, 0.033263206481933594, 0.03702545166015625, 0.040787696838378906, 0.04454994201660156, 0.04831218719482422, 0.052074432373046875, 0.05583667755126953, 0.05959892272949219, 0.06336116790771484, 0.0671234130859375, 0.07088565826416016, 0.07464790344238281, 0.07841014862060547, 0.08217239379882812, 0.08593463897705078, 0.08969688415527344, 0.0934591293334961, 0.09722137451171875, 0.1009836196899414, 0.10474586486816406, 0.10850811004638672, 0.11227035522460938, 0.11603260040283203, 0.11979484558105469, 0.12355709075927734, 0.1273193359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 3.0, 7.0, 5.0, 11.0, 9.0, 14.0, 20.0, 26.0, 21.0, 18.0, 34.0, 38.0, 32.0, 39.0, 54.0, 38.0, 34.0, 36.0, 63.0, 47.0, 46.0, 42.0, 50.0, 47.0, 27.0, 49.0, 32.0, 28.0, 24.0, 15.0, 15.0, 20.0, 11.0, 11.0, 8.0, 9.0, 4.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7021484375, -0.67999267578125, -0.6578369140625, -0.63568115234375, -0.613525390625, -0.59136962890625, -0.5692138671875, -0.54705810546875, -0.52490234375, -0.50274658203125, -0.4805908203125, -0.45843505859375, -0.436279296875, -0.41412353515625, -0.3919677734375, -0.36981201171875, -0.34765625, -0.32550048828125, -0.3033447265625, -0.28118896484375, -0.259033203125, -0.23687744140625, -0.2147216796875, -0.19256591796875, -0.17041015625, -0.14825439453125, -0.1260986328125, -0.10394287109375, -0.081787109375, -0.05963134765625, -0.0374755859375, -0.01531982421875, 0.0068359375, 0.02899169921875, 0.0511474609375, 0.07330322265625, 0.095458984375, 0.11761474609375, 0.1397705078125, 0.16192626953125, 0.18408203125, 0.20623779296875, 0.2283935546875, 0.25054931640625, 0.272705078125, 0.29486083984375, 0.3170166015625, 0.33917236328125, 0.361328125, 0.38348388671875, 0.4056396484375, 0.42779541015625, 0.449951171875, 0.47210693359375, 0.4942626953125, 0.51641845703125, 0.53857421875, 0.56072998046875, 0.5828857421875, 0.60504150390625, 0.627197265625, 0.64935302734375, 0.6715087890625, 0.69366455078125, 0.7158203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 8.0, 16.0, 27.0, 34.0, 61.0, 84.0, 159.0, 281.0, 487.0, 902.0, 1824.0, 4378.0, 13170.0, 68243.0, 674378.0, 244558.0, 27140.0, 7315.0, 2745.0, 1283.0, 622.0, 359.0, 180.0, 90.0, 80.0, 39.0, 22.0, 18.0, 14.0, 8.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052215576171875, -0.05026388168334961, -0.04831218719482422, -0.04636049270629883, -0.04440879821777344, -0.04245710372924805, -0.040505409240722656, -0.038553714752197266, -0.036602020263671875, -0.034650325775146484, -0.032698631286621094, -0.030746936798095703, -0.028795242309570312, -0.026843547821044922, -0.02489185333251953, -0.02294015884399414, -0.02098846435546875, -0.01903676986694336, -0.01708507537841797, -0.015133380889892578, -0.013181686401367188, -0.011229991912841797, -0.009278297424316406, -0.007326602935791016, -0.005374908447265625, -0.0034232139587402344, -0.0014715194702148438, 0.0004801750183105469, 0.0024318695068359375, 0.004383563995361328, 0.006335258483886719, 0.00828695297241211, 0.0102386474609375, 0.01219034194946289, 0.014142036437988281, 0.016093730926513672, 0.018045425415039062, 0.019997119903564453, 0.021948814392089844, 0.023900508880615234, 0.025852203369140625, 0.027803897857666016, 0.029755592346191406, 0.0317072868347168, 0.03365898132324219, 0.03561067581176758, 0.03756237030029297, 0.03951406478881836, 0.04146575927734375, 0.04341745376586914, 0.04536914825439453, 0.04732084274291992, 0.04927253723144531, 0.0512242317199707, 0.053175926208496094, 0.055127620697021484, 0.057079315185546875, 0.059031009674072266, 0.060982704162597656, 0.06293439865112305, 0.06488609313964844, 0.06683778762817383, 0.06878948211669922, 0.07074117660522461, 0.07269287109375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 4.0, 8.0, 23.0, 26.0, 33.0, 67.0, 87.0, 132.0, 140.0, 143.0, 91.0, 75.0, 63.0, 32.0, 19.0, 10.0, 12.0, 8.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8908252716064453e-05, -2.793874591588974e-05, -2.6969239115715027e-05, -2.5999732315540314e-05, -2.50302255153656e-05, -2.4060718715190887e-05, -2.3091211915016174e-05, -2.212170511484146e-05, -2.1152198314666748e-05, -2.0182691514492035e-05, -1.9213184714317322e-05, -1.824367791414261e-05, -1.7274171113967896e-05, -1.6304664313793182e-05, -1.533515751361847e-05, -1.4365650713443756e-05, -1.3396143913269043e-05, -1.242663711309433e-05, -1.1457130312919617e-05, -1.0487623512744904e-05, -9.51811671257019e-06, -8.548609912395477e-06, -7.579103112220764e-06, -6.609596312046051e-06, -5.640089511871338e-06, -4.670582711696625e-06, -3.7010759115219116e-06, -2.7315691113471985e-06, -1.7620623111724854e-06, -7.925555109977722e-07, 1.7695128917694092e-07, 1.146458089351654e-06, 2.115964889526367e-06, 3.0854716897010803e-06, 4.0549784898757935e-06, 5.024485290050507e-06, 5.99399209022522e-06, 6.963498890399933e-06, 7.933005690574646e-06, 8.902512490749359e-06, 9.872019290924072e-06, 1.0841526091098785e-05, 1.1811032891273499e-05, 1.2780539691448212e-05, 1.3750046491622925e-05, 1.4719553291797638e-05, 1.568906009197235e-05, 1.6658566892147064e-05, 1.7628073692321777e-05, 1.859758049249649e-05, 1.9567087292671204e-05, 2.0536594092845917e-05, 2.150610089302063e-05, 2.2475607693195343e-05, 2.3445114493370056e-05, 2.441462129354477e-05, 2.5384128093719482e-05, 2.6353634893894196e-05, 2.732314169406891e-05, 2.8292648494243622e-05, 2.9262155294418335e-05, 3.0231662094593048e-05, 3.120116889476776e-05, 3.2170675694942474e-05, 3.314018249511719e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 4.0, 7.0, 10.0, 14.0, 17.0, 28.0, 37.0, 62.0, 108.0, 179.0, 283.0, 520.0, 883.0, 1633.0, 3183.0, 6679.0, 15945.0, 49617.0, 205785.0, 519836.0, 173309.0, 43443.0, 14443.0, 6126.0, 2796.0, 1601.0, 827.0, 442.0, 289.0, 163.0, 95.0, 61.0, 42.0, 24.0, 17.0, 11.0, 4.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.044891357421875, -0.0435490608215332, -0.042206764221191406, -0.04086446762084961, -0.03952217102050781, -0.038179874420166016, -0.03683757781982422, -0.03549528121948242, -0.034152984619140625, -0.03281068801879883, -0.03146839141845703, -0.030126094818115234, -0.028783798217773438, -0.02744150161743164, -0.026099205017089844, -0.024756908416748047, -0.02341461181640625, -0.022072315216064453, -0.020730018615722656, -0.01938772201538086, -0.018045425415039062, -0.016703128814697266, -0.015360832214355469, -0.014018535614013672, -0.012676239013671875, -0.011333942413330078, -0.009991645812988281, -0.008649349212646484, -0.0073070526123046875, -0.005964756011962891, -0.004622459411621094, -0.003280162811279297, -0.0019378662109375, -0.0005955696105957031, 0.0007467269897460938, 0.0020890235900878906, 0.0034313201904296875, 0.004773616790771484, 0.006115913391113281, 0.007458209991455078, 0.008800506591796875, 0.010142803192138672, 0.011485099792480469, 0.012827396392822266, 0.014169692993164062, 0.01551198959350586, 0.016854286193847656, 0.018196582794189453, 0.01953887939453125, 0.020881175994873047, 0.022223472595214844, 0.02356576919555664, 0.024908065795898438, 0.026250362396240234, 0.02759265899658203, 0.028934955596923828, 0.030277252197265625, 0.03161954879760742, 0.03296184539794922, 0.034304141998291016, 0.03564643859863281, 0.03698873519897461, 0.038331031799316406, 0.0396733283996582, 0.041015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 10.0, 16.0, 13.0, 16.0, 39.0, 34.0, 75.0, 81.0, 103.0, 110.0, 124.0, 91.0, 84.0, 46.0, 41.0, 32.0, 22.0, 12.0, 15.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.01465606689453125, -0.014222502708435059, -0.013788938522338867, -0.013355374336242676, -0.012921810150146484, -0.012488245964050293, -0.012054681777954102, -0.01162111759185791, -0.011187553405761719, -0.010753989219665527, -0.010320425033569336, -0.009886860847473145, -0.009453296661376953, -0.009019732475280762, -0.00858616828918457, -0.008152604103088379, -0.0077190399169921875, -0.007285475730895996, -0.006851911544799805, -0.006418347358703613, -0.005984783172607422, -0.0055512189865112305, -0.005117654800415039, -0.004684090614318848, -0.004250526428222656, -0.003816962242126465, -0.0033833980560302734, -0.002949833869934082, -0.0025162696838378906, -0.0020827054977416992, -0.0016491413116455078, -0.0012155771255493164, -0.000782012939453125, -0.0003484487533569336, 8.511543273925781e-05, 0.0005186796188354492, 0.0009522438049316406, 0.001385807991027832, 0.0018193721771240234, 0.002252936363220215, 0.0026865005493164062, 0.0031200647354125977, 0.003553628921508789, 0.0039871931076049805, 0.004420757293701172, 0.004854321479797363, 0.005287885665893555, 0.005721449851989746, 0.0061550140380859375, 0.006588578224182129, 0.00702214241027832, 0.007455706596374512, 0.007889270782470703, 0.008322834968566895, 0.008756399154663086, 0.009189963340759277, 0.009623527526855469, 0.01005709171295166, 0.010490655899047852, 0.010924220085144043, 0.011357784271240234, 0.011791348457336426, 0.012224912643432617, 0.012658476829528809, 0.013092041015625]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 5.0, 5.0, 11.0, 8.0, 17.0, 29.0, 52.0, 103.0, 116.0, 154.0, 170.0, 134.0, 68.0, 41.0, 30.0, 17.0, 8.0, 13.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8422192931175232, -0.8157488107681274, -0.7892783284187317, -0.7628079056739807, -0.736337423324585, -0.7098669409751892, -0.6833964586257935, -0.6569260358810425, -0.6304555535316467, -0.603985071182251, -0.5775145888328552, -0.5510441660881042, -0.5245736837387085, -0.49810320138931274, -0.471632719039917, -0.44516226649284363, -0.4186917841434479, -0.3922213017940521, -0.36575084924697876, -0.339280366897583, -0.31280991435050964, -0.2863394320011139, -0.2598689794540405, -0.23339849710464478, -0.20692802965641022, -0.18045756220817566, -0.1539870947599411, -0.12751662731170654, -0.10104615241289139, -0.07457567751407623, -0.048105210065841675, -0.021634742617607117, 0.004835724830627441, 0.031306192278862, 0.057776663452386856, 0.08424713462591171, 0.11071760207414627, 0.13718807697296143, 0.16365854442119598, 0.19012901186943054, 0.2165994793176651, 0.24306994676589966, 0.2695404291152954, 0.2960108816623688, 0.3224813640117645, 0.3489518165588379, 0.37542229890823364, 0.4018927812576294, 0.42836323380470276, 0.4548337161540985, 0.4813041687011719, 0.5077746510505676, 0.5342451333999634, 0.5607155561447144, 0.5871860384941101, 0.6136565208435059, 0.6401270031929016, 0.6665974855422974, 0.6930679678916931, 0.7195383906364441, 0.7460088729858398, 0.7724793553352356, 0.7989498376846313, 0.8254202604293823, 0.8518907427787781]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 8.0, 11.0, 9.0, 11.0, 25.0, 22.0, 28.0, 46.0, 51.0, 51.0, 59.0, 63.0, 69.0, 58.0, 74.0, 60.0, 57.0, 51.0, 40.0, 51.0, 32.0, 22.0, 18.0, 13.0, 9.0, 14.0, 7.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.46091294288635254, -0.4472023546695709, -0.4334917664527893, -0.4197811484336853, -0.4060705602169037, -0.39235997200012207, -0.37864935398101807, -0.36493876576423645, -0.35122817754745483, -0.3375175893306732, -0.3238070011138916, -0.3100963830947876, -0.296385794878006, -0.28267520666122437, -0.26896458864212036, -0.25525400042533875, -0.24154341220855713, -0.2278328239917755, -0.2141222208738327, -0.2004116177558899, -0.18670102953910828, -0.17299044132232666, -0.15927983820438385, -0.14556923508644104, -0.13185864686965942, -0.11814805120229721, -0.104437455534935, -0.09072685986757278, -0.07701626420021057, -0.06330566853284836, -0.049595072865486145, -0.03588447719812393, -0.02217385172843933, -0.008463256061077118, 0.005247339606285095, 0.01895793527364731, 0.03266853094100952, 0.046379126608371735, 0.06008972227573395, 0.07380031794309616, 0.08751091361045837, 0.10122150927782059, 0.1149321049451828, 0.1286427080631256, 0.14235329627990723, 0.15606388449668884, 0.16977448761463165, 0.18348509073257446, 0.19719567894935608, 0.2109062671661377, 0.2246168702840805, 0.23832747340202332, 0.25203806161880493, 0.26574864983558655, 0.27945923805236816, 0.29316985607147217, 0.3068804442882538, 0.3205910325050354, 0.3343016505241394, 0.348012238740921, 0.36172282695770264, 0.37543341517448425, 0.38914400339126587, 0.4028546214103699, 0.4165652096271515]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 14.0, 19.0, 30.0, 36.0, 49.0, 80.0, 120.0, 234.0, 370.0, 550.0, 1023.0, 2198.0, 4654.0, 11256.0, 34352.0, 182632.0, 691985.0, 83027.0, 21245.0, 7713.0, 3280.0, 1572.0, 856.0, 494.0, 286.0, 167.0, 89.0, 69.0, 44.0, 38.0, 16.0, 15.0, 8.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49169921875, -0.47599029541015625, -0.4602813720703125, -0.44457244873046875, -0.428863525390625, -0.41315460205078125, -0.3974456787109375, -0.38173675537109375, -0.36602783203125, -0.35031890869140625, -0.3346099853515625, -0.31890106201171875, -0.303192138671875, -0.28748321533203125, -0.2717742919921875, -0.25606536865234375, -0.2403564453125, -0.22464752197265625, -0.2089385986328125, -0.19322967529296875, -0.177520751953125, -0.16181182861328125, -0.1461029052734375, -0.13039398193359375, -0.11468505859375, -0.09897613525390625, -0.0832672119140625, -0.06755828857421875, -0.051849365234375, -0.03614044189453125, -0.0204315185546875, -0.00472259521484375, 0.010986328125, 0.02669525146484375, 0.0424041748046875, 0.05811309814453125, 0.073822021484375, 0.08953094482421875, 0.1052398681640625, 0.12094879150390625, 0.13665771484375, 0.15236663818359375, 0.1680755615234375, 0.18378448486328125, 0.199493408203125, 0.21520233154296875, 0.2309112548828125, 0.24662017822265625, 0.2623291015625, 0.27803802490234375, 0.2937469482421875, 0.30945587158203125, 0.325164794921875, 0.34087371826171875, 0.3565826416015625, 0.37229156494140625, 0.38800048828125, 0.40370941162109375, 0.4194183349609375, 0.43512725830078125, 0.450836181640625, 0.46654510498046875, 0.4822540283203125, 0.49796295166015625, 0.513671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 10.0, 5.0, 6.0, 8.0, 10.0, 13.0, 22.0, 33.0, 31.0, 48.0, 58.0, 67.0, 62.0, 62.0, 75.0, 72.0, 67.0, 62.0, 55.0, 44.0, 38.0, 30.0, 25.0, 26.0, 14.0, 11.0, 11.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.0439453125, -1.0154342651367188, -0.9869232177734375, -0.9584121704101562, -0.929901123046875, -0.9013900756835938, -0.8728790283203125, -0.8443679809570312, -0.81585693359375, -0.7873458862304688, -0.7588348388671875, -0.7303237915039062, -0.701812744140625, -0.6733016967773438, -0.6447906494140625, -0.6162796020507812, -0.5877685546875, -0.5592575073242188, -0.5307464599609375, -0.5022354125976562, -0.473724365234375, -0.44521331787109375, -0.4167022705078125, -0.38819122314453125, -0.35968017578125, -0.33116912841796875, -0.3026580810546875, -0.27414703369140625, -0.245635986328125, -0.21712493896484375, -0.1886138916015625, -0.16010284423828125, -0.131591796875, -0.10308074951171875, -0.0745697021484375, -0.04605865478515625, -0.017547607421875, 0.01096343994140625, 0.0394744873046875, 0.06798553466796875, 0.09649658203125, 0.12500762939453125, 0.1535186767578125, 0.18202972412109375, 0.210540771484375, 0.23905181884765625, 0.2675628662109375, 0.29607391357421875, 0.3245849609375, 0.35309600830078125, 0.3816070556640625, 0.41011810302734375, 0.438629150390625, 0.46714019775390625, 0.4956512451171875, 0.5241622924804688, 0.55267333984375, 0.5811843872070312, 0.6096954345703125, 0.6382064819335938, 0.666717529296875, 0.6952285766601562, 0.7237396240234375, 0.7522506713867188, 0.78076171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 6.0, 2.0, 5.0, 4.0, 9.0, 13.0, 10.0, 7.0, 20.0, 27.0, 26.0, 47.0, 68.0, 103.0, 169.0, 297.0, 842.0, 2658.0, 12897.0, 116771.0, 855813.0, 48432.0, 7455.0, 1672.0, 528.0, 259.0, 116.0, 67.0, 59.0, 43.0, 35.0, 24.0, 16.0, 7.0, 11.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7109375, -0.6866989135742188, -0.6624603271484375, -0.6382217407226562, -0.613983154296875, -0.5897445678710938, -0.5655059814453125, -0.5412673950195312, -0.51702880859375, -0.49279022216796875, -0.4685516357421875, -0.44431304931640625, -0.420074462890625, -0.39583587646484375, -0.3715972900390625, -0.34735870361328125, -0.3231201171875, -0.29888153076171875, -0.2746429443359375, -0.25040435791015625, -0.226165771484375, -0.20192718505859375, -0.1776885986328125, -0.15345001220703125, -0.12921142578125, -0.10497283935546875, -0.0807342529296875, -0.05649566650390625, -0.032257080078125, -0.00801849365234375, 0.0162200927734375, 0.04045867919921875, 0.064697265625, 0.08893585205078125, 0.1131744384765625, 0.13741302490234375, 0.161651611328125, 0.18589019775390625, 0.2101287841796875, 0.23436737060546875, 0.25860595703125, 0.28284454345703125, 0.3070831298828125, 0.33132171630859375, 0.355560302734375, 0.37979888916015625, 0.4040374755859375, 0.42827606201171875, 0.4525146484375, 0.47675323486328125, 0.5009918212890625, 0.5252304077148438, 0.549468994140625, 0.5737075805664062, 0.5979461669921875, 0.6221847534179688, 0.64642333984375, 0.6706619262695312, 0.6949005126953125, 0.7191390991210938, 0.743377685546875, 0.7676162719726562, 0.7918548583984375, 0.8160934448242188, 0.84033203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 5.0, 10.0, 8.0, 3.0, 7.0, 13.0, 19.0, 25.0, 22.0, 26.0, 33.0, 39.0, 64.0, 57.0, 74.0, 54.0, 69.0, 53.0, 51.0, 72.0, 41.0, 42.0, 33.0, 31.0, 30.0, 24.0, 21.0, 18.0, 18.0, 14.0, 9.0, 4.0, 4.0, 6.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.9958343505859375, -0.962371826171875, -0.9289093017578125, -0.89544677734375, -0.8619842529296875, -0.828521728515625, -0.7950592041015625, -0.7615966796875, -0.7281341552734375, -0.694671630859375, -0.6612091064453125, -0.62774658203125, -0.5942840576171875, -0.560821533203125, -0.5273590087890625, -0.493896484375, -0.4604339599609375, -0.426971435546875, -0.3935089111328125, -0.36004638671875, -0.3265838623046875, -0.293121337890625, -0.2596588134765625, -0.2261962890625, -0.1927337646484375, -0.159271240234375, -0.1258087158203125, -0.09234619140625, -0.0588836669921875, -0.025421142578125, 0.0080413818359375, 0.04150390625, 0.0749664306640625, 0.108428955078125, 0.1418914794921875, 0.17535400390625, 0.2088165283203125, 0.242279052734375, 0.2757415771484375, 0.3092041015625, 0.3426666259765625, 0.376129150390625, 0.4095916748046875, 0.44305419921875, 0.4765167236328125, 0.509979248046875, 0.5434417724609375, 0.576904296875, 0.6103668212890625, 0.643829345703125, 0.6772918701171875, 0.71075439453125, 0.7442169189453125, 0.777679443359375, 0.8111419677734375, 0.8446044921875, 0.8780670166015625, 0.911529541015625, 0.9449920654296875, 0.97845458984375, 1.0119171142578125, 1.045379638671875, 1.0788421630859375, 1.1123046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 6.0, 7.0, 9.0, 12.0, 16.0, 28.0, 39.0, 89.0, 192.0, 412.0, 983.0, 3357.0, 17940.0, 244841.0, 743217.0, 30346.0, 4762.0, 1314.0, 514.0, 217.0, 119.0, 62.0, 29.0, 19.0, 7.0, 4.0, 7.0, 1.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.364990234375, -0.3561134338378906, -0.34723663330078125, -0.3383598327636719, -0.3294830322265625, -0.3206062316894531, -0.31172943115234375, -0.3028526306152344, -0.293975830078125, -0.2850990295410156, -0.27622222900390625, -0.2673454284667969, -0.2584686279296875, -0.24959182739257812, -0.24071502685546875, -0.23183822631835938, -0.22296142578125, -0.21408462524414062, -0.20520782470703125, -0.19633102416992188, -0.1874542236328125, -0.17857742309570312, -0.16970062255859375, -0.16082382202148438, -0.151947021484375, -0.14307022094726562, -0.13419342041015625, -0.12531661987304688, -0.1164398193359375, -0.10756301879882812, -0.09868621826171875, -0.08980941772460938, -0.0809326171875, -0.07205581665039062, -0.06317901611328125, -0.054302215576171875, -0.0454254150390625, -0.036548614501953125, -0.02767181396484375, -0.018795013427734375, -0.009918212890625, -0.001041412353515625, 0.00783538818359375, 0.016712188720703125, 0.0255889892578125, 0.034465789794921875, 0.04334259033203125, 0.052219390869140625, 0.06109619140625, 0.06997299194335938, 0.07884979248046875, 0.08772659301757812, 0.0966033935546875, 0.10548019409179688, 0.11435699462890625, 0.12323379516601562, 0.132110595703125, 0.14098739624023438, 0.14986419677734375, 0.15874099731445312, 0.1676177978515625, 0.17649459838867188, 0.18537139892578125, 0.19424819946289062, 0.203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 6.0, 3.0, 7.0, 5.0, 9.0, 17.0, 24.0, 24.0, 17.0, 30.0, 43.0, 71.0, 100.0, 244.0, 154.0, 69.0, 48.0, 36.0, 24.0, 17.0, 14.0, 5.0, 11.0, 6.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.205371856689453e-05, -2.1224841475486755e-05, -2.039596438407898e-05, -1.9567087292671204e-05, -1.8738210201263428e-05, -1.7909333109855652e-05, -1.7080456018447876e-05, -1.62515789270401e-05, -1.5422701835632324e-05, -1.4593824744224548e-05, -1.3764947652816772e-05, -1.2936070561408997e-05, -1.210719347000122e-05, -1.1278316378593445e-05, -1.0449439287185669e-05, -9.620562195777893e-06, -8.791685104370117e-06, -7.962808012962341e-06, -7.1339309215545654e-06, -6.3050538301467896e-06, -5.476176738739014e-06, -4.647299647331238e-06, -3.818422555923462e-06, -2.989545464515686e-06, -2.16066837310791e-06, -1.3317912817001343e-06, -5.029141902923584e-07, 3.259629011154175e-07, 1.1548399925231934e-06, 1.9837170839309692e-06, 2.812594175338745e-06, 3.641471266746521e-06, 4.470348358154297e-06, 5.299225449562073e-06, 6.128102540969849e-06, 6.9569796323776245e-06, 7.7858567237854e-06, 8.614733815193176e-06, 9.443610906600952e-06, 1.0272487998008728e-05, 1.1101365089416504e-05, 1.193024218082428e-05, 1.2759119272232056e-05, 1.3587996363639832e-05, 1.4416873455047607e-05, 1.5245750546455383e-05, 1.607462763786316e-05, 1.6903504729270935e-05, 1.773238182067871e-05, 1.8561258912086487e-05, 1.9390136003494263e-05, 2.021901309490204e-05, 2.1047890186309814e-05, 2.187676727771759e-05, 2.2705644369125366e-05, 2.3534521460533142e-05, 2.4363398551940918e-05, 2.5192275643348694e-05, 2.602115273475647e-05, 2.6850029826164246e-05, 2.767890691757202e-05, 2.8507784008979797e-05, 2.9336661100387573e-05, 3.016553819179535e-05, 3.0994415283203125e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 8.0, 8.0, 17.0, 23.0, 33.0, 31.0, 82.0, 155.0, 292.0, 843.0, 2644.0, 12747.0, 93399.0, 844149.0, 79115.0, 11246.0, 2440.0, 743.0, 276.0, 125.0, 69.0, 34.0, 24.0, 13.0, 14.0, 9.0, 3.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2293701171875, -0.2213115692138672, -0.21325302124023438, -0.20519447326660156, -0.19713592529296875, -0.18907737731933594, -0.18101882934570312, -0.1729602813720703, -0.1649017333984375, -0.1568431854248047, -0.14878463745117188, -0.14072608947753906, -0.13266754150390625, -0.12460899353027344, -0.11655044555664062, -0.10849189758300781, -0.100433349609375, -0.09237480163574219, -0.08431625366210938, -0.07625770568847656, -0.06819915771484375, -0.06014060974121094, -0.052082061767578125, -0.04402351379394531, -0.0359649658203125, -0.027906417846679688, -0.019847869873046875, -0.011789321899414062, -0.00373077392578125, 0.0043277740478515625, 0.012386322021484375, 0.020444869995117188, 0.02850341796875, 0.03656196594238281, 0.044620513916015625, 0.05267906188964844, 0.06073760986328125, 0.06879615783691406, 0.07685470581054688, 0.08491325378417969, 0.0929718017578125, 0.10103034973144531, 0.10908889770507812, 0.11714744567871094, 0.12520599365234375, 0.13326454162597656, 0.14132308959960938, 0.1493816375732422, 0.157440185546875, 0.1654987335205078, 0.17355728149414062, 0.18161582946777344, 0.18967437744140625, 0.19773292541503906, 0.20579147338867188, 0.2138500213623047, 0.2219085693359375, 0.2299671173095703, 0.23802566528320312, 0.24608421325683594, 0.25414276123046875, 0.26220130920410156, 0.2702598571777344, 0.2783184051513672, 0.286376953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 9.0, 13.0, 18.0, 38.0, 44.0, 73.0, 125.0, 310.0, 130.0, 71.0, 50.0, 25.0, 28.0, 19.0, 14.0, 5.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1536865234375, -0.15006542205810547, -0.14644432067871094, -0.1428232192993164, -0.13920211791992188, -0.13558101654052734, -0.1319599151611328, -0.12833881378173828, -0.12471771240234375, -0.12109661102294922, -0.11747550964355469, -0.11385440826416016, -0.11023330688476562, -0.1066122055053711, -0.10299110412597656, -0.09937000274658203, -0.0957489013671875, -0.09212779998779297, -0.08850669860839844, -0.0848855972290039, -0.08126449584960938, -0.07764339447021484, -0.07402229309082031, -0.07040119171142578, -0.06678009033203125, -0.06315898895263672, -0.05953788757324219, -0.055916786193847656, -0.052295684814453125, -0.048674583435058594, -0.04505348205566406, -0.04143238067626953, -0.037811279296875, -0.03419017791748047, -0.030569076538085938, -0.026947975158691406, -0.023326873779296875, -0.019705772399902344, -0.016084671020507812, -0.012463569641113281, -0.00884246826171875, -0.005221366882324219, -0.0016002655029296875, 0.0020208358764648438, 0.005641937255859375, 0.009263038635253906, 0.012884140014648438, 0.01650524139404297, 0.0201263427734375, 0.02374744415283203, 0.027368545532226562, 0.030989646911621094, 0.034610748291015625, 0.038231849670410156, 0.04185295104980469, 0.04547405242919922, 0.04909515380859375, 0.05271625518798828, 0.05633735656738281, 0.059958457946777344, 0.06357955932617188, 0.0672006607055664, 0.07082176208496094, 0.07444286346435547, 0.07806396484375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 6.0, 12.0, 41.0, 66.0, 178.0, 274.0, 231.0, 99.0, 48.0, 20.0, 11.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9080429077148438, -1.8107364177703857, -1.7134299278259277, -1.6161233186721802, -1.5188168287277222, -1.4215103387832642, -1.3242037296295166, -1.2268972396850586, -1.1295907497406006, -1.0322842597961426, -0.9349777102470398, -0.837671160697937, -0.740364670753479, -0.643058180809021, -0.5457516312599182, -0.44844508171081543, -0.3511385917663574, -0.253832072019577, -0.15652555227279663, -0.059219032526016235, 0.03808748722076416, 0.13539400696754456, 0.23270052671432495, 0.33000707626342773, 0.42731356620788574, 0.5246200561523438, 0.6219266057014465, 0.7192331552505493, 0.8165396451950073, 0.9138461351394653, 1.011152744293213, 1.108459234237671, 1.205765724182129, 1.303072214126587, 1.400378704071045, 1.4976853132247925, 1.5949918031692505, 1.6922982931137085, 1.789604902267456, 1.886911392211914, 1.984217882156372, 2.08152437210083, 2.178830862045288, 2.276137351989746, 2.373444080352783, 2.470750570297241, 2.568057060241699, 2.6653635501861572, 2.7626700401306152, 2.8599765300750732, 2.9572830200195312, 3.0545895099639893, 3.1518959999084473, 3.2492027282714844, 3.3465092182159424, 3.4438157081604004, 3.5411221981048584, 3.6384286880493164, 3.7357351779937744, 3.8330416679382324, 3.9303483963012695, 4.027654647827148, 4.1249613761901855, 4.222268104553223, 4.319574356079102]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 3.0, 11.0, 13.0, 9.0, 17.0, 24.0, 26.0, 24.0, 27.0, 26.0, 31.0, 22.0, 27.0, 46.0, 41.0, 38.0, 49.0, 42.0, 53.0, 40.0, 42.0, 38.0, 38.0, 28.0, 30.0, 31.0, 33.0, 31.0, 25.0, 23.0, 11.0, 20.0, 13.0, 10.0, 6.0, 12.0, 5.0, 5.0, 8.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.432656168937683, -1.3903820514678955, -1.3481080532073975, -1.3058339357376099, -1.2635598182678223, -1.2212857007980347, -1.1790117025375366, -1.136737585067749, -1.0944634675979614, -1.0521893501281738, -1.0099153518676758, -0.9676412343978882, -0.9253671169281006, -0.8830930590629578, -0.8408190011978149, -0.7985448837280273, -0.7562708258628845, -0.7139967679977417, -0.6717226505279541, -0.6294485926628113, -0.5871744751930237, -0.5449004173278809, -0.5026262998580933, -0.46035224199295044, -0.41807815432548523, -0.37580406665802, -0.3335299789905548, -0.2912558913230896, -0.24898181855678558, -0.20670773088932037, -0.16443365812301636, -0.12215957045555115, -0.07988548278808594, -0.037611398845911026, 0.0046626850962638855, 0.0469367653131485, 0.08921085298061371, 0.13148494064807892, 0.17375901341438293, 0.21603310108184814, 0.25830718874931335, 0.30058127641677856, 0.3428553640842438, 0.385129451751709, 0.4274035096168518, 0.4696776270866394, 0.5119516849517822, 0.5542258024215698, 0.5964998602867126, 0.6387739181518555, 0.6810480356216431, 0.7233220934867859, 0.7655962109565735, 0.8078702688217163, 0.8501443862915039, 0.8924184441566467, 0.9346925020217896, 0.9769665598869324, 1.0192406177520752, 1.0615147352218628, 1.1037888526916504, 1.146062970161438, 1.188336968421936, 1.2306110858917236, 1.2728852033615112]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 12.0, 9.0, 17.0, 16.0, 20.0, 28.0, 24.0, 39.0, 28.0, 63.0, 96.0, 148.0, 255.0, 526.0, 1259.0, 3691.0, 17035.0, 258304.0, 3776173.0, 118716.0, 12451.0, 3065.0, 1128.0, 446.0, 233.0, 128.0, 73.0, 50.0, 46.0, 28.0, 18.0, 18.0, 23.0, 16.0, 16.0, 8.0, 13.0, 7.0, 9.0, 6.0, 5.0, 8.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.1279296875, -1.0882110595703125, -1.048492431640625, -1.0087738037109375, -0.96905517578125, -0.9293365478515625, -0.889617919921875, -0.8498992919921875, -0.8101806640625, -0.7704620361328125, -0.730743408203125, -0.6910247802734375, -0.65130615234375, -0.6115875244140625, -0.571868896484375, -0.5321502685546875, -0.492431640625, -0.4527130126953125, -0.412994384765625, -0.3732757568359375, -0.33355712890625, -0.2938385009765625, -0.254119873046875, -0.2144012451171875, -0.1746826171875, -0.1349639892578125, -0.095245361328125, -0.0555267333984375, -0.01580810546875, 0.0239105224609375, 0.063629150390625, 0.1033477783203125, 0.14306640625, 0.1827850341796875, 0.222503662109375, 0.2622222900390625, 0.30194091796875, 0.3416595458984375, 0.381378173828125, 0.4210968017578125, 0.4608154296875, 0.5005340576171875, 0.540252685546875, 0.5799713134765625, 0.61968994140625, 0.6594085693359375, 0.699127197265625, 0.7388458251953125, 0.778564453125, 0.8182830810546875, 0.858001708984375, 0.8977203369140625, 0.93743896484375, 0.9771575927734375, 1.016876220703125, 1.0565948486328125, 1.0963134765625, 1.1360321044921875, 1.175750732421875, 1.2154693603515625, 1.25518798828125, 1.2949066162109375, 1.334625244140625, 1.3743438720703125, 1.4140625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 6.0, 4.0, 3.0, 4.0, 6.0, 10.0, 11.0, 22.0, 27.0, 34.0, 45.0, 71.0, 62.0, 85.0, 76.0, 79.0, 81.0, 71.0, 65.0, 67.0, 38.0, 31.0, 31.0, 20.0, 17.0, 12.0, 4.0, 8.0, 5.0, 0.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65771484375, -0.6391677856445312, -0.6206207275390625, -0.6020736694335938, -0.583526611328125, -0.5649795532226562, -0.5464324951171875, -0.5278854370117188, -0.50933837890625, -0.49079132080078125, -0.4722442626953125, -0.45369720458984375, -0.435150146484375, -0.41660308837890625, -0.3980560302734375, -0.37950897216796875, -0.3609619140625, -0.34241485595703125, -0.3238677978515625, -0.30532073974609375, -0.286773681640625, -0.26822662353515625, -0.2496795654296875, -0.23113250732421875, -0.21258544921875, -0.19403839111328125, -0.1754913330078125, -0.15694427490234375, -0.138397216796875, -0.11985015869140625, -0.1013031005859375, -0.08275604248046875, -0.064208984375, -0.04566192626953125, -0.0271148681640625, -0.00856781005859375, 0.009979248046875, 0.02852630615234375, 0.0470733642578125, 0.06562042236328125, 0.08416748046875, 0.10271453857421875, 0.1212615966796875, 0.13980865478515625, 0.158355712890625, 0.17690277099609375, 0.1954498291015625, 0.21399688720703125, 0.2325439453125, 0.25109100341796875, 0.2696380615234375, 0.28818511962890625, 0.306732177734375, 0.32527923583984375, 0.3438262939453125, 0.36237335205078125, 0.38092041015625, 0.39946746826171875, 0.4180145263671875, 0.43656158447265625, 0.455108642578125, 0.47365570068359375, 0.4922027587890625, 0.5107498168945312, 0.529296875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 9.0, 10.0, 6.0, 7.0, 16.0, 20.0, 33.0, 44.0, 110.0, 160.0, 358.0, 787.0, 1937.0, 6799.0, 36900.0, 800895.0, 3259619.0, 71206.0, 10588.0, 2797.0, 1047.0, 431.0, 213.0, 95.0, 66.0, 43.0, 27.0, 17.0, 5.0, 7.0, 5.0, 3.0, 4.0, 8.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.99951171875, -0.9626998901367188, -0.9258880615234375, -0.8890762329101562, -0.852264404296875, -0.8154525756835938, -0.7786407470703125, -0.7418289184570312, -0.70501708984375, -0.6682052612304688, -0.6313934326171875, -0.5945816040039062, -0.557769775390625, -0.5209579467773438, -0.4841461181640625, -0.44733428955078125, -0.4105224609375, -0.37371063232421875, -0.3368988037109375, -0.30008697509765625, -0.263275146484375, -0.22646331787109375, -0.1896514892578125, -0.15283966064453125, -0.11602783203125, -0.07921600341796875, -0.0424041748046875, -0.00559234619140625, 0.031219482421875, 0.06803131103515625, 0.1048431396484375, 0.14165496826171875, 0.178466796875, 0.21527862548828125, 0.2520904541015625, 0.28890228271484375, 0.325714111328125, 0.36252593994140625, 0.3993377685546875, 0.43614959716796875, 0.47296142578125, 0.5097732543945312, 0.5465850830078125, 0.5833969116210938, 0.620208740234375, 0.6570205688476562, 0.6938323974609375, 0.7306442260742188, 0.7674560546875, 0.8042678833007812, 0.8410797119140625, 0.8778915405273438, 0.914703369140625, 0.9515151977539062, 0.9883270263671875, 1.0251388549804688, 1.06195068359375, 1.0987625122070312, 1.1355743408203125, 1.1723861694335938, 1.209197998046875, 1.2460098266601562, 1.2828216552734375, 1.3196334838867188, 1.3564453125]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 15.0, 17.0, 26.0, 22.0, 41.0, 63.0, 82.0, 138.0, 219.0, 430.0, 681.0, 915.0, 541.0, 318.0, 192.0, 99.0, 68.0, 49.0, 27.0, 33.0, 26.0, 12.0, 9.0, 7.0, 4.0, 6.0, 4.0, 6.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.260498046875, -0.25310516357421875, -0.2457122802734375, -0.23831939697265625, -0.230926513671875, -0.22353363037109375, -0.2161407470703125, -0.20874786376953125, -0.20135498046875, -0.19396209716796875, -0.1865692138671875, -0.17917633056640625, -0.171783447265625, -0.16439056396484375, -0.1569976806640625, -0.14960479736328125, -0.1422119140625, -0.13481903076171875, -0.1274261474609375, -0.12003326416015625, -0.112640380859375, -0.10524749755859375, -0.0978546142578125, -0.09046173095703125, -0.08306884765625, -0.07567596435546875, -0.0682830810546875, -0.06089019775390625, -0.053497314453125, -0.04610443115234375, -0.0387115478515625, -0.03131866455078125, -0.02392578125, -0.01653289794921875, -0.0091400146484375, -0.00174713134765625, 0.005645751953125, 0.01303863525390625, 0.0204315185546875, 0.02782440185546875, 0.03521728515625, 0.04261016845703125, 0.0500030517578125, 0.05739593505859375, 0.064788818359375, 0.07218170166015625, 0.0795745849609375, 0.08696746826171875, 0.0943603515625, 0.10175323486328125, 0.1091461181640625, 0.11653900146484375, 0.123931884765625, 0.13132476806640625, 0.1387176513671875, 0.14611053466796875, 0.15350341796875, 0.16089630126953125, 0.1682891845703125, 0.17568206787109375, 0.183074951171875, 0.19046783447265625, 0.1978607177734375, 0.20525360107421875, 0.212646484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 9.0, 12.0, 18.0, 44.0, 59.0, 84.0, 115.0, 133.0, 130.0, 147.0, 86.0, 58.0, 38.0, 23.0, 14.0, 11.0, 5.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3423888683319092, -1.3028398752212524, -1.2632908821105957, -1.223741888999939, -1.1841928958892822, -1.144644021987915, -1.1050950288772583, -1.0655460357666016, -1.0259970426559448, -0.9864480495452881, -0.9468990564346313, -0.9073501229286194, -0.8678011298179626, -0.8282521367073059, -0.788703203201294, -0.7491542100906372, -0.7096052169799805, -0.6700562238693237, -0.630507230758667, -0.590958297252655, -0.5514093041419983, -0.5118603110313416, -0.4723113477230072, -0.43276238441467285, -0.3932133913040161, -0.3536643981933594, -0.314115434885025, -0.2745664715766907, -0.23501747846603394, -0.1954685002565384, -0.15591952204704285, -0.1163705587387085, -0.07682168483734131, -0.037272706627845764, 0.0022762715816497803, 0.041825249791145325, 0.08137422800064087, 0.12092320621013641, 0.16047218441963196, 0.2000211477279663, 0.23957014083862305, 0.2791191339492798, 0.31866809725761414, 0.3582170605659485, 0.3977660536766052, 0.43731504678726196, 0.4768640100955963, 0.5164129734039307, 0.5559619665145874, 0.5955109596252441, 0.6350599527359009, 0.6746088862419128, 0.7141578793525696, 0.7537068724632263, 0.7932558059692383, 0.832804799079895, 0.8723537921905518, 0.9119027853012085, 0.9514517784118652, 0.9910007119178772, 1.0305497646331787, 1.070098638534546, 1.1096476316452026, 1.1491966247558594, 1.1887456178665161]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 9.0, 9.0, 17.0, 15.0, 19.0, 23.0, 25.0, 29.0, 39.0, 47.0, 53.0, 44.0, 48.0, 50.0, 55.0, 49.0, 59.0, 52.0, 49.0, 42.0, 41.0, 35.0, 29.0, 36.0, 30.0, 20.0, 8.0, 17.0, 6.0, 5.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0], "bins": [-0.699561357498169, -0.6815537810325623, -0.6635462045669556, -0.6455386281013489, -0.6275310516357422, -0.6095234751701355, -0.5915158987045288, -0.5735083222389221, -0.5555007457733154, -0.5374931693077087, -0.519485592842102, -0.5014780163764954, -0.48347043991088867, -0.465462863445282, -0.4474552869796753, -0.4294477105140686, -0.4114401340484619, -0.3934325575828552, -0.37542498111724854, -0.35741740465164185, -0.33940982818603516, -0.32140225172042847, -0.3033946752548218, -0.2853870987892151, -0.2673795223236084, -0.2493719458580017, -0.23136436939239502, -0.21335679292678833, -0.19534921646118164, -0.17734163999557495, -0.15933406352996826, -0.14132648706436157, -0.12331891059875488, -0.1053113341331482, -0.0873037576675415, -0.06929618120193481, -0.051288604736328125, -0.033281028270721436, -0.015273451805114746, 0.0027341246604919434, 0.020741701126098633, 0.03874927759170532, 0.05675685405731201, 0.0747644305229187, 0.09277200698852539, 0.11077958345413208, 0.12878715991973877, 0.14679473638534546, 0.16480231285095215, 0.18280988931655884, 0.20081746578216553, 0.21882504224777222, 0.2368326187133789, 0.2548401951789856, 0.2728477716445923, 0.290855348110199, 0.30886292457580566, 0.32687050104141235, 0.34487807750701904, 0.36288565397262573, 0.3808932304382324, 0.3989008069038391, 0.4169083833694458, 0.4349159598350525, 0.4529235363006592]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 10.0, 3.0, 13.0, 30.0, 33.0, 56.0, 91.0, 138.0, 285.0, 539.0, 1072.0, 2534.0, 6547.0, 21749.0, 145047.0, 731776.0, 109819.0, 18615.0, 5676.0, 2320.0, 1028.0, 541.0, 277.0, 151.0, 74.0, 50.0, 29.0, 19.0, 16.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.324462890625, -0.31555938720703125, -0.3066558837890625, -0.29775238037109375, -0.288848876953125, -0.27994537353515625, -0.2710418701171875, -0.26213836669921875, -0.25323486328125, -0.24433135986328125, -0.2354278564453125, -0.22652435302734375, -0.217620849609375, -0.20871734619140625, -0.1998138427734375, -0.19091033935546875, -0.1820068359375, -0.17310333251953125, -0.1641998291015625, -0.15529632568359375, -0.146392822265625, -0.13748931884765625, -0.1285858154296875, -0.11968231201171875, -0.11077880859375, -0.10187530517578125, -0.0929718017578125, -0.08406829833984375, -0.075164794921875, -0.06626129150390625, -0.0573577880859375, -0.04845428466796875, -0.03955078125, -0.03064727783203125, -0.0217437744140625, -0.01284027099609375, -0.003936767578125, 0.00496673583984375, 0.0138702392578125, 0.02277374267578125, 0.03167724609375, 0.04058074951171875, 0.0494842529296875, 0.05838775634765625, 0.067291259765625, 0.07619476318359375, 0.0850982666015625, 0.09400177001953125, 0.1029052734375, 0.11180877685546875, 0.1207122802734375, 0.12961578369140625, 0.138519287109375, 0.14742279052734375, 0.1563262939453125, 0.16522979736328125, 0.17413330078125, 0.18303680419921875, 0.1919403076171875, 0.20084381103515625, 0.209747314453125, 0.21865081787109375, 0.2275543212890625, 0.23645782470703125, 0.245361328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 2.0, 6.0, 8.0, 13.0, 14.0, 23.0, 19.0, 25.0, 40.0, 65.0, 65.0, 85.0, 85.0, 87.0, 96.0, 80.0, 64.0, 63.0, 55.0, 31.0, 26.0, 15.0, 12.0, 8.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5655593872070312, -0.5442047119140625, -0.5228500366210938, -0.501495361328125, -0.48014068603515625, -0.4587860107421875, -0.43743133544921875, -0.41607666015625, -0.39472198486328125, -0.3733673095703125, -0.35201263427734375, -0.330657958984375, -0.30930328369140625, -0.2879486083984375, -0.26659393310546875, -0.2452392578125, -0.22388458251953125, -0.2025299072265625, -0.18117523193359375, -0.159820556640625, -0.13846588134765625, -0.1171112060546875, -0.09575653076171875, -0.07440185546875, -0.05304718017578125, -0.0316925048828125, -0.01033782958984375, 0.011016845703125, 0.03237152099609375, 0.0537261962890625, 0.07508087158203125, 0.096435546875, 0.11779022216796875, 0.1391448974609375, 0.16049957275390625, 0.181854248046875, 0.20320892333984375, 0.2245635986328125, 0.24591827392578125, 0.26727294921875, 0.28862762451171875, 0.3099822998046875, 0.33133697509765625, 0.352691650390625, 0.37404632568359375, 0.3954010009765625, 0.41675567626953125, 0.4381103515625, 0.45946502685546875, 0.4808197021484375, 0.5021743774414062, 0.523529052734375, 0.5448837280273438, 0.5662384033203125, 0.5875930786132812, 0.60894775390625, 0.6303024291992188, 0.6516571044921875, 0.6730117797851562, 0.694366455078125, 0.7157211303710938, 0.7370758056640625, 0.7584304809570312, 0.77978515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 11.0, 10.0, 11.0, 10.0, 23.0, 30.0, 41.0, 54.0, 75.0, 124.0, 217.0, 363.0, 699.0, 1319.0, 2925.0, 7724.0, 27698.0, 183299.0, 674710.0, 117790.0, 20165.0, 6220.0, 2493.0, 1092.0, 563.0, 312.0, 204.0, 123.0, 74.0, 51.0, 33.0, 19.0, 10.0, 15.0, 16.0, 7.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.20166015625, -0.1957988739013672, -0.18993759155273438, -0.18407630920410156, -0.17821502685546875, -0.17235374450683594, -0.16649246215820312, -0.1606311798095703, -0.1547698974609375, -0.1489086151123047, -0.14304733276367188, -0.13718605041503906, -0.13132476806640625, -0.12546348571777344, -0.11960220336914062, -0.11374092102050781, -0.107879638671875, -0.10201835632324219, -0.09615707397460938, -0.09029579162597656, -0.08443450927734375, -0.07857322692871094, -0.07271194458007812, -0.06685066223144531, -0.0609893798828125, -0.05512809753417969, -0.049266815185546875, -0.04340553283691406, -0.03754425048828125, -0.03168296813964844, -0.025821685791015625, -0.019960403442382812, -0.01409912109375, -0.008237838745117188, -0.002376556396484375, 0.0034847259521484375, 0.00934600830078125, 0.015207290649414062, 0.021068572998046875, 0.026929855346679688, 0.0327911376953125, 0.03865242004394531, 0.044513702392578125, 0.05037498474121094, 0.05623626708984375, 0.06209754943847656, 0.06795883178710938, 0.07382011413574219, 0.079681396484375, 0.08554267883300781, 0.09140396118164062, 0.09726524353027344, 0.10312652587890625, 0.10898780822753906, 0.11484909057617188, 0.12071037292480469, 0.1265716552734375, 0.1324329376220703, 0.13829421997070312, 0.14415550231933594, 0.15001678466796875, 0.15587806701660156, 0.16173934936523438, 0.1676006317138672, 0.1734619140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 7.0, 10.0, 5.0, 6.0, 18.0, 6.0, 16.0, 23.0, 22.0, 32.0, 37.0, 38.0, 38.0, 37.0, 38.0, 35.0, 37.0, 39.0, 58.0, 42.0, 54.0, 38.0, 46.0, 38.0, 37.0, 28.0, 21.0, 24.0, 22.0, 19.0, 19.0, 24.0, 12.0, 13.0, 11.0, 9.0, 11.0, 8.0, 4.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0], "bins": [-0.8173828125, -0.7937469482421875, -0.770111083984375, -0.7464752197265625, -0.72283935546875, -0.6992034912109375, -0.675567626953125, -0.6519317626953125, -0.6282958984375, -0.6046600341796875, -0.581024169921875, -0.5573883056640625, -0.53375244140625, -0.5101165771484375, -0.486480712890625, -0.4628448486328125, -0.439208984375, -0.4155731201171875, -0.391937255859375, -0.3683013916015625, -0.34466552734375, -0.3210296630859375, -0.297393798828125, -0.2737579345703125, -0.2501220703125, -0.2264862060546875, -0.202850341796875, -0.1792144775390625, -0.15557861328125, -0.1319427490234375, -0.108306884765625, -0.0846710205078125, -0.06103515625, -0.0373992919921875, -0.013763427734375, 0.0098724365234375, 0.03350830078125, 0.0571441650390625, 0.080780029296875, 0.1044158935546875, 0.1280517578125, 0.1516876220703125, 0.175323486328125, 0.1989593505859375, 0.22259521484375, 0.2462310791015625, 0.269866943359375, 0.2935028076171875, 0.317138671875, 0.3407745361328125, 0.364410400390625, 0.3880462646484375, 0.41168212890625, 0.4353179931640625, 0.458953857421875, 0.4825897216796875, 0.5062255859375, 0.5298614501953125, 0.553497314453125, 0.5771331787109375, 0.60076904296875, 0.6244049072265625, 0.648040771484375, 0.6716766357421875, 0.6953125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 6.0, 4.0, 1.0, 7.0, 10.0, 12.0, 16.0, 30.0, 51.0, 71.0, 137.0, 207.0, 314.0, 605.0, 1021.0, 2104.0, 4828.0, 13218.0, 52068.0, 452573.0, 447059.0, 51740.0, 13221.0, 4611.0, 2141.0, 1044.0, 604.0, 318.0, 191.0, 125.0, 58.0, 46.0, 23.0, 29.0, 18.0, 12.0, 11.0, 5.0, 3.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.09124755859375, -0.08884620666503906, -0.08644485473632812, -0.08404350280761719, -0.08164215087890625, -0.07924079895019531, -0.07683944702148438, -0.07443809509277344, -0.0720367431640625, -0.06963539123535156, -0.06723403930664062, -0.06483268737792969, -0.06243133544921875, -0.06002998352050781, -0.057628631591796875, -0.05522727966308594, -0.052825927734375, -0.05042457580566406, -0.048023223876953125, -0.04562187194824219, -0.04322052001953125, -0.04081916809082031, -0.038417816162109375, -0.03601646423339844, -0.0336151123046875, -0.031213760375976562, -0.028812408447265625, -0.026411056518554688, -0.02400970458984375, -0.021608352661132812, -0.019207000732421875, -0.016805648803710938, -0.014404296875, -0.012002944946289062, -0.009601593017578125, -0.0072002410888671875, -0.00479888916015625, -0.0023975372314453125, 3.814697265625e-06, 0.0024051666259765625, 0.0048065185546875, 0.0072078704833984375, 0.009609222412109375, 0.012010574340820312, 0.01441192626953125, 0.016813278198242188, 0.019214630126953125, 0.021615982055664062, 0.024017333984375, 0.026418685913085938, 0.028820037841796875, 0.031221389770507812, 0.03362274169921875, 0.03602409362792969, 0.038425445556640625, 0.04082679748535156, 0.0432281494140625, 0.04562950134277344, 0.048030853271484375, 0.05043220520019531, 0.05283355712890625, 0.05523490905761719, 0.057636260986328125, 0.06003761291503906, 0.06243896484375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 12.0, 6.0, 6.0, 10.0, 26.0, 25.0, 33.0, 56.0, 73.0, 87.0, 120.0, 118.0, 111.0, 76.0, 57.0, 43.0, 28.0, 19.0, 19.0, 6.0, 14.0, 10.0, 6.0, 5.0, 9.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.0219554901123047e-05, -2.925284206867218e-05, -2.8286129236221313e-05, -2.7319416403770447e-05, -2.635270357131958e-05, -2.5385990738868713e-05, -2.4419277906417847e-05, -2.345256507396698e-05, -2.2485852241516113e-05, -2.1519139409065247e-05, -2.055242657661438e-05, -1.9585713744163513e-05, -1.8619000911712646e-05, -1.765228807926178e-05, -1.6685575246810913e-05, -1.5718862414360046e-05, -1.475214958190918e-05, -1.3785436749458313e-05, -1.2818723917007446e-05, -1.185201108455658e-05, -1.0885298252105713e-05, -9.918585419654846e-06, -8.95187258720398e-06, -7.985159754753113e-06, -7.018446922302246e-06, -6.051734089851379e-06, -5.085021257400513e-06, -4.118308424949646e-06, -3.1515955924987793e-06, -2.1848827600479126e-06, -1.218169927597046e-06, -2.514570951461792e-07, 7.152557373046875e-07, 1.6819685697555542e-06, 2.648681402206421e-06, 3.6153942346572876e-06, 4.582107067108154e-06, 5.548819899559021e-06, 6.515532732009888e-06, 7.482245564460754e-06, 8.448958396911621e-06, 9.415671229362488e-06, 1.0382384061813354e-05, 1.1349096894264221e-05, 1.2315809726715088e-05, 1.3282522559165955e-05, 1.4249235391616821e-05, 1.5215948224067688e-05, 1.6182661056518555e-05, 1.714937388896942e-05, 1.8116086721420288e-05, 1.9082799553871155e-05, 2.004951238632202e-05, 2.1016225218772888e-05, 2.1982938051223755e-05, 2.294965088367462e-05, 2.3916363716125488e-05, 2.4883076548576355e-05, 2.584978938102722e-05, 2.681650221347809e-05, 2.7783215045928955e-05, 2.8749927878379822e-05, 2.971664071083069e-05, 3.0683353543281555e-05, 3.165006637573242e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 12.0, 17.0, 22.0, 45.0, 67.0, 114.0, 188.0, 355.0, 620.0, 1326.0, 2692.0, 6732.0, 20408.0, 84564.0, 552210.0, 304032.0, 51647.0, 14273.0, 4979.0, 2048.0, 971.0, 513.0, 250.0, 174.0, 96.0, 71.0, 32.0, 25.0, 14.0, 11.0, 12.0, 10.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0802001953125, -0.0776815414428711, -0.07516288757324219, -0.07264423370361328, -0.07012557983398438, -0.06760692596435547, -0.06508827209472656, -0.06256961822509766, -0.06005096435546875, -0.057532310485839844, -0.05501365661621094, -0.05249500274658203, -0.049976348876953125, -0.04745769500732422, -0.04493904113769531, -0.042420387268066406, -0.0399017333984375, -0.037383079528808594, -0.03486442565917969, -0.03234577178955078, -0.029827117919921875, -0.02730846405029297, -0.024789810180664062, -0.022271156311035156, -0.01975250244140625, -0.017233848571777344, -0.014715194702148438, -0.012196540832519531, -0.009677886962890625, -0.007159233093261719, -0.0046405792236328125, -0.0021219253540039062, 0.000396728515625, 0.0029153823852539062, 0.0054340362548828125, 0.007952690124511719, 0.010471343994140625, 0.012989997863769531, 0.015508651733398438, 0.018027305603027344, 0.02054595947265625, 0.023064613342285156, 0.025583267211914062, 0.02810192108154297, 0.030620574951171875, 0.03313922882080078, 0.03565788269042969, 0.038176536560058594, 0.0406951904296875, 0.043213844299316406, 0.04573249816894531, 0.04825115203857422, 0.050769805908203125, 0.05328845977783203, 0.05580711364746094, 0.058325767517089844, 0.06084442138671875, 0.06336307525634766, 0.06588172912597656, 0.06840038299560547, 0.07091903686523438, 0.07343769073486328, 0.07595634460449219, 0.0784749984741211, 0.08099365234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 10.0, 10.0, 8.0, 10.0, 13.0, 15.0, 20.0, 25.0, 29.0, 44.0, 57.0, 77.0, 107.0, 184.0, 113.0, 69.0, 38.0, 40.0, 30.0, 27.0, 19.0, 15.0, 12.0, 8.0, 5.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021881103515625, -0.021160125732421875, -0.02043914794921875, -0.019718170166015625, -0.0189971923828125, -0.018276214599609375, -0.01755523681640625, -0.016834259033203125, -0.01611328125, -0.015392303466796875, -0.01467132568359375, -0.013950347900390625, -0.0132293701171875, -0.012508392333984375, -0.01178741455078125, -0.011066436767578125, -0.010345458984375, -0.009624481201171875, -0.00890350341796875, -0.008182525634765625, -0.0074615478515625, -0.006740570068359375, -0.00601959228515625, -0.005298614501953125, -0.00457763671875, -0.003856658935546875, -0.00313568115234375, -0.002414703369140625, -0.0016937255859375, -0.000972747802734375, -0.00025177001953125, 0.000469207763671875, 0.001190185546875, 0.001911163330078125, 0.00263214111328125, 0.003353118896484375, 0.0040740966796875, 0.004795074462890625, 0.00551605224609375, 0.006237030029296875, 0.0069580078125, 0.007678985595703125, 0.00839996337890625, 0.009120941162109375, 0.0098419189453125, 0.010562896728515625, 0.01128387451171875, 0.012004852294921875, 0.012725830078125, 0.013446807861328125, 0.01416778564453125, 0.014888763427734375, 0.0156097412109375, 0.016330718994140625, 0.01705169677734375, 0.017772674560546875, 0.01849365234375, 0.019214630126953125, 0.01993560791015625, 0.020656585693359375, 0.0213775634765625, 0.022098541259765625, 0.02281951904296875, 0.023540496826171875, 0.024261474609375]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 11.0, 43.0, 80.0, 132.0, 198.0, 225.0, 137.0, 85.0, 41.0, 19.0, 12.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5845848321914673, -1.5428975820541382, -1.5012104511260986, -1.4595232009887695, -1.4178359508514404, -1.3761487007141113, -1.3344614505767822, -1.2927743196487427, -1.2510870695114136, -1.2093998193740845, -1.167712688446045, -1.1260254383087158, -1.0843381881713867, -1.0426509380340576, -1.0009636878967285, -0.959276556968689, -0.9175893068313599, -0.8759020566940308, -0.8342148661613464, -0.7925276756286621, -0.750840425491333, -0.7091531753540039, -0.6674659848213196, -0.6257787942886353, -0.5840915441513062, -0.542404294013977, -0.5007171034812927, -0.459029883146286, -0.4173426628112793, -0.3756554424762726, -0.33396822214126587, -0.29228100180625916, -0.2505936622619629, -0.20890644192695618, -0.16721922159194946, -0.12553200125694275, -0.08384478092193604, -0.04215756058692932, -0.0004703402519226074, 0.041216880083084106, 0.08290410041809082, 0.12459132075309753, 0.16627854108810425, 0.20796576142311096, 0.24965298175811768, 0.2913402020931244, 0.3330274224281311, 0.3747146427631378, 0.41640186309814453, 0.45808908343315125, 0.49977630376815796, 0.5414634943008423, 0.5831507444381714, 0.6248379945755005, 0.6665251851081848, 0.7082123756408691, 0.7498996257781982, 0.7915868759155273, 0.8332740664482117, 0.874961256980896, 0.9166485071182251, 0.9583357572555542, 1.0000228881835938, 1.0417101383209229, 1.083397388458252]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 6.0, 10.0, 14.0, 31.0, 22.0, 36.0, 48.0, 75.0, 85.0, 85.0, 68.0, 89.0, 86.0, 80.0, 59.0, 53.0, 51.0, 35.0, 21.0, 15.0, 6.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48361650109291077, -0.46334394812583923, -0.4430713951587677, -0.42279884219169617, -0.40252628922462463, -0.3822537362575531, -0.36198121309280396, -0.3417086601257324, -0.3214361071586609, -0.30116355419158936, -0.2808910012245178, -0.2606184482574463, -0.24034589529037476, -0.22007334232330322, -0.19980080425739288, -0.17952825129032135, -0.15925568342208862, -0.1389831304550171, -0.11871057748794556, -0.09843803197145462, -0.07816547900438309, -0.057892926037311554, -0.03762038052082062, -0.017347827553749084, 0.0029247254133224487, 0.023197276517748833, 0.04346982762217522, 0.06374237686395645, 0.08401492983102798, 0.10428748279809952, 0.12456002831459045, 0.144832581281662, 0.16510510444641113, 0.18537765741348267, 0.2056502103805542, 0.22592276334762573, 0.24619531631469727, 0.2664678692817688, 0.28674042224884033, 0.30701297521591187, 0.3272855281829834, 0.34755808115005493, 0.36783063411712646, 0.388103187084198, 0.40837574005126953, 0.42864829301834106, 0.4489208459854126, 0.46919339895248413, 0.4894659221172333, 0.5097384452819824, 0.530010998249054, 0.5502835512161255, 0.570556104183197, 0.5908286571502686, 0.6111012101173401, 0.6313737630844116, 0.6516463160514832, 0.6719188690185547, 0.6921914219856262, 0.7124639749526978, 0.7327365279197693, 0.7530090808868408, 0.7732816338539124, 0.7935541868209839, 0.8138267397880554]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 13.0, 13.0, 26.0, 35.0, 48.0, 113.0, 157.0, 203.0, 374.0, 678.0, 1351.0, 2752.0, 6377.0, 16769.0, 59002.0, 308447.0, 519136.0, 93464.0, 23871.0, 8508.0, 3586.0, 1652.0, 846.0, 429.0, 244.0, 172.0, 99.0, 47.0, 49.0, 33.0, 13.0, 11.0, 10.0, 5.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.417724609375, -0.4043159484863281, -0.39090728759765625, -0.3774986267089844, -0.3640899658203125, -0.3506813049316406, -0.33727264404296875, -0.3238639831542969, -0.310455322265625, -0.2970466613769531, -0.28363800048828125, -0.2702293395996094, -0.2568206787109375, -0.24341201782226562, -0.23000335693359375, -0.21659469604492188, -0.20318603515625, -0.18977737426757812, -0.17636871337890625, -0.16296005249023438, -0.1495513916015625, -0.13614273071289062, -0.12273406982421875, -0.10932540893554688, -0.095916748046875, -0.08250808715820312, -0.06909942626953125, -0.055690765380859375, -0.0422821044921875, -0.028873443603515625, -0.01546478271484375, -0.002056121826171875, 0.0113525390625, 0.024761199951171875, 0.03816986083984375, 0.051578521728515625, 0.0649871826171875, 0.07839584350585938, 0.09180450439453125, 0.10521316528320312, 0.118621826171875, 0.13203048706054688, 0.14543914794921875, 0.15884780883789062, 0.1722564697265625, 0.18566513061523438, 0.19907379150390625, 0.21248245239257812, 0.22589111328125, 0.23929977416992188, 0.25270843505859375, 0.2661170959472656, 0.2795257568359375, 0.2929344177246094, 0.30634307861328125, 0.3197517395019531, 0.333160400390625, 0.3465690612792969, 0.35997772216796875, 0.3733863830566406, 0.3867950439453125, 0.4002037048339844, 0.41361236572265625, 0.4270210266113281, 0.4404296875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 6.0, 10.0, 9.0, 14.0, 16.0, 28.0, 30.0, 33.0, 51.0, 71.0, 62.0, 65.0, 72.0, 72.0, 75.0, 75.0, 62.0, 51.0, 39.0, 36.0, 34.0, 29.0, 18.0, 15.0, 7.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9755859375, -0.94219970703125, -0.9088134765625, -0.87542724609375, -0.842041015625, -0.80865478515625, -0.7752685546875, -0.74188232421875, -0.70849609375, -0.67510986328125, -0.6417236328125, -0.60833740234375, -0.574951171875, -0.54156494140625, -0.5081787109375, -0.47479248046875, -0.44140625, -0.40802001953125, -0.3746337890625, -0.34124755859375, -0.307861328125, -0.27447509765625, -0.2410888671875, -0.20770263671875, -0.17431640625, -0.14093017578125, -0.1075439453125, -0.07415771484375, -0.040771484375, -0.00738525390625, 0.0260009765625, 0.05938720703125, 0.0927734375, 0.12615966796875, 0.1595458984375, 0.19293212890625, 0.226318359375, 0.25970458984375, 0.2930908203125, 0.32647705078125, 0.35986328125, 0.39324951171875, 0.4266357421875, 0.46002197265625, 0.493408203125, 0.52679443359375, 0.5601806640625, 0.59356689453125, 0.626953125, 0.66033935546875, 0.6937255859375, 0.72711181640625, 0.760498046875, 0.79388427734375, 0.8272705078125, 0.86065673828125, 0.89404296875, 0.92742919921875, 0.9608154296875, 0.99420166015625, 1.027587890625, 1.06097412109375, 1.0943603515625, 1.12774658203125, 1.1611328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 6.0, 6.0, 7.0, 9.0, 18.0, 17.0, 14.0, 31.0, 35.0, 49.0, 51.0, 86.0, 132.0, 211.0, 668.0, 4867.0, 443277.0, 592278.0, 5349.0, 713.0, 241.0, 151.0, 90.0, 58.0, 35.0, 29.0, 27.0, 18.0, 19.0, 14.0, 15.0, 9.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.958984375, -1.90606689453125, -1.8531494140625, -1.80023193359375, -1.747314453125, -1.69439697265625, -1.6414794921875, -1.58856201171875, -1.53564453125, -1.48272705078125, -1.4298095703125, -1.37689208984375, -1.323974609375, -1.27105712890625, -1.2181396484375, -1.16522216796875, -1.1123046875, -1.05938720703125, -1.0064697265625, -0.95355224609375, -0.900634765625, -0.84771728515625, -0.7947998046875, -0.74188232421875, -0.68896484375, -0.63604736328125, -0.5831298828125, -0.53021240234375, -0.477294921875, -0.42437744140625, -0.3714599609375, -0.31854248046875, -0.265625, -0.21270751953125, -0.1597900390625, -0.10687255859375, -0.053955078125, -0.00103759765625, 0.0518798828125, 0.10479736328125, 0.15771484375, 0.21063232421875, 0.2635498046875, 0.31646728515625, 0.369384765625, 0.42230224609375, 0.4752197265625, 0.52813720703125, 0.5810546875, 0.63397216796875, 0.6868896484375, 0.73980712890625, 0.792724609375, 0.84564208984375, 0.8985595703125, 0.95147705078125, 1.00439453125, 1.05731201171875, 1.1102294921875, 1.16314697265625, 1.216064453125, 1.26898193359375, 1.3218994140625, 1.37481689453125, 1.427734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 5.0, 9.0, 12.0, 15.0, 11.0, 15.0, 21.0, 18.0, 33.0, 36.0, 37.0, 43.0, 57.0, 45.0, 55.0, 46.0, 68.0, 41.0, 56.0, 54.0, 50.0, 39.0, 39.0, 20.0, 37.0, 26.0, 17.0, 15.0, 19.0, 12.0, 12.0, 10.0, 5.0, 6.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0234375, -0.9918289184570312, -0.9602203369140625, -0.9286117553710938, -0.897003173828125, -0.8653945922851562, -0.8337860107421875, -0.8021774291992188, -0.77056884765625, -0.7389602661132812, -0.7073516845703125, -0.6757431030273438, -0.644134521484375, -0.6125259399414062, -0.5809173583984375, -0.5493087768554688, -0.5177001953125, -0.48609161376953125, -0.4544830322265625, -0.42287445068359375, -0.391265869140625, -0.35965728759765625, -0.3280487060546875, -0.29644012451171875, -0.26483154296875, -0.23322296142578125, -0.2016143798828125, -0.17000579833984375, -0.138397216796875, -0.10678863525390625, -0.0751800537109375, -0.04357147216796875, -0.011962890625, 0.01964569091796875, 0.0512542724609375, 0.08286285400390625, 0.114471435546875, 0.14608001708984375, 0.1776885986328125, 0.20929718017578125, 0.24090576171875, 0.27251434326171875, 0.3041229248046875, 0.33573150634765625, 0.367340087890625, 0.39894866943359375, 0.4305572509765625, 0.46216583251953125, 0.4937744140625, 0.5253829956054688, 0.5569915771484375, 0.5886001586914062, 0.620208740234375, 0.6518173217773438, 0.6834259033203125, 0.7150344848632812, 0.74664306640625, 0.7782516479492188, 0.8098602294921875, 0.8414688110351562, 0.873077392578125, 0.9046859741210938, 0.9362945556640625, 0.9679031372070312, 0.99951171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 5.0, 14.0, 24.0, 42.0, 68.0, 153.0, 392.0, 1190.0, 10626.0, 667221.0, 359542.0, 7528.0, 1068.0, 371.0, 136.0, 71.0, 34.0, 19.0, 13.0, 6.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35693359375, -0.34539794921875, -0.3338623046875, -0.32232666015625, -0.310791015625, -0.29925537109375, -0.2877197265625, -0.27618408203125, -0.2646484375, -0.25311279296875, -0.2415771484375, -0.23004150390625, -0.218505859375, -0.20697021484375, -0.1954345703125, -0.18389892578125, -0.17236328125, -0.16082763671875, -0.1492919921875, -0.13775634765625, -0.126220703125, -0.11468505859375, -0.1031494140625, -0.09161376953125, -0.080078125, -0.06854248046875, -0.0570068359375, -0.04547119140625, -0.033935546875, -0.02239990234375, -0.0108642578125, 0.00067138671875, 0.01220703125, 0.02374267578125, 0.0352783203125, 0.04681396484375, 0.058349609375, 0.06988525390625, 0.0814208984375, 0.09295654296875, 0.1044921875, 0.11602783203125, 0.1275634765625, 0.13909912109375, 0.150634765625, 0.16217041015625, 0.1737060546875, 0.18524169921875, 0.19677734375, 0.20831298828125, 0.2198486328125, 0.23138427734375, 0.242919921875, 0.25445556640625, 0.2659912109375, 0.27752685546875, 0.2890625, 0.30059814453125, 0.3121337890625, 0.32366943359375, 0.335205078125, 0.34674072265625, 0.3582763671875, 0.36981201171875, 0.38134765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 4.0, 7.0, 11.0, 14.0, 14.0, 28.0, 34.0, 48.0, 78.0, 133.0, 178.0, 131.0, 80.0, 79.0, 48.0, 29.0, 21.0, 11.0, 15.0, 8.0, 9.0, 5.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5212764739990234e-05, -2.436712384223938e-05, -2.3521482944488525e-05, -2.267584204673767e-05, -2.1830201148986816e-05, -2.0984560251235962e-05, -2.0138919353485107e-05, -1.9293278455734253e-05, -1.84476375579834e-05, -1.7601996660232544e-05, -1.675635576248169e-05, -1.5910714864730835e-05, -1.506507396697998e-05, -1.4219433069229126e-05, -1.3373792171478271e-05, -1.2528151273727417e-05, -1.1682510375976562e-05, -1.0836869478225708e-05, -9.991228580474854e-06, -9.145587682723999e-06, -8.299946784973145e-06, -7.45430588722229e-06, -6.6086649894714355e-06, -5.763024091720581e-06, -4.9173831939697266e-06, -4.071742296218872e-06, -3.2261013984680176e-06, -2.380460500717163e-06, -1.5348196029663086e-06, -6.891787052154541e-07, 1.564621925354004e-07, 1.0021030902862549e-06, 1.8477439880371094e-06, 2.693384885787964e-06, 3.5390257835388184e-06, 4.384666681289673e-06, 5.230307579040527e-06, 6.075948476791382e-06, 6.921589374542236e-06, 7.76723027229309e-06, 8.612871170043945e-06, 9.4585120677948e-06, 1.0304152965545654e-05, 1.1149793863296509e-05, 1.1995434761047363e-05, 1.2841075658798218e-05, 1.3686716556549072e-05, 1.4532357454299927e-05, 1.537799835205078e-05, 1.6223639249801636e-05, 1.706928014755249e-05, 1.7914921045303345e-05, 1.87605619430542e-05, 1.9606202840805054e-05, 2.0451843738555908e-05, 2.1297484636306763e-05, 2.2143125534057617e-05, 2.298876643180847e-05, 2.3834407329559326e-05, 2.468004822731018e-05, 2.5525689125061035e-05, 2.637133002281189e-05, 2.7216970920562744e-05, 2.80626118183136e-05, 2.8908252716064453e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 13.0, 12.0, 12.0, 22.0, 32.0, 63.0, 135.0, 269.0, 705.0, 2527.0, 14421.0, 193059.0, 781517.0, 47716.0, 5790.0, 1325.0, 505.0, 223.0, 81.0, 46.0, 21.0, 21.0, 11.0, 8.0, 1.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.32080078125, -0.31241607666015625, -0.3040313720703125, -0.29564666748046875, -0.287261962890625, -0.27887725830078125, -0.2704925537109375, -0.26210784912109375, -0.25372314453125, -0.24533843994140625, -0.2369537353515625, -0.22856903076171875, -0.220184326171875, -0.21179962158203125, -0.2034149169921875, -0.19503021240234375, -0.1866455078125, -0.17826080322265625, -0.1698760986328125, -0.16149139404296875, -0.153106689453125, -0.14472198486328125, -0.1363372802734375, -0.12795257568359375, -0.11956787109375, -0.11118316650390625, -0.1027984619140625, -0.09441375732421875, -0.086029052734375, -0.07764434814453125, -0.0692596435546875, -0.06087493896484375, -0.052490234375, -0.04410552978515625, -0.0357208251953125, -0.02733612060546875, -0.018951416015625, -0.01056671142578125, -0.0021820068359375, 0.00620269775390625, 0.01458740234375, 0.02297210693359375, 0.0313568115234375, 0.03974151611328125, 0.048126220703125, 0.05651092529296875, 0.0648956298828125, 0.07328033447265625, 0.0816650390625, 0.09004974365234375, 0.0984344482421875, 0.10681915283203125, 0.115203857421875, 0.12358856201171875, 0.1319732666015625, 0.14035797119140625, 0.14874267578125, 0.15712738037109375, 0.1655120849609375, 0.17389678955078125, 0.182281494140625, 0.19066619873046875, 0.1990509033203125, 0.20743560791015625, 0.2158203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 2.0, 13.0, 15.0, 7.0, 18.0, 23.0, 19.0, 32.0, 33.0, 66.0, 91.0, 168.0, 162.0, 95.0, 74.0, 47.0, 28.0, 21.0, 22.0, 11.0, 13.0, 6.0, 5.0, 7.0, 3.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06744384765625, -0.06474494934082031, -0.062046051025390625, -0.05934715270996094, -0.05664825439453125, -0.05394935607910156, -0.051250457763671875, -0.04855155944824219, -0.0458526611328125, -0.04315376281738281, -0.040454864501953125, -0.03775596618652344, -0.03505706787109375, -0.03235816955566406, -0.029659271240234375, -0.026960372924804688, -0.024261474609375, -0.021562576293945312, -0.018863677978515625, -0.016164779663085938, -0.01346588134765625, -0.010766983032226562, -0.008068084716796875, -0.0053691864013671875, -0.0026702880859375, 2.86102294921875e-05, 0.002727508544921875, 0.0054264068603515625, 0.00812530517578125, 0.010824203491210938, 0.013523101806640625, 0.016222000122070312, 0.0189208984375, 0.021619796752929688, 0.024318695068359375, 0.027017593383789062, 0.02971649169921875, 0.03241539001464844, 0.035114288330078125, 0.03781318664550781, 0.0405120849609375, 0.04321098327636719, 0.045909881591796875, 0.04860877990722656, 0.05130767822265625, 0.05400657653808594, 0.056705474853515625, 0.05940437316894531, 0.062103271484375, 0.06480216979980469, 0.06750106811523438, 0.07019996643066406, 0.07289886474609375, 0.07559776306152344, 0.07829666137695312, 0.08099555969238281, 0.0836944580078125, 0.08639335632324219, 0.08909225463867188, 0.09179115295410156, 0.09449005126953125, 0.09718894958496094, 0.09988784790039062, 0.10258674621582031, 0.10528564453125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 14.0, 16.0, 20.0, 32.0, 39.0, 64.0, 84.0, 109.0, 116.0, 121.0, 101.0, 83.0, 64.0, 46.0, 24.0, 19.0, 13.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1650704145431519, -1.1197429895401, -1.074415683746338, -1.0290882587432861, -0.9837608337402344, -0.9384334087371826, -0.8931060433387756, -0.8477786779403687, -0.8024512529373169, -0.7571238279342651, -0.7117964625358582, -0.6664690971374512, -0.6211416721343994, -0.5758142471313477, -0.5304868817329407, -0.4851594865322113, -0.43983209133148193, -0.39450469613075256, -0.3491773009300232, -0.3038499057292938, -0.25852251052856445, -0.21319511532783508, -0.1678677201271057, -0.12254032492637634, -0.07721292972564697, -0.0318855345249176, 0.013441860675811768, 0.05876925587654114, 0.10409665107727051, 0.14942404627799988, 0.19475144147872925, 0.24007883667945862, 0.28540611267089844, 0.3307335078716278, 0.3760609030723572, 0.42138829827308655, 0.4667156934738159, 0.5120431184768677, 0.5573704838752747, 0.6026978492736816, 0.6480252742767334, 0.6933526992797852, 0.7386800646781921, 0.7840074300765991, 0.8293348550796509, 0.8746622800827026, 0.9199896454811096, 0.9653170108795166, 1.0106444358825684, 1.0559718608856201, 1.1012992858886719, 1.146626591682434, 1.1919540166854858, 1.2372814416885376, 1.2826087474822998, 1.3279361724853516, 1.3732635974884033, 1.418591022491455, 1.4639184474945068, 1.509245753288269, 1.5545731782913208, 1.5999006032943726, 1.6452279090881348, 1.6905553340911865, 1.7358827590942383]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 1.0, 4.0, 2.0, 7.0, 9.0, 4.0, 14.0, 11.0, 24.0, 17.0, 14.0, 16.0, 27.0, 31.0, 27.0, 25.0, 36.0, 32.0, 28.0, 29.0, 32.0, 47.0, 34.0, 37.0, 36.0, 38.0, 36.0, 47.0, 44.0, 35.0, 38.0, 32.0, 28.0, 30.0, 27.0, 14.0, 14.0, 9.0, 10.0, 11.0, 10.0, 5.0, 9.0, 5.0, 3.0, 8.0, 3.0, 3.0, 1.0, 0.0, 4.0], "bins": [-1.4448002576828003, -1.4044328927993774, -1.3640656471252441, -1.3236982822418213, -1.2833309173583984, -1.2429635524749756, -1.2025963068008423, -1.1622289419174194, -1.1218616962432861, -1.0814943313598633, -1.04112708568573, -1.0007597208023071, -0.9603923559188843, -0.9200250506401062, -0.8796577453613281, -0.8392903804779053, -0.7989230155944824, -0.7585557103157043, -0.7181883454322815, -0.6778210401535034, -0.6374536752700806, -0.5970863699913025, -0.5567190647125244, -0.5163516998291016, -0.4759843945503235, -0.435617059469223, -0.39524972438812256, -0.3548824191093445, -0.314515084028244, -0.27414774894714355, -0.23378042876720428, -0.19341310858726501, -0.153045654296875, -0.11267832666635513, -0.07231099903583527, -0.0319436714053154, 0.008423656225204468, 0.04879099130630493, 0.0891583114862442, 0.12952563166618347, 0.16989296674728394, 0.2102603018283844, 0.25062763690948486, 0.29099494218826294, 0.3313622772693634, 0.37172961235046387, 0.41209691762924194, 0.4524642527103424, 0.49283158779144287, 0.533198893070221, 0.5735662579536438, 0.6139335632324219, 0.6543009281158447, 0.6946682333946228, 0.7350355386734009, 0.7754029035568237, 0.8157702088356018, 0.8561375141143799, 0.8965048789978027, 0.9368721842765808, 0.9772394895553589, 1.0176068544387817, 1.0579742193222046, 1.098341464996338, 1.1387088298797607]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 6.0, 9.0, 20.0, 17.0, 19.0, 41.0, 44.0, 76.0, 106.0, 169.0, 294.0, 486.0, 826.0, 1932.0, 4404.0, 14529.0, 81399.0, 1892925.0, 2082649.0, 89530.0, 15801.0, 4804.0, 1937.0, 937.0, 492.0, 285.0, 182.0, 107.0, 77.0, 48.0, 41.0, 26.0, 21.0, 4.0, 8.0, 10.0, 7.0, 4.0, 2.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.810546875, -0.7816162109375, -0.752685546875, -0.7237548828125, -0.69482421875, -0.6658935546875, -0.636962890625, -0.6080322265625, -0.5791015625, -0.5501708984375, -0.521240234375, -0.4923095703125, -0.46337890625, -0.4344482421875, -0.405517578125, -0.3765869140625, -0.34765625, -0.3187255859375, -0.289794921875, -0.2608642578125, -0.23193359375, -0.2030029296875, -0.174072265625, -0.1451416015625, -0.1162109375, -0.0872802734375, -0.058349609375, -0.0294189453125, -0.00048828125, 0.0284423828125, 0.057373046875, 0.0863037109375, 0.115234375, 0.1441650390625, 0.173095703125, 0.2020263671875, 0.23095703125, 0.2598876953125, 0.288818359375, 0.3177490234375, 0.3466796875, 0.3756103515625, 0.404541015625, 0.4334716796875, 0.46240234375, 0.4913330078125, 0.520263671875, 0.5491943359375, 0.578125, 0.6070556640625, 0.635986328125, 0.6649169921875, 0.69384765625, 0.7227783203125, 0.751708984375, 0.7806396484375, 0.8095703125, 0.8385009765625, 0.867431640625, 0.8963623046875, 0.92529296875, 0.9542236328125, 0.983154296875, 1.0120849609375, 1.041015625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 5.0, 7.0, 3.0, 8.0, 9.0, 13.0, 16.0, 22.0, 29.0, 25.0, 37.0, 29.0, 50.0, 51.0, 67.0, 52.0, 57.0, 55.0, 50.0, 49.0, 58.0, 53.0, 55.0, 39.0, 38.0, 32.0, 16.0, 22.0, 13.0, 9.0, 7.0, 9.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.458251953125, -0.44446563720703125, -0.4306793212890625, -0.41689300537109375, -0.403106689453125, -0.38932037353515625, -0.3755340576171875, -0.36174774169921875, -0.34796142578125, -0.33417510986328125, -0.3203887939453125, -0.30660247802734375, -0.292816162109375, -0.27902984619140625, -0.2652435302734375, -0.25145721435546875, -0.2376708984375, -0.22388458251953125, -0.2100982666015625, -0.19631195068359375, -0.182525634765625, -0.16873931884765625, -0.1549530029296875, -0.14116668701171875, -0.12738037109375, -0.11359405517578125, -0.0998077392578125, -0.08602142333984375, -0.072235107421875, -0.05844879150390625, -0.0446624755859375, -0.03087615966796875, -0.01708984375, -0.00330352783203125, 0.0104827880859375, 0.02426910400390625, 0.038055419921875, 0.05184173583984375, 0.0656280517578125, 0.07941436767578125, 0.09320068359375, 0.10698699951171875, 0.1207733154296875, 0.13455963134765625, 0.148345947265625, 0.16213226318359375, 0.1759185791015625, 0.18970489501953125, 0.2034912109375, 0.21727752685546875, 0.2310638427734375, 0.24485015869140625, 0.258636474609375, 0.27242279052734375, 0.2862091064453125, 0.29999542236328125, 0.31378173828125, 0.32756805419921875, 0.3413543701171875, 0.35514068603515625, 0.368927001953125, 0.38271331787109375, 0.3964996337890625, 0.41028594970703125, 0.424072265625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 9.0, 5.0, 10.0, 10.0, 16.0, 21.0, 36.0, 51.0, 69.0, 100.0, 153.0, 266.0, 483.0, 1048.0, 2923.0, 12783.0, 104028.0, 3553192.0, 481523.0, 29024.0, 5370.0, 1577.0, 693.0, 321.0, 202.0, 111.0, 73.0, 49.0, 47.0, 23.0, 20.0, 11.0, 4.0, 7.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.4074859619140625, -1.365753173828125, -1.3240203857421875, -1.28228759765625, -1.2405548095703125, -1.198822021484375, -1.1570892333984375, -1.1153564453125, -1.0736236572265625, -1.031890869140625, -0.9901580810546875, -0.94842529296875, -0.9066925048828125, -0.864959716796875, -0.8232269287109375, -0.781494140625, -0.7397613525390625, -0.698028564453125, -0.6562957763671875, -0.61456298828125, -0.5728302001953125, -0.531097412109375, -0.4893646240234375, -0.4476318359375, -0.4058990478515625, -0.364166259765625, -0.3224334716796875, -0.28070068359375, -0.2389678955078125, -0.197235107421875, -0.1555023193359375, -0.11376953125, -0.0720367431640625, -0.030303955078125, 0.0114288330078125, 0.05316162109375, 0.0948944091796875, 0.136627197265625, 0.1783599853515625, 0.2200927734375, 0.2618255615234375, 0.303558349609375, 0.3452911376953125, 0.38702392578125, 0.4287567138671875, 0.470489501953125, 0.5122222900390625, 0.553955078125, 0.5956878662109375, 0.637420654296875, 0.6791534423828125, 0.72088623046875, 0.7626190185546875, 0.804351806640625, 0.8460845947265625, 0.8878173828125, 0.9295501708984375, 0.971282958984375, 1.0130157470703125, 1.05474853515625, 1.0964813232421875, 1.138214111328125, 1.1799468994140625, 1.2216796875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 7.0, 15.0, 17.0, 38.0, 43.0, 70.0, 116.0, 197.0, 363.0, 583.0, 893.0, 721.0, 404.0, 207.0, 133.0, 85.0, 39.0, 35.0, 24.0, 16.0, 16.0, 8.0, 6.0, 5.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.297119140625, -0.2874183654785156, -0.27771759033203125, -0.2680168151855469, -0.2583160400390625, -0.24861526489257812, -0.23891448974609375, -0.22921371459960938, -0.219512939453125, -0.20981216430664062, -0.20011138916015625, -0.19041061401367188, -0.1807098388671875, -0.17100906372070312, -0.16130828857421875, -0.15160751342773438, -0.14190673828125, -0.13220596313476562, -0.12250518798828125, -0.11280441284179688, -0.1031036376953125, -0.09340286254882812, -0.08370208740234375, -0.07400131225585938, -0.064300537109375, -0.054599761962890625, -0.04489898681640625, -0.035198211669921875, -0.0254974365234375, -0.015796661376953125, -0.00609588623046875, 0.003604888916015625, 0.0133056640625, 0.023006439208984375, 0.03270721435546875, 0.042407989501953125, 0.0521087646484375, 0.061809539794921875, 0.07151031494140625, 0.08121109008789062, 0.090911865234375, 0.10061264038085938, 0.11031341552734375, 0.12001419067382812, 0.1297149658203125, 0.13941574096679688, 0.14911651611328125, 0.15881729125976562, 0.16851806640625, 0.17821884155273438, 0.18791961669921875, 0.19762039184570312, 0.2073211669921875, 0.21702194213867188, 0.22672271728515625, 0.23642349243164062, 0.246124267578125, 0.2558250427246094, 0.26552581787109375, 0.2752265930175781, 0.2849273681640625, 0.2946281433105469, 0.30432891845703125, 0.3140296936035156, 0.32373046875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 0.0, 2.0, 5.0, 4.0, 8.0, 14.0, 15.0, 14.0, 32.0, 32.0, 30.0, 47.0, 65.0, 67.0, 89.0, 84.0, 89.0, 88.0, 67.0, 63.0, 48.0, 31.0, 29.0, 23.0, 14.0, 11.0, 9.0, 9.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8688849210739136, -0.8431196808815002, -0.8173544406890869, -0.7915891408920288, -0.7658239006996155, -0.7400586605072021, -0.7142934203147888, -0.6885281801223755, -0.6627628803253174, -0.636997640132904, -0.6112323999404907, -0.5854671001434326, -0.5597018599510193, -0.533936619758606, -0.5081713795661926, -0.4824061393737793, -0.45664089918136597, -0.43087565898895264, -0.4051103889942169, -0.3793451488018036, -0.35357987880706787, -0.32781463861465454, -0.3020493984222412, -0.2762841582298279, -0.25051888823509216, -0.22475363314151764, -0.19898837804794312, -0.17322313785552979, -0.14745788276195526, -0.12169262766838074, -0.09592738747596741, -0.07016213238239288, -0.044396936893463135, -0.01863168552517891, 0.007133565843105316, 0.03289881348609924, 0.05866406857967377, 0.08442932367324829, 0.11019456386566162, 0.13595981895923615, 0.16172507405281067, 0.1874903291463852, 0.21325558423995972, 0.23902082443237305, 0.2647860646247864, 0.2905513346195221, 0.3163165748119354, 0.34208184480667114, 0.3678470849990845, 0.3936123251914978, 0.4193775951862335, 0.44514283537864685, 0.47090810537338257, 0.4966733455657959, 0.5224385857582092, 0.5482038259506226, 0.5739691257476807, 0.599734365940094, 0.6254996061325073, 0.6512649059295654, 0.6770301461219788, 0.7027953863143921, 0.7285606265068054, 0.7543258666992188, 0.7800911068916321]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 6.0, 14.0, 9.0, 19.0, 7.0, 24.0, 24.0, 32.0, 30.0, 28.0, 38.0, 29.0, 36.0, 46.0, 49.0, 51.0, 56.0, 50.0, 42.0, 46.0, 40.0, 46.0, 35.0, 41.0, 32.0, 31.0, 21.0, 22.0, 21.0, 14.0, 13.0, 8.0, 11.0, 6.0, 5.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.5837039947509766, -0.5664398670196533, -0.5491757988929749, -0.5319116711616516, -0.5146476030349731, -0.4973834753036499, -0.48011937737464905, -0.4628552794456482, -0.44559118151664734, -0.4283270835876465, -0.41106298565864563, -0.3937988877296448, -0.37653475999832153, -0.35927069187164307, -0.3420065641403198, -0.32474246621131897, -0.3074783682823181, -0.29021427035331726, -0.2729501724243164, -0.25568607449531555, -0.2384219616651535, -0.22115786373615265, -0.2038937509059906, -0.18662965297698975, -0.1693655550479889, -0.15210145711898804, -0.13483735918998718, -0.11757324635982513, -0.10030914843082428, -0.08304505050182343, -0.06578094512224197, -0.04851683974266052, -0.03125268220901489, -0.01398858055472374, 0.0032755210995674133, 0.020539622753858566, 0.03780372440814972, 0.055067822337150574, 0.07233192771673203, 0.08959603309631348, 0.10686013102531433, 0.12412422895431519, 0.14138832688331604, 0.1586524397134781, 0.17591653764247894, 0.1931806355714798, 0.21044474840164185, 0.2277088463306427, 0.24497294425964355, 0.2622370421886444, 0.27950114011764526, 0.2967652380466461, 0.314029335975647, 0.3312934637069702, 0.34855756163597107, 0.3658216595649719, 0.3830857574939728, 0.40034985542297363, 0.4176139533519745, 0.43487805128097534, 0.4521421790122986, 0.46940624713897705, 0.4866703748703003, 0.5039345026016235, 0.521198570728302]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 10.0, 6.0, 9.0, 27.0, 29.0, 53.0, 66.0, 90.0, 131.0, 224.0, 359.0, 596.0, 1114.0, 2087.0, 4040.0, 8338.0, 19034.0, 46272.0, 128440.0, 348262.0, 308992.0, 108431.0, 39847.0, 16684.0, 7384.0, 3657.0, 1816.0, 1027.0, 566.0, 340.0, 195.0, 130.0, 87.0, 66.0, 45.0, 27.0, 17.0, 17.0, 8.0, 8.0, 3.0, 1.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.1319580078125, -0.12828445434570312, -0.12461090087890625, -0.12093734741210938, -0.1172637939453125, -0.11359024047851562, -0.10991668701171875, -0.10624313354492188, -0.102569580078125, -0.09889602661132812, -0.09522247314453125, -0.09154891967773438, -0.0878753662109375, -0.08420181274414062, -0.08052825927734375, -0.07685470581054688, -0.07318115234375, -0.06950759887695312, -0.06583404541015625, -0.062160491943359375, -0.0584869384765625, -0.054813385009765625, -0.05113983154296875, -0.047466278076171875, -0.043792724609375, -0.040119171142578125, -0.03644561767578125, -0.032772064208984375, -0.0290985107421875, -0.025424957275390625, -0.02175140380859375, -0.018077850341796875, -0.014404296875, -0.010730743408203125, -0.00705718994140625, -0.003383636474609375, 0.0002899169921875, 0.003963470458984375, 0.00763702392578125, 0.011310577392578125, 0.014984130859375, 0.018657684326171875, 0.02233123779296875, 0.026004791259765625, 0.0296783447265625, 0.033351898193359375, 0.03702545166015625, 0.040699005126953125, 0.04437255859375, 0.048046112060546875, 0.05171966552734375, 0.055393218994140625, 0.0590667724609375, 0.06274032592773438, 0.06641387939453125, 0.07008743286132812, 0.073760986328125, 0.07743453979492188, 0.08110809326171875, 0.08478164672851562, 0.0884552001953125, 0.09212875366210938, 0.09580230712890625, 0.09947586059570312, 0.1031494140625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 6.0, 7.0, 7.0, 12.0, 17.0, 18.0, 22.0, 26.0, 33.0, 35.0, 34.0, 43.0, 38.0, 59.0, 54.0, 66.0, 46.0, 69.0, 50.0, 44.0, 48.0, 40.0, 39.0, 35.0, 25.0, 26.0, 26.0, 10.0, 14.0, 12.0, 9.0, 9.0, 7.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.3874168395996094, -0.37541961669921875, -0.3634223937988281, -0.3514251708984375, -0.3394279479980469, -0.32743072509765625, -0.3154335021972656, -0.303436279296875, -0.2914390563964844, -0.27944183349609375, -0.2674446105957031, -0.2554473876953125, -0.24345016479492188, -0.23145294189453125, -0.21945571899414062, -0.20745849609375, -0.19546127319335938, -0.18346405029296875, -0.17146682739257812, -0.1594696044921875, -0.14747238159179688, -0.13547515869140625, -0.12347793579101562, -0.111480712890625, -0.09948348999023438, -0.08748626708984375, -0.07548904418945312, -0.0634918212890625, -0.051494598388671875, -0.03949737548828125, -0.027500152587890625, -0.0155029296875, -0.003505706787109375, 0.00849151611328125, 0.020488739013671875, 0.0324859619140625, 0.044483184814453125, 0.05648040771484375, 0.06847763061523438, 0.080474853515625, 0.09247207641601562, 0.10446929931640625, 0.11646652221679688, 0.1284637451171875, 0.14046096801757812, 0.15245819091796875, 0.16445541381835938, 0.17645263671875, 0.18844985961914062, 0.20044708251953125, 0.21244430541992188, 0.2244415283203125, 0.23643875122070312, 0.24843597412109375, 0.2604331970214844, 0.272430419921875, 0.2844276428222656, 0.29642486572265625, 0.3084220886230469, 0.3204193115234375, 0.3324165344238281, 0.34441375732421875, 0.3564109802246094, 0.368408203125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 5.0, 17.0, 19.0, 27.0, 42.0, 68.0, 97.0, 171.0, 305.0, 593.0, 1266.0, 3054.0, 10104.0, 44758.0, 290606.0, 567130.0, 102774.0, 18826.0, 5147.0, 1803.0, 808.0, 387.0, 221.0, 126.0, 63.0, 38.0, 29.0, 22.0, 13.0, 7.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1614990234375, -0.15663909912109375, -0.1517791748046875, -0.14691925048828125, -0.142059326171875, -0.13719940185546875, -0.1323394775390625, -0.12747955322265625, -0.12261962890625, -0.11775970458984375, -0.1128997802734375, -0.10803985595703125, -0.103179931640625, -0.09832000732421875, -0.0934600830078125, -0.08860015869140625, -0.083740234375, -0.07888031005859375, -0.0740203857421875, -0.06916046142578125, -0.064300537109375, -0.05944061279296875, -0.0545806884765625, -0.04972076416015625, -0.04486083984375, -0.04000091552734375, -0.0351409912109375, -0.03028106689453125, -0.025421142578125, -0.02056121826171875, -0.0157012939453125, -0.01084136962890625, -0.0059814453125, -0.00112152099609375, 0.0037384033203125, 0.00859832763671875, 0.013458251953125, 0.01831817626953125, 0.0231781005859375, 0.02803802490234375, 0.03289794921875, 0.03775787353515625, 0.0426177978515625, 0.04747772216796875, 0.052337646484375, 0.05719757080078125, 0.0620574951171875, 0.06691741943359375, 0.07177734375, 0.07663726806640625, 0.0814971923828125, 0.08635711669921875, 0.091217041015625, 0.09607696533203125, 0.1009368896484375, 0.10579681396484375, 0.11065673828125, 0.11551666259765625, 0.1203765869140625, 0.12523651123046875, 0.130096435546875, 0.13495635986328125, 0.1398162841796875, 0.14467620849609375, 0.1495361328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 9.0, 4.0, 6.0, 7.0, 9.0, 11.0, 12.0, 17.0, 14.0, 15.0, 26.0, 42.0, 25.0, 22.0, 38.0, 30.0, 40.0, 42.0, 49.0, 61.0, 47.0, 45.0, 65.0, 30.0, 55.0, 39.0, 41.0, 34.0, 24.0, 24.0, 21.0, 16.0, 14.0, 19.0, 7.0, 5.0, 9.0, 5.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.67236328125, -0.650604248046875, -0.62884521484375, -0.607086181640625, -0.5853271484375, -0.563568115234375, -0.54180908203125, -0.520050048828125, -0.498291015625, -0.476531982421875, -0.45477294921875, -0.433013916015625, -0.4112548828125, -0.389495849609375, -0.36773681640625, -0.345977783203125, -0.32421875, -0.302459716796875, -0.28070068359375, -0.258941650390625, -0.2371826171875, -0.215423583984375, -0.19366455078125, -0.171905517578125, -0.150146484375, -0.128387451171875, -0.10662841796875, -0.084869384765625, -0.0631103515625, -0.041351318359375, -0.01959228515625, 0.002166748046875, 0.02392578125, 0.045684814453125, 0.06744384765625, 0.089202880859375, 0.1109619140625, 0.132720947265625, 0.15447998046875, 0.176239013671875, 0.197998046875, 0.219757080078125, 0.24151611328125, 0.263275146484375, 0.2850341796875, 0.306793212890625, 0.32855224609375, 0.350311279296875, 0.3720703125, 0.393829345703125, 0.41558837890625, 0.437347412109375, 0.4591064453125, 0.480865478515625, 0.50262451171875, 0.524383544921875, 0.546142578125, 0.567901611328125, 0.58966064453125, 0.611419677734375, 0.6331787109375, 0.654937744140625, 0.67669677734375, 0.698455810546875, 0.72021484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 8.0, 9.0, 13.0, 29.0, 33.0, 43.0, 90.0, 152.0, 278.0, 600.0, 1112.0, 2431.0, 6358.0, 20085.0, 93995.0, 632245.0, 235594.0, 38019.0, 10455.0, 3688.0, 1508.0, 800.0, 396.0, 216.0, 135.0, 86.0, 52.0, 30.0, 21.0, 20.0, 11.0, 15.0, 6.0, 1.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0], "bins": [-0.1046142578125, -0.1019124984741211, -0.09921073913574219, -0.09650897979736328, -0.09380722045898438, -0.09110546112060547, -0.08840370178222656, -0.08570194244384766, -0.08300018310546875, -0.08029842376708984, -0.07759666442871094, -0.07489490509033203, -0.07219314575195312, -0.06949138641357422, -0.06678962707519531, -0.0640878677368164, -0.0613861083984375, -0.058684349060058594, -0.05598258972167969, -0.05328083038330078, -0.050579071044921875, -0.04787731170654297, -0.04517555236816406, -0.042473793029785156, -0.03977203369140625, -0.037070274353027344, -0.03436851501464844, -0.03166675567626953, -0.028964996337890625, -0.02626323699951172, -0.023561477661132812, -0.020859718322753906, -0.018157958984375, -0.015456199645996094, -0.012754440307617188, -0.010052680969238281, -0.007350921630859375, -0.004649162292480469, -0.0019474029541015625, 0.0007543563842773438, 0.00345611572265625, 0.006157875061035156, 0.008859634399414062, 0.011561393737792969, 0.014263153076171875, 0.01696491241455078, 0.019666671752929688, 0.022368431091308594, 0.0250701904296875, 0.027771949768066406, 0.030473709106445312, 0.03317546844482422, 0.035877227783203125, 0.03857898712158203, 0.04128074645996094, 0.043982505798339844, 0.04668426513671875, 0.049386024475097656, 0.05208778381347656, 0.05478954315185547, 0.057491302490234375, 0.06019306182861328, 0.06289482116699219, 0.0655965805053711, 0.06829833984375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 7.0, 14.0, 13.0, 17.0, 25.0, 30.0, 54.0, 68.0, 85.0, 117.0, 145.0, 101.0, 72.0, 76.0, 46.0, 46.0, 18.0, 10.0, 12.0, 15.0, 7.0, 7.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.947185516357422e-05, -4.8177316784858704e-05, -4.688277840614319e-05, -4.558824002742767e-05, -4.429370164871216e-05, -4.299916326999664e-05, -4.170462489128113e-05, -4.041008651256561e-05, -3.91155481338501e-05, -3.782100975513458e-05, -3.652647137641907e-05, -3.523193299770355e-05, -3.393739461898804e-05, -3.264285624027252e-05, -3.134831786155701e-05, -3.0053779482841492e-05, -2.8759241104125977e-05, -2.746470272541046e-05, -2.6170164346694946e-05, -2.487562596797943e-05, -2.3581087589263916e-05, -2.22865492105484e-05, -2.0992010831832886e-05, -1.969747245311737e-05, -1.8402934074401855e-05, -1.710839569568634e-05, -1.5813857316970825e-05, -1.451931893825531e-05, -1.3224780559539795e-05, -1.193024218082428e-05, -1.0635703802108765e-05, -9.34116542339325e-06, -8.046627044677734e-06, -6.752088665962219e-06, -5.457550287246704e-06, -4.163011908531189e-06, -2.868473529815674e-06, -1.5739351511001587e-06, -2.7939677238464355e-07, 1.0151416063308716e-06, 2.3096799850463867e-06, 3.604218363761902e-06, 4.898756742477417e-06, 6.193295121192932e-06, 7.487833499908447e-06, 8.782371878623962e-06, 1.0076910257339478e-05, 1.1371448636054993e-05, 1.2665987014770508e-05, 1.3960525393486023e-05, 1.5255063772201538e-05, 1.6549602150917053e-05, 1.784414052963257e-05, 1.9138678908348083e-05, 2.04332172870636e-05, 2.1727755665779114e-05, 2.302229404449463e-05, 2.4316832423210144e-05, 2.561137080192566e-05, 2.6905909180641174e-05, 2.820044755935669e-05, 2.9494985938072205e-05, 3.078952431678772e-05, 3.2084062695503235e-05, 3.337860107421875e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 21.0, 34.0, 32.0, 75.0, 120.0, 199.0, 309.0, 590.0, 1081.0, 2015.0, 3961.0, 8769.0, 21196.0, 56299.0, 186724.0, 492887.0, 181585.0, 54909.0, 20626.0, 8714.0, 3950.0, 2007.0, 1046.0, 564.0, 333.0, 207.0, 101.0, 59.0, 54.0, 29.0, 16.0, 12.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0689697265625, -0.06670761108398438, -0.06444549560546875, -0.062183380126953125, -0.0599212646484375, -0.057659149169921875, -0.05539703369140625, -0.053134918212890625, -0.050872802734375, -0.048610687255859375, -0.04634857177734375, -0.044086456298828125, -0.0418243408203125, -0.039562225341796875, -0.03730010986328125, -0.035037994384765625, -0.03277587890625, -0.030513763427734375, -0.02825164794921875, -0.025989532470703125, -0.0237274169921875, -0.021465301513671875, -0.01920318603515625, -0.016941070556640625, -0.014678955078125, -0.012416839599609375, -0.01015472412109375, -0.007892608642578125, -0.0056304931640625, -0.003368377685546875, -0.00110626220703125, 0.001155853271484375, 0.00341796875, 0.005680084228515625, 0.00794219970703125, 0.010204315185546875, 0.0124664306640625, 0.014728546142578125, 0.01699066162109375, 0.019252777099609375, 0.021514892578125, 0.023777008056640625, 0.02603912353515625, 0.028301239013671875, 0.0305633544921875, 0.032825469970703125, 0.03508758544921875, 0.037349700927734375, 0.03961181640625, 0.041873931884765625, 0.04413604736328125, 0.046398162841796875, 0.0486602783203125, 0.050922393798828125, 0.05318450927734375, 0.055446624755859375, 0.057708740234375, 0.059970855712890625, 0.06223297119140625, 0.06449508666992188, 0.0667572021484375, 0.06901931762695312, 0.07128143310546875, 0.07354354858398438, 0.0758056640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 5.0, 6.0, 9.0, 9.0, 7.0, 8.0, 13.0, 19.0, 16.0, 43.0, 50.0, 61.0, 68.0, 70.0, 109.0, 94.0, 89.0, 61.0, 51.0, 43.0, 34.0, 21.0, 23.0, 19.0, 7.0, 10.0, 7.0, 11.0, 8.0, 2.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015533447265625, -0.014957189559936523, -0.014380931854248047, -0.01380467414855957, -0.013228416442871094, -0.012652158737182617, -0.01207590103149414, -0.011499643325805664, -0.010923385620117188, -0.010347127914428711, -0.009770870208740234, -0.009194612503051758, -0.008618354797363281, -0.008042097091674805, -0.007465839385986328, -0.0068895816802978516, -0.006313323974609375, -0.0057370662689208984, -0.005160808563232422, -0.004584550857543945, -0.004008293151855469, -0.003432035446166992, -0.0028557777404785156, -0.002279520034790039, -0.0017032623291015625, -0.001127004623413086, -0.0005507469177246094, 2.5510787963867188e-05, 0.0006017684936523438, 0.0011780261993408203, 0.0017542839050292969, 0.0023305416107177734, 0.00290679931640625, 0.0034830570220947266, 0.004059314727783203, 0.00463557243347168, 0.005211830139160156, 0.005788087844848633, 0.006364345550537109, 0.006940603256225586, 0.0075168609619140625, 0.008093118667602539, 0.008669376373291016, 0.009245634078979492, 0.009821891784667969, 0.010398149490356445, 0.010974407196044922, 0.011550664901733398, 0.012126922607421875, 0.012703180313110352, 0.013279438018798828, 0.013855695724487305, 0.014431953430175781, 0.015008211135864258, 0.015584468841552734, 0.01616072654724121, 0.016736984252929688, 0.017313241958618164, 0.01788949966430664, 0.018465757369995117, 0.019042015075683594, 0.01961827278137207, 0.020194530487060547, 0.020770788192749023, 0.0213470458984375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 18.0, 9.0, 13.0, 21.0, 22.0, 44.0, 42.0, 57.0, 71.0, 77.0, 74.0, 99.0, 86.0, 86.0, 76.0, 50.0, 36.0, 26.0, 29.0, 11.0, 11.0, 10.0, 6.0, 4.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43381404876708984, -0.4177893102169037, -0.4017646014690399, -0.38573986291885376, -0.36971515417099, -0.35369041562080383, -0.3376656770706177, -0.3216409683227539, -0.30561622977256775, -0.2895914912223816, -0.2735667824745178, -0.25754204392433167, -0.2415173202753067, -0.22549259662628174, -0.20946785807609558, -0.19344313442707062, -0.17741841077804565, -0.1613936871290207, -0.14536896347999573, -0.12934422492980957, -0.1133195012807846, -0.09729477763175964, -0.08127004653215408, -0.06524531543254852, -0.04922059178352356, -0.0331958644092083, -0.017171137034893036, -0.001146409660577774, 0.014878317713737488, 0.03090304136276245, 0.04692777246236801, 0.06295250356197357, 0.07897722721099854, 0.0950019508600235, 0.11102668195962906, 0.12705141305923462, 0.14307613670825958, 0.15910086035728455, 0.1751255989074707, 0.19115032255649567, 0.20717504620552063, 0.2231997698545456, 0.23922449350357056, 0.2552492320537567, 0.27127397060394287, 0.28729867935180664, 0.3033234179019928, 0.31934815645217896, 0.3353728652000427, 0.3513976037502289, 0.36742231249809265, 0.3834470510482788, 0.3994717597961426, 0.41549649834632874, 0.4315212368965149, 0.44754594564437866, 0.4635706841945648, 0.479595422744751, 0.49562013149261475, 0.5116448402404785, 0.5276696085929871, 0.5436943173408508, 0.5597190260887146, 0.5757437944412231, 0.5917685031890869]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 12.0, 12.0, 13.0, 12.0, 19.0, 32.0, 21.0, 37.0, 43.0, 42.0, 38.0, 42.0, 59.0, 58.0, 61.0, 59.0, 49.0, 51.0, 57.0, 34.0, 55.0, 34.0, 27.0, 26.0, 20.0, 20.0, 17.0, 6.0, 6.0, 8.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.43590986728668213, -0.424064040184021, -0.41221821308135986, -0.40037235617637634, -0.3885265290737152, -0.3766807019710541, -0.36483484506607056, -0.3529890179634094, -0.3411431908607483, -0.32929736375808716, -0.317451536655426, -0.3056056797504425, -0.29375985264778137, -0.28191402554512024, -0.2700681686401367, -0.2582223415374756, -0.24637651443481445, -0.23453068733215332, -0.222684845328331, -0.21083900332450867, -0.19899317622184753, -0.1871473491191864, -0.17530150711536407, -0.16345566511154175, -0.15160983800888062, -0.13976401090621948, -0.12791816890239716, -0.11607233434915543, -0.1042264997959137, -0.09238066524267197, -0.08053483068943024, -0.06868899613618851, -0.05684316158294678, -0.04499732702970505, -0.03315149247646332, -0.021305657923221588, -0.009459823369979858, 0.0023860111832618713, 0.014231845736503601, 0.02607768028974533, 0.03792351484298706, 0.04976934939622879, 0.06161518394947052, 0.07346101850271225, 0.08530685305595398, 0.09715268760919571, 0.10899852216243744, 0.12084435671567917, 0.1326901912689209, 0.14453601837158203, 0.15638186037540436, 0.16822770237922668, 0.18007352948188782, 0.19191935658454895, 0.20376519858837128, 0.2156110405921936, 0.22745686769485474, 0.23930269479751587, 0.251148521900177, 0.2629943788051605, 0.27484020590782166, 0.2866860330104828, 0.2985318899154663, 0.31037771701812744, 0.3222235441207886]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 11.0, 18.0, 32.0, 33.0, 55.0, 80.0, 129.0, 227.0, 405.0, 607.0, 1140.0, 1904.0, 3254.0, 5989.0, 11417.0, 23175.0, 59920.0, 230472.0, 492540.0, 136710.0, 42130.0, 18057.0, 9020.0, 4791.0, 2663.0, 1447.0, 923.0, 521.0, 335.0, 204.0, 123.0, 73.0, 50.0, 36.0, 21.0, 16.0, 8.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4716796875, -0.45793914794921875, -0.4441986083984375, -0.43045806884765625, -0.416717529296875, -0.40297698974609375, -0.3892364501953125, -0.37549591064453125, -0.36175537109375, -0.34801483154296875, -0.3342742919921875, -0.32053375244140625, -0.306793212890625, -0.29305267333984375, -0.2793121337890625, -0.26557159423828125, -0.2518310546875, -0.23809051513671875, -0.2243499755859375, -0.21060943603515625, -0.196868896484375, -0.18312835693359375, -0.1693878173828125, -0.15564727783203125, -0.14190673828125, -0.12816619873046875, -0.1144256591796875, -0.10068511962890625, -0.086944580078125, -0.07320404052734375, -0.0594635009765625, -0.04572296142578125, -0.031982421875, -0.01824188232421875, -0.0045013427734375, 0.00923919677734375, 0.022979736328125, 0.03672027587890625, 0.0504608154296875, 0.06420135498046875, 0.07794189453125, 0.09168243408203125, 0.1054229736328125, 0.11916351318359375, 0.132904052734375, 0.14664459228515625, 0.1603851318359375, 0.17412567138671875, 0.1878662109375, 0.20160675048828125, 0.2153472900390625, 0.22908782958984375, 0.242828369140625, 0.25656890869140625, 0.2703094482421875, 0.28404998779296875, 0.29779052734375, 0.31153106689453125, 0.3252716064453125, 0.33901214599609375, 0.352752685546875, 0.36649322509765625, 0.3802337646484375, 0.39397430419921875, 0.40771484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 7.0, 6.0, 13.0, 15.0, 14.0, 21.0, 26.0, 25.0, 43.0, 33.0, 45.0, 37.0, 53.0, 47.0, 50.0, 54.0, 65.0, 58.0, 54.0, 49.0, 39.0, 42.0, 32.0, 40.0, 22.0, 26.0, 18.0, 15.0, 9.0, 9.0, 5.0, 7.0, 6.0, 1.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84814453125, -0.8230438232421875, -0.797943115234375, -0.7728424072265625, -0.74774169921875, -0.7226409912109375, -0.697540283203125, -0.6724395751953125, -0.6473388671875, -0.6222381591796875, -0.597137451171875, -0.5720367431640625, -0.54693603515625, -0.5218353271484375, -0.496734619140625, -0.4716339111328125, -0.446533203125, -0.4214324951171875, -0.396331787109375, -0.3712310791015625, -0.34613037109375, -0.3210296630859375, -0.295928955078125, -0.2708282470703125, -0.2457275390625, -0.2206268310546875, -0.195526123046875, -0.1704254150390625, -0.14532470703125, -0.1202239990234375, -0.095123291015625, -0.0700225830078125, -0.044921875, -0.0198211669921875, 0.005279541015625, 0.0303802490234375, 0.05548095703125, 0.0805816650390625, 0.105682373046875, 0.1307830810546875, 0.1558837890625, 0.1809844970703125, 0.206085205078125, 0.2311859130859375, 0.25628662109375, 0.2813873291015625, 0.306488037109375, 0.3315887451171875, 0.356689453125, 0.3817901611328125, 0.406890869140625, 0.4319915771484375, 0.45709228515625, 0.4821929931640625, 0.507293701171875, 0.5323944091796875, 0.5574951171875, 0.5825958251953125, 0.607696533203125, 0.6327972412109375, 0.65789794921875, 0.6829986572265625, 0.708099365234375, 0.7332000732421875, 0.75830078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 14.0, 27.0, 49.0, 116.0, 250.0, 685.0, 2401.0, 12026.0, 122324.0, 854959.0, 46493.0, 6846.0, 1534.0, 463.0, 152.0, 101.0, 44.0, 22.0, 13.0, 10.0, 7.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2041015625, -1.163055419921875, -1.12200927734375, -1.080963134765625, -1.0399169921875, -0.998870849609375, -0.95782470703125, -0.916778564453125, -0.875732421875, -0.834686279296875, -0.79364013671875, -0.752593994140625, -0.7115478515625, -0.670501708984375, -0.62945556640625, -0.588409423828125, -0.54736328125, -0.506317138671875, -0.46527099609375, -0.424224853515625, -0.3831787109375, -0.342132568359375, -0.30108642578125, -0.260040283203125, -0.218994140625, -0.177947998046875, -0.13690185546875, -0.095855712890625, -0.0548095703125, -0.013763427734375, 0.02728271484375, 0.068328857421875, 0.109375, 0.150421142578125, 0.19146728515625, 0.232513427734375, 0.2735595703125, 0.314605712890625, 0.35565185546875, 0.396697998046875, 0.437744140625, 0.478790283203125, 0.51983642578125, 0.560882568359375, 0.6019287109375, 0.642974853515625, 0.68402099609375, 0.725067138671875, 0.76611328125, 0.807159423828125, 0.84820556640625, 0.889251708984375, 0.9302978515625, 0.971343994140625, 1.01239013671875, 1.053436279296875, 1.094482421875, 1.135528564453125, 1.17657470703125, 1.217620849609375, 1.2586669921875, 1.299713134765625, 1.34075927734375, 1.381805419921875, 1.4228515625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 9.0, 8.0, 11.0, 18.0, 13.0, 16.0, 20.0, 19.0, 36.0, 37.0, 31.0, 45.0, 40.0, 47.0, 50.0, 45.0, 57.0, 56.0, 58.0, 43.0, 36.0, 44.0, 34.0, 32.0, 28.0, 32.0, 27.0, 25.0, 19.0, 8.0, 5.0, 7.0, 7.0, 2.0, 8.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0], "bins": [-0.94384765625, -0.9179840087890625, -0.892120361328125, -0.8662567138671875, -0.84039306640625, -0.8145294189453125, -0.788665771484375, -0.7628021240234375, -0.7369384765625, -0.7110748291015625, -0.685211181640625, -0.6593475341796875, -0.63348388671875, -0.6076202392578125, -0.581756591796875, -0.5558929443359375, -0.530029296875, -0.5041656494140625, -0.478302001953125, -0.4524383544921875, -0.42657470703125, -0.4007110595703125, -0.374847412109375, -0.3489837646484375, -0.3231201171875, -0.2972564697265625, -0.271392822265625, -0.2455291748046875, -0.21966552734375, -0.1938018798828125, -0.167938232421875, -0.1420745849609375, -0.1162109375, -0.0903472900390625, -0.064483642578125, -0.0386199951171875, -0.01275634765625, 0.0131072998046875, 0.038970947265625, 0.0648345947265625, 0.0906982421875, 0.1165618896484375, 0.142425537109375, 0.1682891845703125, 0.19415283203125, 0.2200164794921875, 0.245880126953125, 0.2717437744140625, 0.297607421875, 0.3234710693359375, 0.349334716796875, 0.3751983642578125, 0.40106201171875, 0.4269256591796875, 0.452789306640625, 0.4786529541015625, 0.5045166015625, 0.5303802490234375, 0.556243896484375, 0.5821075439453125, 0.60797119140625, 0.6338348388671875, 0.659698486328125, 0.6855621337890625, 0.71142578125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 7.0, 4.0, 10.0, 15.0, 17.0, 31.0, 73.0, 137.0, 303.0, 883.0, 2912.0, 14954.0, 115646.0, 699699.0, 185336.0, 22748.0, 4027.0, 1049.0, 380.0, 136.0, 80.0, 35.0, 22.0, 16.0, 13.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1737060546875, -0.16664695739746094, -0.15958786010742188, -0.1525287628173828, -0.14546966552734375, -0.1384105682373047, -0.13135147094726562, -0.12429237365722656, -0.1172332763671875, -0.11017417907714844, -0.10311508178710938, -0.09605598449707031, -0.08899688720703125, -0.08193778991699219, -0.07487869262695312, -0.06781959533691406, -0.060760498046875, -0.05370140075683594, -0.046642303466796875, -0.03958320617675781, -0.03252410888671875, -0.025465011596679688, -0.018405914306640625, -0.011346817016601562, -0.0042877197265625, 0.0027713775634765625, 0.009830474853515625, 0.016889572143554688, 0.02394866943359375, 0.031007766723632812, 0.038066864013671875, 0.04512596130371094, 0.05218505859375, 0.05924415588378906, 0.06630325317382812, 0.07336235046386719, 0.08042144775390625, 0.08748054504394531, 0.09453964233398438, 0.10159873962402344, 0.1086578369140625, 0.11571693420410156, 0.12277603149414062, 0.1298351287841797, 0.13689422607421875, 0.1439533233642578, 0.15101242065429688, 0.15807151794433594, 0.165130615234375, 0.17218971252441406, 0.17924880981445312, 0.1863079071044922, 0.19336700439453125, 0.2004261016845703, 0.20748519897460938, 0.21454429626464844, 0.2216033935546875, 0.22866249084472656, 0.23572158813476562, 0.2427806854248047, 0.24983978271484375, 0.2568988800048828, 0.2639579772949219, 0.27101707458496094, 0.278076171875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 11.0, 4.0, 6.0, 13.0, 7.0, 9.0, 22.0, 30.0, 27.0, 41.0, 59.0, 63.0, 91.0, 123.0, 107.0, 92.0, 74.0, 59.0, 46.0, 20.0, 22.0, 25.0, 12.0, 18.0, 14.0, 3.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.11732292175293e-05, -3.033410757780075e-05, -2.9494985938072205e-05, -2.865586429834366e-05, -2.7816742658615112e-05, -2.6977621018886566e-05, -2.613849937915802e-05, -2.5299377739429474e-05, -2.4460256099700928e-05, -2.362113445997238e-05, -2.2782012820243835e-05, -2.194289118051529e-05, -2.1103769540786743e-05, -2.0264647901058197e-05, -1.942552626132965e-05, -1.8586404621601105e-05, -1.774728298187256e-05, -1.6908161342144012e-05, -1.6069039702415466e-05, -1.522991806268692e-05, -1.4390796422958374e-05, -1.3551674783229828e-05, -1.2712553143501282e-05, -1.1873431503772736e-05, -1.103430986404419e-05, -1.0195188224315643e-05, -9.356066584587097e-06, -8.516944944858551e-06, -7.677823305130005e-06, -6.838701665401459e-06, -5.999580025672913e-06, -5.1604583859443665e-06, -4.32133674621582e-06, -3.482215106487274e-06, -2.643093466758728e-06, -1.8039718270301819e-06, -9.648501873016357e-07, -1.257285475730896e-07, 7.133930921554565e-07, 1.5525147318840027e-06, 2.391636371612549e-06, 3.230758011341095e-06, 4.069879651069641e-06, 4.909001290798187e-06, 5.748122930526733e-06, 6.5872445702552795e-06, 7.426366209983826e-06, 8.265487849712372e-06, 9.104609489440918e-06, 9.943731129169464e-06, 1.078285276889801e-05, 1.1621974408626556e-05, 1.2461096048355103e-05, 1.3300217688083649e-05, 1.4139339327812195e-05, 1.4978460967540741e-05, 1.5817582607269287e-05, 1.6656704246997833e-05, 1.749582588672638e-05, 1.8334947526454926e-05, 1.917406916618347e-05, 2.0013190805912018e-05, 2.0852312445640564e-05, 2.169143408536911e-05, 2.2530555725097656e-05]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 11.0, 8.0, 13.0, 22.0, 20.0, 30.0, 64.0, 103.0, 255.0, 701.0, 2130.0, 9160.0, 55004.0, 437698.0, 471320.0, 58753.0, 9764.0, 2300.0, 628.0, 255.0, 106.0, 74.0, 43.0, 20.0, 16.0, 15.0, 7.0, 12.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.208984375, -0.2017822265625, -0.194580078125, -0.1873779296875, -0.18017578125, -0.1729736328125, -0.165771484375, -0.1585693359375, -0.1513671875, -0.1441650390625, -0.136962890625, -0.1297607421875, -0.12255859375, -0.1153564453125, -0.108154296875, -0.1009521484375, -0.09375, -0.0865478515625, -0.079345703125, -0.0721435546875, -0.06494140625, -0.0577392578125, -0.050537109375, -0.0433349609375, -0.0361328125, -0.0289306640625, -0.021728515625, -0.0145263671875, -0.00732421875, -0.0001220703125, 0.007080078125, 0.0142822265625, 0.021484375, 0.0286865234375, 0.035888671875, 0.0430908203125, 0.05029296875, 0.0574951171875, 0.064697265625, 0.0718994140625, 0.0791015625, 0.0863037109375, 0.093505859375, 0.1007080078125, 0.10791015625, 0.1151123046875, 0.122314453125, 0.1295166015625, 0.13671875, 0.1439208984375, 0.151123046875, 0.1583251953125, 0.16552734375, 0.1727294921875, 0.179931640625, 0.1871337890625, 0.1943359375, 0.2015380859375, 0.208740234375, 0.2159423828125, 0.22314453125, 0.2303466796875, 0.237548828125, 0.2447509765625, 0.251953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 16.0, 13.0, 22.0, 18.0, 32.0, 28.0, 37.0, 42.0, 48.0, 71.0, 74.0, 118.0, 87.0, 66.0, 46.0, 54.0, 41.0, 45.0, 35.0, 24.0, 14.0, 20.0, 13.0, 7.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06256103515625, -0.059897422790527344, -0.05723381042480469, -0.05457019805908203, -0.051906585693359375, -0.04924297332763672, -0.04657936096191406, -0.043915748596191406, -0.04125213623046875, -0.038588523864746094, -0.03592491149902344, -0.03326129913330078, -0.030597686767578125, -0.02793407440185547, -0.025270462036132812, -0.022606849670410156, -0.0199432373046875, -0.017279624938964844, -0.014616012573242188, -0.011952400207519531, -0.009288787841796875, -0.006625175476074219, -0.0039615631103515625, -0.0012979507446289062, 0.00136566162109375, 0.004029273986816406, 0.0066928863525390625, 0.009356498718261719, 0.012020111083984375, 0.014683723449707031, 0.017347335815429688, 0.020010948181152344, 0.022674560546875, 0.025338172912597656, 0.028001785278320312, 0.03066539764404297, 0.033329010009765625, 0.03599262237548828, 0.03865623474121094, 0.041319847106933594, 0.04398345947265625, 0.046647071838378906, 0.04931068420410156, 0.05197429656982422, 0.054637908935546875, 0.05730152130126953, 0.05996513366699219, 0.06262874603271484, 0.0652923583984375, 0.06795597076416016, 0.07061958312988281, 0.07328319549560547, 0.07594680786132812, 0.07861042022705078, 0.08127403259277344, 0.0839376449584961, 0.08660125732421875, 0.0892648696899414, 0.09192848205566406, 0.09459209442138672, 0.09725570678710938, 0.09991931915283203, 0.10258293151855469, 0.10524654388427734, 0.10791015625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 3.0, 18.0, 30.0, 53.0, 95.0, 139.0, 191.0, 174.0, 129.0, 84.0, 44.0, 27.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4290276765823364, -1.353173851966858, -1.2773200273513794, -1.2014660835266113, -1.1256122589111328, -1.0497584342956543, -0.9739046096801758, -0.8980507254600525, -0.822196900844574, -0.7463430762290955, -0.6704891920089722, -0.5946353673934937, -0.5187815427780151, -0.44292765855789185, -0.36707383394241333, -0.29121994972229004, -0.21536612510681152, -0.13951227068901062, -0.06365843117237091, 0.012195408344268799, 0.0880492627620697, 0.1639031171798706, 0.23975694179534912, 0.3156108260154724, 0.3914646506309509, 0.46731850504875183, 0.5431723594665527, 0.6190261840820312, 0.6948800086975098, 0.7707338929176331, 0.8465877175331116, 0.9224416017532349, 0.9982953071594238, 1.0741491317749023, 1.1500029563903809, 1.2258567810058594, 1.3017107248306274, 1.377564549446106, 1.4534183740615845, 1.5292723178863525, 1.605126142501831, 1.6809799671173096, 1.756833791732788, 1.8326876163482666, 1.9085415601730347, 1.9843953847885132, 2.0602493286132812, 2.1361031532287598, 2.2119569778442383, 2.287810802459717, 2.3636646270751953, 2.439518451690674, 2.5153722763061523, 2.591226100921631, 2.6670799255371094, 2.742933988571167, 2.8187875747680664, 2.894641399383545, 2.9704952239990234, 3.046349048614502, 3.1222028732299805, 3.198056697845459, 3.2739105224609375, 3.349764585494995, 3.4256184101104736]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 6.0, 4.0, 5.0, 7.0, 13.0, 7.0, 10.0, 18.0, 19.0, 18.0, 24.0, 34.0, 22.0, 30.0, 35.0, 44.0, 55.0, 40.0, 35.0, 41.0, 40.0, 53.0, 34.0, 41.0, 37.0, 41.0, 44.0, 38.0, 40.0, 22.0, 22.0, 21.0, 16.0, 16.0, 10.0, 11.0, 9.0, 10.0, 5.0, 4.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2290598154067993, -1.1891682147979736, -1.149276614189148, -1.1093850135803223, -1.0694934129714966, -1.029601812362671, -0.9897102117538452, -0.9498186111450195, -0.9099270105361938, -0.8700354099273682, -0.8301438093185425, -0.7902522087097168, -0.7503606081008911, -0.7104690074920654, -0.6705774068832397, -0.6306858062744141, -0.5907941460609436, -0.5509025454521179, -0.5110109448432922, -0.47111934423446655, -0.43122774362564087, -0.3913361430168152, -0.3514445126056671, -0.31155291199684143, -0.27166131138801575, -0.23176971077919006, -0.19187811017036438, -0.1519864946603775, -0.11209489405155182, -0.07220329344272614, -0.03231167793273926, 0.007579922676086426, 0.04747152328491211, 0.08736312389373779, 0.12725472450256348, 0.16714634001255035, 0.20703794062137604, 0.24692954123020172, 0.2868211567401886, 0.3267127573490143, 0.36660435795783997, 0.40649595856666565, 0.44638755917549133, 0.4862791895866394, 0.5261707901954651, 0.5660623908042908, 0.6059539914131165, 0.6458455920219421, 0.6857371926307678, 0.7256287932395935, 0.7655203938484192, 0.8054119944572449, 0.8453035950660706, 0.8851951956748962, 0.9250868558883667, 0.9649784564971924, 1.004870057106018, 1.0447616577148438, 1.0846532583236694, 1.1245448589324951, 1.1644364595413208, 1.2043280601501465, 1.2442196607589722, 1.2841112613677979, 1.3240028619766235]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 10.0, 6.0, 15.0, 15.0, 22.0, 26.0, 44.0, 57.0, 73.0, 109.0, 144.0, 183.0, 282.0, 473.0, 710.0, 1193.0, 2124.0, 4104.0, 8482.0, 21958.0, 80337.0, 723258.0, 2847475.0, 411283.0, 57942.0, 18156.0, 7265.0, 3614.0, 1916.0, 1040.0, 625.0, 422.0, 272.0, 185.0, 132.0, 81.0, 61.0, 44.0, 35.0, 22.0, 24.0, 23.0, 9.0, 10.0, 3.0, 7.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-0.6552734375, -0.6343994140625, -0.613525390625, -0.5926513671875, -0.57177734375, -0.5509033203125, -0.530029296875, -0.5091552734375, -0.48828125, -0.4674072265625, -0.446533203125, -0.4256591796875, -0.40478515625, -0.3839111328125, -0.363037109375, -0.3421630859375, -0.3212890625, -0.3004150390625, -0.279541015625, -0.2586669921875, -0.23779296875, -0.2169189453125, -0.196044921875, -0.1751708984375, -0.154296875, -0.1334228515625, -0.112548828125, -0.0916748046875, -0.07080078125, -0.0499267578125, -0.029052734375, -0.0081787109375, 0.0126953125, 0.0335693359375, 0.054443359375, 0.0753173828125, 0.09619140625, 0.1170654296875, 0.137939453125, 0.1588134765625, 0.1796875, 0.2005615234375, 0.221435546875, 0.2423095703125, 0.26318359375, 0.2840576171875, 0.304931640625, 0.3258056640625, 0.3466796875, 0.3675537109375, 0.388427734375, 0.4093017578125, 0.43017578125, 0.4510498046875, 0.471923828125, 0.4927978515625, 0.513671875, 0.5345458984375, 0.555419921875, 0.5762939453125, 0.59716796875, 0.6180419921875, 0.638916015625, 0.6597900390625, 0.6806640625]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 15.0, 18.0, 9.0, 15.0, 24.0, 33.0, 24.0, 35.0, 46.0, 38.0, 74.0, 46.0, 54.0, 61.0, 60.0, 41.0, 57.0, 56.0, 46.0, 45.0, 37.0, 35.0, 24.0, 18.0, 16.0, 12.0, 9.0, 11.0, 3.0, 4.0, 3.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0], "bins": [-0.431640625, -0.4202384948730469, -0.40883636474609375, -0.3974342346191406, -0.3860321044921875, -0.3746299743652344, -0.36322784423828125, -0.3518257141113281, -0.340423583984375, -0.3290214538574219, -0.31761932373046875, -0.3062171936035156, -0.2948150634765625, -0.2834129333496094, -0.27201080322265625, -0.2606086730957031, -0.24920654296875, -0.23780441284179688, -0.22640228271484375, -0.21500015258789062, -0.2035980224609375, -0.19219589233398438, -0.18079376220703125, -0.16939163208007812, -0.157989501953125, -0.14658737182617188, -0.13518524169921875, -0.12378311157226562, -0.1123809814453125, -0.10097885131835938, -0.08957672119140625, -0.07817459106445312, -0.0667724609375, -0.055370330810546875, -0.04396820068359375, -0.032566070556640625, -0.0211639404296875, -0.009761810302734375, 0.00164031982421875, 0.013042449951171875, 0.024444580078125, 0.035846710205078125, 0.04724884033203125, 0.058650970458984375, 0.0700531005859375, 0.08145523071289062, 0.09285736083984375, 0.10425949096679688, 0.11566162109375, 0.12706375122070312, 0.13846588134765625, 0.14986801147460938, 0.1612701416015625, 0.17267227172851562, 0.18407440185546875, 0.19547653198242188, 0.206878662109375, 0.21828079223632812, 0.22968292236328125, 0.24108505249023438, 0.2524871826171875, 0.2638893127441406, 0.27529144287109375, 0.2866935729980469, 0.298095703125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 4.0, 4.0, 8.0, 9.0, 13.0, 15.0, 23.0, 49.0, 66.0, 118.0, 222.0, 499.0, 1420.0, 5698.0, 43627.0, 2687962.0, 1415247.0, 32294.0, 4622.0, 1316.0, 515.0, 247.0, 118.0, 73.0, 37.0, 24.0, 17.0, 5.0, 6.0, 8.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.857421875, -1.8057403564453125, -1.754058837890625, -1.7023773193359375, -1.65069580078125, -1.5990142822265625, -1.547332763671875, -1.4956512451171875, -1.4439697265625, -1.3922882080078125, -1.340606689453125, -1.2889251708984375, -1.23724365234375, -1.1855621337890625, -1.133880615234375, -1.0821990966796875, -1.030517578125, -0.9788360595703125, -0.927154541015625, -0.8754730224609375, -0.82379150390625, -0.7721099853515625, -0.720428466796875, -0.6687469482421875, -0.6170654296875, -0.5653839111328125, -0.513702392578125, -0.4620208740234375, -0.41033935546875, -0.3586578369140625, -0.306976318359375, -0.2552947998046875, -0.20361328125, -0.1519317626953125, -0.100250244140625, -0.0485687255859375, 0.00311279296875, 0.0547943115234375, 0.106475830078125, 0.1581573486328125, 0.2098388671875, 0.2615203857421875, 0.313201904296875, 0.3648834228515625, 0.41656494140625, 0.4682464599609375, 0.519927978515625, 0.5716094970703125, 0.623291015625, 0.6749725341796875, 0.726654052734375, 0.7783355712890625, 0.83001708984375, 0.8816986083984375, 0.933380126953125, 0.9850616455078125, 1.0367431640625, 1.0884246826171875, 1.140106201171875, 1.1917877197265625, 1.24346923828125, 1.2951507568359375, 1.346832275390625, 1.3985137939453125, 1.4501953125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 11.0, 7.0, 24.0, 27.0, 48.0, 63.0, 85.0, 138.0, 207.0, 376.0, 671.0, 836.0, 642.0, 395.0, 196.0, 122.0, 64.0, 45.0, 37.0, 20.0, 16.0, 9.0, 13.0, 2.0, 5.0, 5.0, 4.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29931640625, -0.2888069152832031, -0.27829742431640625, -0.2677879333496094, -0.2572784423828125, -0.24676895141601562, -0.23625946044921875, -0.22574996948242188, -0.215240478515625, -0.20473098754882812, -0.19422149658203125, -0.18371200561523438, -0.1732025146484375, -0.16269302368164062, -0.15218353271484375, -0.14167404174804688, -0.13116455078125, -0.12065505981445312, -0.11014556884765625, -0.09963607788085938, -0.0891265869140625, -0.07861709594726562, -0.06810760498046875, -0.057598114013671875, -0.047088623046875, -0.036579132080078125, -0.02606964111328125, -0.015560150146484375, -0.0050506591796875, 0.005458831787109375, 0.01596832275390625, 0.026477813720703125, 0.0369873046875, 0.047496795654296875, 0.05800628662109375, 0.06851577758789062, 0.0790252685546875, 0.08953475952148438, 0.10004425048828125, 0.11055374145507812, 0.121063232421875, 0.13157272338867188, 0.14208221435546875, 0.15259170532226562, 0.1631011962890625, 0.17361068725585938, 0.18412017822265625, 0.19462966918945312, 0.20513916015625, 0.21564865112304688, 0.22615814208984375, 0.23666763305664062, 0.2471771240234375, 0.2576866149902344, 0.26819610595703125, 0.2787055969238281, 0.289215087890625, 0.2997245788574219, 0.31023406982421875, 0.3207435607910156, 0.3312530517578125, 0.3417625427246094, 0.35227203369140625, 0.3627815246582031, 0.373291015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 2.0, 5.0, 12.0, 9.0, 22.0, 20.0, 23.0, 28.0, 46.0, 53.0, 62.0, 61.0, 56.0, 83.0, 75.0, 65.0, 64.0, 68.0, 36.0, 44.0, 27.0, 34.0, 24.0, 20.0, 19.0, 12.0, 4.0, 8.0, 7.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.793707013130188, -0.770160436630249, -0.7466138601303101, -0.7230673432350159, -0.6995207667350769, -0.6759741902351379, -0.6524276733398438, -0.6288810968399048, -0.6053345203399658, -0.5817879438400269, -0.5582413673400879, -0.5346948504447937, -0.5111482739448547, -0.48760169744491577, -0.4640551507472992, -0.4405086040496826, -0.41696202754974365, -0.3934154510498047, -0.3698689043521881, -0.34632235765457153, -0.32277578115463257, -0.2992292046546936, -0.275682657957077, -0.25213611125946045, -0.22858953475952148, -0.2050429731607437, -0.18149641156196594, -0.15794984996318817, -0.1344032883644104, -0.11085672676563263, -0.08731016516685486, -0.06376360356807709, -0.04021698236465454, -0.01667042076587677, 0.006876140832901001, 0.030422702431678772, 0.05396926403045654, 0.07751582562923431, 0.10106238722801208, 0.12460894882678986, 0.14815551042556763, 0.1717020720243454, 0.19524863362312317, 0.21879519522190094, 0.2423417568206787, 0.2658883333206177, 0.28943488001823425, 0.31298142671585083, 0.3365280032157898, 0.36007457971572876, 0.38362112641334534, 0.4071676731109619, 0.4307142496109009, 0.45426082611083984, 0.4778073728084564, 0.501353919506073, 0.524900496006012, 0.5484470725059509, 0.5719935894012451, 0.5955401659011841, 0.619086742401123, 0.642633318901062, 0.666179895401001, 0.6897264122962952, 0.7132729887962341]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 13.0, 9.0, 6.0, 14.0, 21.0, 15.0, 13.0, 32.0, 26.0, 36.0, 30.0, 42.0, 37.0, 48.0, 46.0, 34.0, 33.0, 29.0, 39.0, 45.0, 44.0, 28.0, 35.0, 44.0, 40.0, 27.0, 28.0, 27.0, 24.0, 12.0, 14.0, 18.0, 17.0, 14.0, 8.0, 10.0, 8.0, 10.0, 5.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.5025694966316223, -0.48626694083213806, -0.4699643850326538, -0.45366182923316956, -0.4373592734336853, -0.42105668783187866, -0.4047541320323944, -0.38845157623291016, -0.3721490204334259, -0.35584646463394165, -0.3395439088344574, -0.32324135303497314, -0.3069387674331665, -0.29063624143600464, -0.274333655834198, -0.25803110003471375, -0.2417285442352295, -0.22542598843574524, -0.209123432636261, -0.19282086193561554, -0.1765183061361313, -0.16021575033664703, -0.1439131796360016, -0.12761062383651733, -0.11130806803703308, -0.09500551223754883, -0.07870294898748398, -0.06240038946270943, -0.046097829937934875, -0.029795274138450623, -0.013492710888385773, 0.002809852361679077, 0.019112467765808105, 0.03541502729058266, 0.05171758681535721, 0.06802015006542206, 0.08432270586490631, 0.10062526166439056, 0.11692782491445541, 0.13323038816452026, 0.14953294396400452, 0.16583549976348877, 0.18213805556297302, 0.19844062626361847, 0.21474318206310272, 0.23104573786258698, 0.24734830856323242, 0.2636508643627167, 0.2799534201622009, 0.2962559759616852, 0.31255853176116943, 0.3288610875606537, 0.34516364336013794, 0.3614662289619446, 0.37776878476142883, 0.3940713405609131, 0.41037389636039734, 0.4266764521598816, 0.44297900795936584, 0.4592815637588501, 0.47558414936065674, 0.4918866753578186, 0.5081892609596252, 0.5244917869567871, 0.5407943725585938]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 7.0, 16.0, 9.0, 22.0, 23.0, 18.0, 29.0, 44.0, 50.0, 76.0, 78.0, 117.0, 148.0, 211.0, 340.0, 592.0, 1107.0, 2040.0, 4275.0, 9991.0, 35713.0, 271161.0, 597278.0, 94354.0, 17623.0, 6383.0, 2958.0, 1480.0, 861.0, 481.0, 310.0, 199.0, 137.0, 107.0, 82.0, 49.0, 40.0, 37.0, 30.0, 9.0, 12.0, 10.0, 9.0, 5.0, 4.0, 8.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.18017578125, -0.17422103881835938, -0.16826629638671875, -0.16231155395507812, -0.1563568115234375, -0.15040206909179688, -0.14444732666015625, -0.13849258422851562, -0.132537841796875, -0.12658309936523438, -0.12062835693359375, -0.11467361450195312, -0.1087188720703125, -0.10276412963867188, -0.09680938720703125, -0.09085464477539062, -0.08489990234375, -0.07894515991210938, -0.07299041748046875, -0.06703567504882812, -0.0610809326171875, -0.055126190185546875, -0.04917144775390625, -0.043216705322265625, -0.037261962890625, -0.031307220458984375, -0.02535247802734375, -0.019397735595703125, -0.0134429931640625, -0.007488250732421875, -0.00153350830078125, 0.004421234130859375, 0.0103759765625, 0.016330718994140625, 0.02228546142578125, 0.028240203857421875, 0.0341949462890625, 0.040149688720703125, 0.04610443115234375, 0.052059173583984375, 0.058013916015625, 0.06396865844726562, 0.06992340087890625, 0.07587814331054688, 0.0818328857421875, 0.08778762817382812, 0.09374237060546875, 0.09969711303710938, 0.10565185546875, 0.11160659790039062, 0.11756134033203125, 0.12351608276367188, 0.1294708251953125, 0.13542556762695312, 0.14138031005859375, 0.14733505249023438, 0.153289794921875, 0.15924453735351562, 0.16519927978515625, 0.17115402221679688, 0.1771087646484375, 0.18306350708007812, 0.18901824951171875, 0.19497299194335938, 0.200927734375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 9.0, 4.0, 9.0, 7.0, 15.0, 12.0, 18.0, 23.0, 26.0, 24.0, 33.0, 37.0, 33.0, 46.0, 35.0, 52.0, 32.0, 27.0, 37.0, 39.0, 50.0, 50.0, 31.0, 27.0, 44.0, 32.0, 28.0, 26.0, 30.0, 16.0, 24.0, 10.0, 10.0, 16.0, 16.0, 16.0, 12.0, 8.0, 5.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.346435546875, -0.3357048034667969, -0.32497406005859375, -0.3142433166503906, -0.3035125732421875, -0.2927818298339844, -0.28205108642578125, -0.2713203430175781, -0.260589599609375, -0.24985885620117188, -0.23912811279296875, -0.22839736938476562, -0.2176666259765625, -0.20693588256835938, -0.19620513916015625, -0.18547439575195312, -0.17474365234375, -0.16401290893554688, -0.15328216552734375, -0.14255142211914062, -0.1318206787109375, -0.12108993530273438, -0.11035919189453125, -0.09962844848632812, -0.088897705078125, -0.07816696166992188, -0.06743621826171875, -0.056705474853515625, -0.0459747314453125, -0.035243988037109375, -0.02451324462890625, -0.013782501220703125, -0.0030517578125, 0.007678985595703125, 0.01840972900390625, 0.029140472412109375, 0.0398712158203125, 0.050601959228515625, 0.06133270263671875, 0.07206344604492188, 0.082794189453125, 0.09352493286132812, 0.10425567626953125, 0.11498641967773438, 0.1257171630859375, 0.13644790649414062, 0.14717864990234375, 0.15790939331054688, 0.16864013671875, 0.17937088012695312, 0.19010162353515625, 0.20083236694335938, 0.2115631103515625, 0.22229385375976562, 0.23302459716796875, 0.24375534057617188, 0.254486083984375, 0.2652168273925781, 0.27594757080078125, 0.2866783142089844, 0.2974090576171875, 0.3081398010253906, 0.31887054443359375, 0.3296012878417969, 0.34033203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 5.0, 7.0, 13.0, 12.0, 20.0, 31.0, 29.0, 72.0, 111.0, 155.0, 273.0, 526.0, 1092.0, 2538.0, 7543.0, 32860.0, 302074.0, 608400.0, 72841.0, 12823.0, 3910.0, 1589.0, 682.0, 355.0, 212.0, 112.0, 84.0, 47.0, 37.0, 21.0, 19.0, 8.0, 12.0, 11.0, 8.0, 7.0, 3.0, 6.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1973876953125, -0.19178009033203125, -0.1861724853515625, -0.18056488037109375, -0.174957275390625, -0.16934967041015625, -0.1637420654296875, -0.15813446044921875, -0.15252685546875, -0.14691925048828125, -0.1413116455078125, -0.13570404052734375, -0.130096435546875, -0.12448883056640625, -0.1188812255859375, -0.11327362060546875, -0.107666015625, -0.10205841064453125, -0.0964508056640625, -0.09084320068359375, -0.085235595703125, -0.07962799072265625, -0.0740203857421875, -0.06841278076171875, -0.06280517578125, -0.05719757080078125, -0.0515899658203125, -0.04598236083984375, -0.040374755859375, -0.03476715087890625, -0.0291595458984375, -0.02355194091796875, -0.0179443359375, -0.01233673095703125, -0.0067291259765625, -0.00112152099609375, 0.004486083984375, 0.01009368896484375, 0.0157012939453125, 0.02130889892578125, 0.02691650390625, 0.03252410888671875, 0.0381317138671875, 0.04373931884765625, 0.049346923828125, 0.05495452880859375, 0.0605621337890625, 0.06616973876953125, 0.07177734375, 0.07738494873046875, 0.0829925537109375, 0.08860015869140625, 0.094207763671875, 0.09981536865234375, 0.1054229736328125, 0.11103057861328125, 0.11663818359375, 0.12224578857421875, 0.1278533935546875, 0.13346099853515625, 0.139068603515625, 0.14467620849609375, 0.1502838134765625, 0.15589141845703125, 0.1614990234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 7.0, 8.0, 16.0, 14.0, 16.0, 25.0, 31.0, 19.0, 41.0, 37.0, 32.0, 36.0, 51.0, 41.0, 46.0, 46.0, 50.0, 37.0, 55.0, 43.0, 29.0, 42.0, 39.0, 25.0, 38.0, 28.0, 16.0, 16.0, 21.0, 19.0, 12.0, 13.0, 8.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87890625, -0.8501434326171875, -0.821380615234375, -0.7926177978515625, -0.76385498046875, -0.7350921630859375, -0.706329345703125, -0.6775665283203125, -0.6488037109375, -0.6200408935546875, -0.591278076171875, -0.5625152587890625, -0.53375244140625, -0.5049896240234375, -0.476226806640625, -0.4474639892578125, -0.418701171875, -0.3899383544921875, -0.361175537109375, -0.3324127197265625, -0.30364990234375, -0.2748870849609375, -0.246124267578125, -0.2173614501953125, -0.1885986328125, -0.1598358154296875, -0.131072998046875, -0.1023101806640625, -0.07354736328125, -0.0447845458984375, -0.016021728515625, 0.0127410888671875, 0.04150390625, 0.0702667236328125, 0.099029541015625, 0.1277923583984375, 0.15655517578125, 0.1853179931640625, 0.214080810546875, 0.2428436279296875, 0.2716064453125, 0.3003692626953125, 0.329132080078125, 0.3578948974609375, 0.38665771484375, 0.4154205322265625, 0.444183349609375, 0.4729461669921875, 0.501708984375, 0.5304718017578125, 0.559234619140625, 0.5879974365234375, 0.61676025390625, 0.6455230712890625, 0.674285888671875, 0.7030487060546875, 0.7318115234375, 0.7605743408203125, 0.789337158203125, 0.8180999755859375, 0.84686279296875, 0.8756256103515625, 0.904388427734375, 0.9331512451171875, 0.9619140625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 6.0, 12.0, 17.0, 18.0, 21.0, 32.0, 48.0, 64.0, 131.0, 135.0, 231.0, 397.0, 561.0, 975.0, 1697.0, 3064.0, 6274.0, 14968.0, 55552.0, 547880.0, 352632.0, 39258.0, 12368.0, 5457.0, 2729.0, 1543.0, 894.0, 570.0, 341.0, 203.0, 136.0, 89.0, 58.0, 55.0, 32.0, 31.0, 19.0, 16.0, 6.0, 6.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08355712890625, -0.08093738555908203, -0.07831764221191406, -0.0756978988647461, -0.07307815551757812, -0.07045841217041016, -0.06783866882324219, -0.06521892547607422, -0.06259918212890625, -0.05997943878173828, -0.05735969543457031, -0.054739952087402344, -0.052120208740234375, -0.049500465393066406, -0.04688072204589844, -0.04426097869873047, -0.0416412353515625, -0.03902149200439453, -0.03640174865722656, -0.033782005310058594, -0.031162261962890625, -0.028542518615722656, -0.025922775268554688, -0.02330303192138672, -0.02068328857421875, -0.01806354522705078, -0.015443801879882812, -0.012824058532714844, -0.010204315185546875, -0.007584571838378906, -0.0049648284912109375, -0.0023450851440429688, 0.000274658203125, 0.0028944015502929688, 0.0055141448974609375, 0.008133888244628906, 0.010753631591796875, 0.013373374938964844, 0.015993118286132812, 0.01861286163330078, 0.02123260498046875, 0.02385234832763672, 0.026472091674804688, 0.029091835021972656, 0.031711578369140625, 0.034331321716308594, 0.03695106506347656, 0.03957080841064453, 0.0421905517578125, 0.04481029510498047, 0.04743003845214844, 0.050049781799316406, 0.052669525146484375, 0.055289268493652344, 0.05790901184082031, 0.06052875518798828, 0.06314849853515625, 0.06576824188232422, 0.06838798522949219, 0.07100772857666016, 0.07362747192382812, 0.0762472152709961, 0.07886695861816406, 0.08148670196533203, 0.0841064453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 6.0, 5.0, 19.0, 31.0, 57.0, 114.0, 208.0, 212.0, 155.0, 72.0, 35.0, 26.0, 5.0, 13.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.389617919921875e-05, -6.177462637424469e-05, -5.965307354927063e-05, -5.753152072429657e-05, -5.540996789932251e-05, -5.328841507434845e-05, -5.116686224937439e-05, -4.904530942440033e-05, -4.692375659942627e-05, -4.480220377445221e-05, -4.268065094947815e-05, -4.055909812450409e-05, -3.843754529953003e-05, -3.631599247455597e-05, -3.419443964958191e-05, -3.207288682460785e-05, -2.995133399963379e-05, -2.782978117465973e-05, -2.570822834968567e-05, -2.358667552471161e-05, -2.146512269973755e-05, -1.934356987476349e-05, -1.722201704978943e-05, -1.5100464224815369e-05, -1.2978911399841309e-05, -1.0857358574867249e-05, -8.735805749893188e-06, -6.614252924919128e-06, -4.492700099945068e-06, -2.3711472749710083e-06, -2.4959444999694824e-07, 1.8719583749771118e-06, 3.993511199951172e-06, 6.115064024925232e-06, 8.236616849899292e-06, 1.0358169674873352e-05, 1.2479722499847412e-05, 1.4601275324821472e-05, 1.6722828149795532e-05, 1.8844380974769592e-05, 2.0965933799743652e-05, 2.3087486624717712e-05, 2.5209039449691772e-05, 2.7330592274665833e-05, 2.9452145099639893e-05, 3.157369792461395e-05, 3.369525074958801e-05, 3.581680357456207e-05, 3.793835639953613e-05, 4.005990922451019e-05, 4.218146204948425e-05, 4.430301487445831e-05, 4.642456769943237e-05, 4.854612052440643e-05, 5.066767334938049e-05, 5.278922617435455e-05, 5.491077899932861e-05, 5.703233182430267e-05, 5.9153884649276733e-05, 6.12754374742508e-05, 6.339699029922485e-05, 6.551854312419891e-05, 6.764009594917297e-05, 6.976164877414703e-05, 7.18832015991211e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 4.0, 6.0, 14.0, 9.0, 15.0, 40.0, 50.0, 46.0, 83.0, 106.0, 171.0, 216.0, 310.0, 412.0, 616.0, 1010.0, 1577.0, 2652.0, 4974.0, 10315.0, 27673.0, 115658.0, 534895.0, 267404.0, 49230.0, 15474.0, 6627.0, 3510.0, 1867.0, 1166.0, 763.0, 526.0, 354.0, 252.0, 159.0, 119.0, 83.0, 42.0, 33.0, 25.0, 22.0, 12.0, 10.0, 8.0, 5.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07073974609375, -0.0683603286743164, -0.06598091125488281, -0.06360149383544922, -0.061222076416015625, -0.05884265899658203, -0.05646324157714844, -0.054083824157714844, -0.05170440673828125, -0.049324989318847656, -0.04694557189941406, -0.04456615447998047, -0.042186737060546875, -0.03980731964111328, -0.03742790222167969, -0.035048484802246094, -0.0326690673828125, -0.030289649963378906, -0.027910232543945312, -0.02553081512451172, -0.023151397705078125, -0.02077198028564453, -0.018392562866210938, -0.016013145446777344, -0.01363372802734375, -0.011254310607910156, -0.008874893188476562, -0.006495475769042969, -0.004116058349609375, -0.0017366409301757812, 0.0006427764892578125, 0.0030221939086914062, 0.005401611328125, 0.007781028747558594, 0.010160446166992188, 0.012539863586425781, 0.014919281005859375, 0.01729869842529297, 0.019678115844726562, 0.022057533264160156, 0.02443695068359375, 0.026816368103027344, 0.029195785522460938, 0.03157520294189453, 0.033954620361328125, 0.03633403778076172, 0.03871345520019531, 0.041092872619628906, 0.0434722900390625, 0.045851707458496094, 0.04823112487792969, 0.05061054229736328, 0.052989959716796875, 0.05536937713623047, 0.05774879455566406, 0.060128211975097656, 0.06250762939453125, 0.06488704681396484, 0.06726646423339844, 0.06964588165283203, 0.07202529907226562, 0.07440471649169922, 0.07678413391113281, 0.0791635513305664, 0.08154296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 10.0, 26.0, 33.0, 71.0, 76.0, 112.0, 176.0, 161.0, 107.0, 89.0, 52.0, 22.0, 19.0, 12.0, 3.0, 6.0, 1.0, 5.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.040985107421875, -0.03990435600280762, -0.038823604583740234, -0.03774285316467285, -0.03666210174560547, -0.035581350326538086, -0.0345005989074707, -0.03341984748840332, -0.03233909606933594, -0.031258344650268555, -0.030177593231201172, -0.02909684181213379, -0.028016090393066406, -0.026935338973999023, -0.02585458755493164, -0.024773836135864258, -0.023693084716796875, -0.022612333297729492, -0.02153158187866211, -0.020450830459594727, -0.019370079040527344, -0.01828932762145996, -0.017208576202392578, -0.016127824783325195, -0.015047073364257812, -0.01396632194519043, -0.012885570526123047, -0.011804819107055664, -0.010724067687988281, -0.009643316268920898, -0.008562564849853516, -0.007481813430786133, -0.00640106201171875, -0.005320310592651367, -0.004239559173583984, -0.0031588077545166016, -0.0020780563354492188, -0.000997304916381836, 8.344650268554688e-05, 0.0011641979217529297, 0.0022449493408203125, 0.0033257007598876953, 0.004406452178955078, 0.005487203598022461, 0.006567955017089844, 0.0076487064361572266, 0.00872945785522461, 0.009810209274291992, 0.010890960693359375, 0.011971712112426758, 0.01305246353149414, 0.014133214950561523, 0.015213966369628906, 0.01629471778869629, 0.017375469207763672, 0.018456220626831055, 0.019536972045898438, 0.02061772346496582, 0.021698474884033203, 0.022779226303100586, 0.02385997772216797, 0.02494072914123535, 0.026021480560302734, 0.027102231979370117, 0.0281829833984375]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 6.0, 5.0, 8.0, 6.0, 9.0, 12.0, 16.0, 18.0, 30.0, 51.0, 45.0, 42.0, 56.0, 60.0, 67.0, 69.0, 81.0, 62.0, 52.0, 49.0, 46.0, 35.0, 29.0, 29.0, 17.0, 29.0, 13.0, 12.0, 15.0, 8.0, 9.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4364004135131836, -0.4223867654800415, -0.4083731174468994, -0.3943594694137573, -0.38034582138061523, -0.36633217334747314, -0.35231852531433105, -0.33830487728118896, -0.3242912292480469, -0.3102775812149048, -0.2962639331817627, -0.2822502851486206, -0.2682366371154785, -0.2542229890823364, -0.24020932614803314, -0.22619567811489105, -0.21218201518058777, -0.19816836714744568, -0.1841547191143036, -0.1701410710811615, -0.1561274230480194, -0.14211377501487732, -0.12810011208057404, -0.11408646404743195, -0.10007281601428986, -0.08605916798114777, -0.07204551994800568, -0.05803186446428299, -0.0440182164311409, -0.03000456839799881, -0.015990912914276123, -0.001977264881134033, 0.012036412954330444, 0.026050062850117683, 0.04006371274590492, 0.05407736450433731, 0.0680910125374794, 0.08210466057062149, 0.09611831605434418, 0.11013196408748627, 0.12414561212062836, 0.13815926015377045, 0.15217290818691254, 0.16618657112121582, 0.1802002191543579, 0.1942138671875, 0.2082275152206421, 0.22224116325378418, 0.23625481128692627, 0.25026845932006836, 0.26428210735321045, 0.27829575538635254, 0.29230940341949463, 0.3063230514526367, 0.3203366994857788, 0.3343503475189209, 0.348363995552063, 0.3623776435852051, 0.37639129161834717, 0.39040493965148926, 0.40441858768463135, 0.41843223571777344, 0.4324458837509155, 0.4464595317840576, 0.4604732096195221]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 6.0, 2.0, 1.0, 3.0, 12.0, 12.0, 8.0, 10.0, 19.0, 25.0, 19.0, 25.0, 21.0, 34.0, 45.0, 31.0, 42.0, 42.0, 42.0, 42.0, 36.0, 33.0, 37.0, 42.0, 44.0, 41.0, 42.0, 34.0, 25.0, 38.0, 28.0, 28.0, 15.0, 16.0, 16.0, 17.0, 16.0, 9.0, 7.0, 13.0, 6.0, 10.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3180714547634125, -0.30745241045951843, -0.2968333661556244, -0.28621432185173035, -0.2755952775478363, -0.26497626304626465, -0.2543572187423706, -0.24373817443847656, -0.23311913013458252, -0.22250008583068848, -0.21188104152679443, -0.2012619972229004, -0.19064296782016754, -0.1800239235162735, -0.16940487921237946, -0.1587858498096466, -0.14816679060459137, -0.13754774630069733, -0.12692870199680328, -0.11630966514348984, -0.10569062829017639, -0.09507158398628235, -0.0844525396823883, -0.07383350282907486, -0.06321445852518082, -0.05259541794657707, -0.04197637736797333, -0.031357333064079285, -0.02073829248547554, -0.010119251906871796, 0.0004997923970222473, 0.011118829250335693, 0.021737873554229736, 0.03235691413283348, 0.042975954711437225, 0.05359499901533127, 0.06421403586864471, 0.07483308017253876, 0.0854521244764328, 0.09607116132974625, 0.10669020563364029, 0.11730924993753433, 0.12792828679084778, 0.13854733109474182, 0.14916637539863586, 0.1597854197025299, 0.17040446400642395, 0.1810234934091568, 0.19164253771305084, 0.20226158201694489, 0.21288062632083893, 0.22349965572357178, 0.23411870002746582, 0.24473774433135986, 0.2553567886352539, 0.26597583293914795, 0.276594877243042, 0.28721392154693604, 0.2978329658508301, 0.3084520101547241, 0.31907105445861816, 0.3296900987625122, 0.34030914306640625, 0.3509281575679779, 0.36154720187187195]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 10.0, 11.0, 25.0, 20.0, 35.0, 48.0, 66.0, 109.0, 177.0, 261.0, 462.0, 744.0, 1265.0, 2453.0, 4540.0, 9227.0, 20377.0, 49400.0, 171457.0, 495105.0, 196204.0, 54076.0, 21599.0, 9909.0, 4960.0, 2508.0, 1429.0, 734.0, 505.0, 283.0, 196.0, 127.0, 69.0, 47.0, 35.0, 29.0, 17.0, 11.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62060546875, -0.6021041870117188, -0.5836029052734375, -0.5651016235351562, -0.546600341796875, -0.5280990600585938, -0.5095977783203125, -0.49109649658203125, -0.47259521484375, -0.45409393310546875, -0.4355926513671875, -0.41709136962890625, -0.398590087890625, -0.38008880615234375, -0.3615875244140625, -0.34308624267578125, -0.3245849609375, -0.30608367919921875, -0.2875823974609375, -0.26908111572265625, -0.250579833984375, -0.23207855224609375, -0.2135772705078125, -0.19507598876953125, -0.17657470703125, -0.15807342529296875, -0.1395721435546875, -0.12107086181640625, -0.102569580078125, -0.08406829833984375, -0.0655670166015625, -0.04706573486328125, -0.028564453125, -0.01006317138671875, 0.0084381103515625, 0.02693939208984375, 0.045440673828125, 0.06394195556640625, 0.0824432373046875, 0.10094451904296875, 0.11944580078125, 0.13794708251953125, 0.1564483642578125, 0.17494964599609375, 0.193450927734375, 0.21195220947265625, 0.2304534912109375, 0.24895477294921875, 0.2674560546875, 0.28595733642578125, 0.3044586181640625, 0.32295989990234375, 0.341461181640625, 0.35996246337890625, 0.3784637451171875, 0.39696502685546875, 0.41546630859375, 0.43396759033203125, 0.4524688720703125, 0.47097015380859375, 0.489471435546875, 0.5079727172851562, 0.5264739990234375, 0.5449752807617188, 0.5634765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 10.0, 14.0, 11.0, 14.0, 17.0, 17.0, 22.0, 29.0, 39.0, 28.0, 41.0, 50.0, 44.0, 54.0, 33.0, 45.0, 46.0, 53.0, 30.0, 44.0, 43.0, 38.0, 38.0, 33.0, 32.0, 25.0, 22.0, 17.0, 15.0, 20.0, 10.0, 10.0, 7.0, 6.0, 11.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.5205078125, -0.5, -0.4794921875, -0.458984375, -0.4384765625, -0.41796875, -0.3974609375, -0.376953125, -0.3564453125, -0.3359375, -0.3154296875, -0.294921875, -0.2744140625, -0.25390625, -0.2333984375, -0.212890625, -0.1923828125, -0.171875, -0.1513671875, -0.130859375, -0.1103515625, -0.08984375, -0.0693359375, -0.048828125, -0.0283203125, -0.0078125, 0.0126953125, 0.033203125, 0.0537109375, 0.07421875, 0.0947265625, 0.115234375, 0.1357421875, 0.15625, 0.1767578125, 0.197265625, 0.2177734375, 0.23828125, 0.2587890625, 0.279296875, 0.2998046875, 0.3203125, 0.3408203125, 0.361328125, 0.3818359375, 0.40234375, 0.4228515625, 0.443359375, 0.4638671875, 0.484375, 0.5048828125, 0.525390625, 0.5458984375, 0.56640625, 0.5869140625, 0.607421875, 0.6279296875, 0.6484375, 0.6689453125, 0.689453125, 0.7099609375, 0.73046875, 0.7509765625, 0.771484375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 17.0, 15.0, 25.0, 32.0, 41.0, 58.0, 78.0, 148.0, 148.0, 263.0, 390.0, 658.0, 977.0, 1738.0, 3066.0, 6078.0, 11958.0, 25494.0, 62393.0, 206549.0, 459674.0, 169134.0, 53908.0, 22518.0, 10761.0, 5313.0, 2870.0, 1574.0, 926.0, 563.0, 353.0, 256.0, 160.0, 102.0, 89.0, 61.0, 44.0, 42.0, 25.0, 18.0, 9.0, 10.0, 8.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.56494140625, -0.5498466491699219, -0.5347518920898438, -0.5196571350097656, -0.5045623779296875, -0.4894676208496094, -0.47437286376953125, -0.4592781066894531, -0.444183349609375, -0.4290885925292969, -0.41399383544921875, -0.3988990783691406, -0.3838043212890625, -0.3687095642089844, -0.35361480712890625, -0.3385200500488281, -0.32342529296875, -0.3083305358886719, -0.29323577880859375, -0.2781410217285156, -0.2630462646484375, -0.24795150756835938, -0.23285675048828125, -0.21776199340820312, -0.202667236328125, -0.18757247924804688, -0.17247772216796875, -0.15738296508789062, -0.1422882080078125, -0.12719345092773438, -0.11209869384765625, -0.09700393676757812, -0.0819091796875, -0.06681442260742188, -0.05171966552734375, -0.036624908447265625, -0.0215301513671875, -0.006435394287109375, 0.00865936279296875, 0.023754119873046875, 0.038848876953125, 0.053943634033203125, 0.06903839111328125, 0.08413314819335938, 0.0992279052734375, 0.11432266235351562, 0.12941741943359375, 0.14451217651367188, 0.15960693359375, 0.17470169067382812, 0.18979644775390625, 0.20489120483398438, 0.2199859619140625, 0.23508071899414062, 0.25017547607421875, 0.2652702331542969, 0.280364990234375, 0.2954597473144531, 0.31055450439453125, 0.3256492614746094, 0.3407440185546875, 0.3558387756347656, 0.37093353271484375, 0.3860282897949219, 0.401123046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 11.0, 9.0, 8.0, 12.0, 7.0, 16.0, 16.0, 14.0, 22.0, 20.0, 20.0, 25.0, 33.0, 36.0, 37.0, 32.0, 51.0, 49.0, 43.0, 46.0, 47.0, 40.0, 57.0, 44.0, 27.0, 32.0, 31.0, 29.0, 31.0, 23.0, 18.0, 20.0, 21.0, 14.0, 13.0, 5.0, 14.0, 1.0, 8.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7421875, -0.7194061279296875, -0.696624755859375, -0.6738433837890625, -0.65106201171875, -0.6282806396484375, -0.605499267578125, -0.5827178955078125, -0.5599365234375, -0.5371551513671875, -0.514373779296875, -0.4915924072265625, -0.46881103515625, -0.4460296630859375, -0.423248291015625, -0.4004669189453125, -0.377685546875, -0.3549041748046875, -0.332122802734375, -0.3093414306640625, -0.28656005859375, -0.2637786865234375, -0.240997314453125, -0.2182159423828125, -0.1954345703125, -0.1726531982421875, -0.149871826171875, -0.1270904541015625, -0.10430908203125, -0.0815277099609375, -0.058746337890625, -0.0359649658203125, -0.01318359375, 0.0095977783203125, 0.032379150390625, 0.0551605224609375, 0.07794189453125, 0.1007232666015625, 0.123504638671875, 0.1462860107421875, 0.1690673828125, 0.1918487548828125, 0.214630126953125, 0.2374114990234375, 0.26019287109375, 0.2829742431640625, 0.305755615234375, 0.3285369873046875, 0.351318359375, 0.3740997314453125, 0.396881103515625, 0.4196624755859375, 0.44244384765625, 0.4652252197265625, 0.488006591796875, 0.5107879638671875, 0.5335693359375, 0.5563507080078125, 0.579132080078125, 0.6019134521484375, 0.62469482421875, 0.6474761962890625, 0.670257568359375, 0.6930389404296875, 0.7158203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 6.0, 5.0, 11.0, 12.0, 13.0, 18.0, 23.0, 47.0, 50.0, 72.0, 102.0, 157.0, 239.0, 309.0, 461.0, 677.0, 949.0, 1396.0, 2064.0, 3209.0, 5104.0, 8036.0, 12909.0, 21166.0, 35881.0, 59621.0, 99236.0, 152250.0, 246128.0, 150434.0, 98114.0, 58892.0, 34750.0, 20994.0, 12792.0, 7710.0, 4933.0, 3132.0, 2198.0, 1403.0, 933.0, 651.0, 418.0, 307.0, 217.0, 154.0, 97.0, 74.0, 51.0, 57.0, 31.0, 21.0, 18.0, 9.0, 13.0, 4.0, 4.0, 2.0, 3.0, 2.0], "bins": [-0.06610107421875, -0.06406593322753906, -0.062030792236328125, -0.05999565124511719, -0.05796051025390625, -0.05592536926269531, -0.053890228271484375, -0.05185508728027344, -0.0498199462890625, -0.04778480529785156, -0.045749664306640625, -0.04371452331542969, -0.04167938232421875, -0.03964424133300781, -0.037609100341796875, -0.03557395935058594, -0.033538818359375, -0.03150367736816406, -0.029468536376953125, -0.027433395385742188, -0.02539825439453125, -0.023363113403320312, -0.021327972412109375, -0.019292831420898438, -0.0172576904296875, -0.015222549438476562, -0.013187408447265625, -0.011152267456054688, -0.00911712646484375, -0.0070819854736328125, -0.005046844482421875, -0.0030117034912109375, -0.0009765625, 0.0010585784912109375, 0.003093719482421875, 0.0051288604736328125, 0.00716400146484375, 0.009199142456054688, 0.011234283447265625, 0.013269424438476562, 0.0153045654296875, 0.017339706420898438, 0.019374847412109375, 0.021409988403320312, 0.02344512939453125, 0.025480270385742188, 0.027515411376953125, 0.029550552368164062, 0.031585693359375, 0.03362083435058594, 0.035655975341796875, 0.03769111633300781, 0.03972625732421875, 0.04176139831542969, 0.043796539306640625, 0.04583168029785156, 0.0478668212890625, 0.04990196228027344, 0.051937103271484375, 0.05397224426269531, 0.05600738525390625, 0.05804252624511719, 0.060077667236328125, 0.06211280822753906, 0.06414794921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 14.0, 9.0, 20.0, 18.0, 31.0, 20.0, 36.0, 40.0, 43.0, 55.0, 43.0, 53.0, 90.0, 88.0, 66.0, 57.0, 49.0, 35.0, 36.0, 32.0, 33.0, 28.0, 18.0, 14.0, 15.0, 8.0, 9.0, 9.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0], "bins": [-3.2007694244384766e-05, -3.1186267733573914e-05, -3.036484122276306e-05, -2.954341471195221e-05, -2.8721988201141357e-05, -2.7900561690330505e-05, -2.7079135179519653e-05, -2.62577086687088e-05, -2.543628215789795e-05, -2.4614855647087097e-05, -2.3793429136276245e-05, -2.2972002625465393e-05, -2.215057611465454e-05, -2.132914960384369e-05, -2.0507723093032837e-05, -1.9686296582221985e-05, -1.8864870071411133e-05, -1.804344356060028e-05, -1.722201704978943e-05, -1.6400590538978577e-05, -1.5579164028167725e-05, -1.4757737517356873e-05, -1.393631100654602e-05, -1.3114884495735168e-05, -1.2293457984924316e-05, -1.1472031474113464e-05, -1.0650604963302612e-05, -9.82917845249176e-06, -9.007751941680908e-06, -8.186325430870056e-06, -7.364898920059204e-06, -6.543472409248352e-06, -5.7220458984375e-06, -4.900619387626648e-06, -4.079192876815796e-06, -3.257766366004944e-06, -2.436339855194092e-06, -1.6149133443832397e-06, -7.934868335723877e-07, 2.7939677238464355e-08, 8.493661880493164e-07, 1.6707926988601685e-06, 2.4922192096710205e-06, 3.3136457204818726e-06, 4.135072231292725e-06, 4.956498742103577e-06, 5.777925252914429e-06, 6.599351763725281e-06, 7.420778274536133e-06, 8.242204785346985e-06, 9.063631296157837e-06, 9.885057806968689e-06, 1.0706484317779541e-05, 1.1527910828590393e-05, 1.2349337339401245e-05, 1.3170763850212097e-05, 1.399219036102295e-05, 1.4813616871833801e-05, 1.5635043382644653e-05, 1.6456469893455505e-05, 1.7277896404266357e-05, 1.809932291507721e-05, 1.892074942588806e-05, 1.9742175936698914e-05, 2.0563602447509766e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 9.0, 6.0, 18.0, 13.0, 30.0, 32.0, 40.0, 57.0, 71.0, 126.0, 204.0, 365.0, 564.0, 1035.0, 1839.0, 3378.0, 6553.0, 13733.0, 31298.0, 78085.0, 205525.0, 402071.0, 181324.0, 69078.0, 27565.0, 12500.0, 5970.0, 3051.0, 1681.0, 910.0, 535.0, 284.0, 191.0, 144.0, 62.0, 57.0, 40.0, 31.0, 27.0, 8.0, 4.0, 9.0, 7.0, 11.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1416015625, -0.1372356414794922, -0.13286972045898438, -0.12850379943847656, -0.12413787841796875, -0.11977195739746094, -0.11540603637695312, -0.11104011535644531, -0.1066741943359375, -0.10230827331542969, -0.09794235229492188, -0.09357643127441406, -0.08921051025390625, -0.08484458923339844, -0.08047866821289062, -0.07611274719238281, -0.071746826171875, -0.06738090515136719, -0.06301498413085938, -0.05864906311035156, -0.05428314208984375, -0.04991722106933594, -0.045551300048828125, -0.04118537902832031, -0.0368194580078125, -0.03245353698730469, -0.028087615966796875, -0.023721694946289062, -0.01935577392578125, -0.014989852905273438, -0.010623931884765625, -0.0062580108642578125, -0.00189208984375, 0.0024738311767578125, 0.006839752197265625, 0.011205673217773438, 0.01557159423828125, 0.019937515258789062, 0.024303436279296875, 0.028669357299804688, 0.0330352783203125, 0.03740119934082031, 0.041767120361328125, 0.04613304138183594, 0.05049896240234375, 0.05486488342285156, 0.059230804443359375, 0.06359672546386719, 0.067962646484375, 0.07232856750488281, 0.07669448852539062, 0.08106040954589844, 0.08542633056640625, 0.08979225158691406, 0.09415817260742188, 0.09852409362792969, 0.1028900146484375, 0.10725593566894531, 0.11162185668945312, 0.11598777770996094, 0.12035369873046875, 0.12471961975097656, 0.12908554077148438, 0.1334514617919922, 0.1378173828125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 4.0, 14.0, 14.0, 12.0, 14.0, 21.0, 38.0, 31.0, 53.0, 40.0, 67.0, 74.0, 90.0, 132.0, 71.0, 72.0, 48.0, 37.0, 45.0, 23.0, 18.0, 24.0, 19.0, 5.0, 6.0, 5.0, 2.0, 6.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.111572265625, -0.10848617553710938, -0.10540008544921875, -0.10231399536132812, -0.0992279052734375, -0.09614181518554688, -0.09305572509765625, -0.08996963500976562, -0.086883544921875, -0.08379745483398438, -0.08071136474609375, -0.07762527465820312, -0.0745391845703125, -0.07145309448242188, -0.06836700439453125, -0.06528091430664062, -0.06219482421875, -0.059108734130859375, -0.05602264404296875, -0.052936553955078125, -0.0498504638671875, -0.046764373779296875, -0.04367828369140625, -0.040592193603515625, -0.037506103515625, -0.034420013427734375, -0.03133392333984375, -0.028247833251953125, -0.0251617431640625, -0.022075653076171875, -0.01898956298828125, -0.015903472900390625, -0.0128173828125, -0.009731292724609375, -0.00664520263671875, -0.003559112548828125, -0.0004730224609375, 0.002613067626953125, 0.00569915771484375, 0.008785247802734375, 0.011871337890625, 0.014957427978515625, 0.01804351806640625, 0.021129608154296875, 0.0242156982421875, 0.027301788330078125, 0.03038787841796875, 0.033473968505859375, 0.03656005859375, 0.039646148681640625, 0.04273223876953125, 0.045818328857421875, 0.0489044189453125, 0.051990509033203125, 0.05507659912109375, 0.058162689208984375, 0.061248779296875, 0.06433486938476562, 0.06742095947265625, 0.07050704956054688, 0.0735931396484375, 0.07667922973632812, 0.07976531982421875, 0.08285140991210938, 0.0859375]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 11.0, 18.0, 30.0, 39.0, 47.0, 88.0, 112.0, 129.0, 138.0, 132.0, 85.0, 58.0, 40.0, 25.0, 18.0, 6.0, 4.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7422631978988647, -1.6838864088058472, -1.6255096197128296, -1.567132830619812, -1.5087560415267944, -1.4503792524337769, -1.3920024633407593, -1.3336256742477417, -1.2752488851547241, -1.2168720960617065, -1.158495306968689, -1.1001185178756714, -1.0417417287826538, -0.9833649396896362, -0.9249881505966187, -0.8666113615036011, -0.8082345128059387, -0.7498577237129211, -0.6914809346199036, -0.633104145526886, -0.5747273564338684, -0.516350507736206, -0.45797374844551086, -0.3995969593524933, -0.3412201702594757, -0.28284338116645813, -0.22446659207344055, -0.16608978807926178, -0.1077129989862442, -0.04933619499206543, 0.009040594100952148, 0.06741738319396973, 0.1257941722869873, 0.18417096138000488, 0.24254775047302246, 0.30092453956604004, 0.3593013286590576, 0.4176781475543976, 0.47605493664741516, 0.5344316959381104, 0.5928084850311279, 0.6511852741241455, 0.7095620632171631, 0.7679388523101807, 0.8263156414031982, 0.8846924304962158, 0.9430692195892334, 1.001446008682251, 1.0598227977752686, 1.1181995868682861, 1.1765763759613037, 1.2349531650543213, 1.2933299541473389, 1.3517067432403564, 1.410083532333374, 1.4684603214263916, 1.5268372297286987, 1.5852140188217163, 1.6435908079147339, 1.7019675970077515, 1.760344386100769, 1.8187211751937866, 1.8770979642868042, 1.9354747533798218, 1.9938515424728394]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 7.0, 6.0, 4.0, 7.0, 9.0, 9.0, 12.0, 15.0, 10.0, 17.0, 23.0, 25.0, 27.0, 22.0, 34.0, 30.0, 37.0, 26.0, 47.0, 37.0, 38.0, 57.0, 37.0, 42.0, 58.0, 41.0, 48.0, 42.0, 33.0, 21.0, 23.0, 25.0, 22.0, 21.0, 17.0, 14.0, 16.0, 9.0, 7.0, 9.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0], "bins": [-1.433144211769104, -1.3912572860717773, -1.3493704795837402, -1.3074835538864136, -1.2655967473983765, -1.2237098217010498, -1.1818230152130127, -1.139936089515686, -1.098049283027649, -1.0561623573303223, -1.0142755508422852, -0.9723886847496033, -0.9305018186569214, -0.8886149525642395, -0.8467280864715576, -0.804841160774231, -0.7629542946815491, -0.7210674285888672, -0.6791805624961853, -0.6372936964035034, -0.5954068303108215, -0.5535199642181396, -0.511633038520813, -0.4697462022304535, -0.4278593361377716, -0.3859724700450897, -0.34408560395240784, -0.30219870805740356, -0.2603118419647217, -0.218424990773201, -0.1765381097793579, -0.13465124368667603, -0.09276437759399414, -0.05087750777602196, -0.008990637958049774, 0.03289623558521271, 0.07478310167789459, 0.11666996777057648, 0.15855684876441956, 0.20044371485710144, 0.24233058094978333, 0.2842174470424652, 0.3261043131351471, 0.36799120903015137, 0.40987807512283325, 0.45176494121551514, 0.493651807308197, 0.5355386734008789, 0.5774255394935608, 0.6193124055862427, 0.6611992716789246, 0.7030861377716064, 0.7449730038642883, 0.7868598699569702, 0.8287467956542969, 0.870633602142334, 0.9125205278396606, 0.9544073939323425, 0.9962942600250244, 1.038181185722351, 1.0800679922103882, 1.1219549179077148, 1.163841724395752, 1.2057286500930786, 1.2476154565811157]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 4.0, 11.0, 10.0, 6.0, 10.0, 22.0, 21.0, 32.0, 27.0, 34.0, 72.0, 80.0, 91.0, 137.0, 150.0, 212.0, 300.0, 430.0, 568.0, 956.0, 1556.0, 2443.0, 5537.0, 1030562.0, 2488.0, 1575.0, 912.0, 646.0, 448.0, 310.0, 232.0, 168.0, 130.0, 84.0, 81.0, 72.0, 24.0, 40.0, 27.0, 26.0, 15.0, 13.0, 12.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6053814888000488, -1.5552562475204468, -1.5051310062408447, -1.4550058841705322, -1.4048806428909302, -1.3547554016113281, -1.304630160331726, -1.254504919052124, -1.204379677772522, -1.15425443649292, -1.1041291952133179, -1.0540039539337158, -1.0038788318634033, -0.9537535905838013, -0.9036283493041992, -0.8535031080245972, -0.8033779263496399, -0.7532526850700378, -0.7031275033950806, -0.6530022621154785, -0.6028770208358765, -0.5527517795562744, -0.5026265978813171, -0.4525013566017151, -0.4023761451244354, -0.35225093364715576, -0.3021256923675537, -0.25200048089027405, -0.2018752545118332, -0.15175002813339233, -0.10162481665611267, -0.05149957537651062, -0.001374363899230957, 0.0487508587539196, 0.09887608140707016, 0.14900130033493042, 0.19912652671337128, 0.24925175309181213, 0.2993769645690918, 0.34950220584869385, 0.3996274173259735, 0.4497526288032532, 0.4998778700828552, 0.5500030517578125, 0.6001282930374146, 0.6502535343170166, 0.7003787755966187, 0.7505040168762207, 0.800629198551178, 0.85075443983078, 0.9008796215057373, 0.9510048627853394, 1.0011301040649414, 1.0512553453445435, 1.1013805866241455, 1.151505708694458, 1.20163094997406, 1.251756191253662, 1.3018814325332642, 1.3520066738128662, 1.4021317958831787, 1.4522570371627808, 1.5023822784423828, 1.5525075197219849, 1.602632761001587]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 11.0, 10.0, 12.0, 46.0, 89.0, 222.0, 887.0, 3409.0, 16280.0, 51430152.0, 15165.0, 3631.0, 920.0, 274.0, 113.0, 52.0, 29.0, 8.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.324853420257568, -7.037331581115723, -6.749809741973877, -6.462287902832031, -6.1747660636901855, -5.88724422454834, -5.599722862243652, -5.312200546264648, -5.024679183959961, -4.737157344818115, -4.4496355056762695, -4.162113666534424, -3.874591827392578, -3.5870699882507324, -3.299548387527466, -3.01202654838562, -2.7245044708251953, -2.4369826316833496, -2.149460792541504, -1.8619390726089478, -1.574417233467102, -1.2868953943252563, -0.9993736743927002, -0.7118518352508545, -0.4243299961090088, -0.13680818676948547, 0.15071362257003784, 0.43823540210723877, 0.7257572412490845, 1.0132790803909302, 1.3008008003234863, 1.588322639465332, 1.875844955444336, 2.1633667945861816, 2.4508886337280273, 2.738410472869873, 3.0259323120117188, 3.3134541511535645, 3.600975751876831, 3.8884975910186768, 4.176019668579102, 4.463541507720947, 4.751063346862793, 5.038585186004639, 5.326107025146484, 5.61362886428833, 5.901150703430176, 6.188672065734863, 6.476193904876709, 6.763715744018555, 7.0512375831604, 7.338759422302246, 7.626281261444092, 7.9138031005859375, 8.201324462890625, 8.488846778869629, 8.776368141174316, 9.063889503479004, 9.351411819458008, 9.638933181762695, 9.9264554977417, 10.213976860046387, 10.50149917602539, 10.789020538330078, 11.076542854309082]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 2.0, 2.0, 8.0, 3.0, 11.0, 10.0, 13.0, 31.0, 29.0, 45.0, 66.0, 104.0, 118.0, 194.0, 278.0, 442.0, 674.0, 1141.0, 1876.0, 3151.0, 5407.0, 9585.0, 17501.0, 32572.0, 64593.0, 131992.0, 271405.0, 543741.0, 3049914.0, 1323754.0, 416783.0, 208115.0, 101063.0, 49569.0, 25241.0, 13484.0, 7665.0, 4306.0, 2638.0, 1489.0, 883.0, 525.0, 356.0, 236.0, 121.0, 94.0, 66.0, 34.0, 27.0, 20.0, 22.0, 13.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.470703125, -0.4559059143066406, -0.44110870361328125, -0.4263114929199219, -0.4115142822265625, -0.3967170715332031, -0.38191986083984375, -0.3671226501464844, -0.352325439453125, -0.3375282287597656, -0.32273101806640625, -0.3079338073730469, -0.2931365966796875, -0.2783393859863281, -0.26354217529296875, -0.24874496459960938, -0.23394775390625, -0.21915054321289062, -0.20435333251953125, -0.18955612182617188, -0.1747589111328125, -0.15996170043945312, -0.14516448974609375, -0.13036727905273438, -0.115570068359375, -0.10077285766601562, -0.08597564697265625, -0.07117843627929688, -0.0563812255859375, -0.041584014892578125, -0.02678680419921875, -0.011989593505859375, 0.0028076171875, 0.017604827880859375, 0.03240203857421875, 0.047199249267578125, 0.0619964599609375, 0.07679367065429688, 0.09159088134765625, 0.10638809204101562, 0.121185302734375, 0.13598251342773438, 0.15077972412109375, 0.16557693481445312, 0.1803741455078125, 0.19517135620117188, 0.20996856689453125, 0.22476577758789062, 0.23956298828125, 0.2543601989746094, 0.26915740966796875, 0.2839546203613281, 0.2987518310546875, 0.3135490417480469, 0.32834625244140625, 0.3431434631347656, 0.357940673828125, 0.3727378845214844, 0.38753509521484375, 0.4023323059082031, 0.4171295166015625, 0.4319267272949219, 0.44672393798828125, 0.4615211486816406, 0.476318359375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 12.0, 11.0, 9.0, 18.0, 26.0, 17.0, 25.0, 37.0, 23.0, 40.0, 41.0, 49.0, 50.0, 55.0, 269.0, 774.0, 118.0, 53.0, 59.0, 38.0, 41.0, 30.0, 42.0, 23.0, 25.0, 22.0, 15.0, 18.0, 18.0, 12.0, 12.0, 9.0, 3.0, 6.0, 4.0, 1.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.40234375, -4.273773193359375, -4.14520263671875, -4.016632080078125, -3.8880615234375, -3.759490966796875, -3.63092041015625, -3.502349853515625, -3.373779296875, -3.245208740234375, -3.11663818359375, -2.988067626953125, -2.8594970703125, -2.730926513671875, -2.60235595703125, -2.473785400390625, -2.34521484375, -2.216644287109375, -2.08807373046875, -1.959503173828125, -1.8309326171875, -1.702362060546875, -1.57379150390625, -1.445220947265625, -1.316650390625, -1.188079833984375, -1.05950927734375, -0.930938720703125, -0.8023681640625, -0.673797607421875, -0.54522705078125, -0.416656494140625, -0.2880859375, -0.159515380859375, -0.03094482421875, 0.097625732421875, 0.2261962890625, 0.354766845703125, 0.48333740234375, 0.611907958984375, 0.740478515625, 0.869049072265625, 0.99761962890625, 1.126190185546875, 1.2547607421875, 1.383331298828125, 1.51190185546875, 1.640472412109375, 1.76904296875, 1.897613525390625, 2.02618408203125, 2.154754638671875, 2.2833251953125, 2.411895751953125, 2.54046630859375, 2.669036865234375, 2.797607421875, 2.926177978515625, 3.05474853515625, 3.183319091796875, 3.3118896484375, 3.440460205078125, 3.56903076171875, 3.697601318359375, 3.826171875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 9.0, 15.0, 18.0, 34.0, 51.0, 75.0, 126.0, 201.0, 294.0, 532.0, 866.0, 1527.0, 2373.0, 4281.0, 7396.0, 13462.0, 23903.0, 44830.0, 81635.0, 144652.0, 240551.0, 363375.0, 760659.0, 3274336.0, 510165.0, 327723.0, 211122.0, 124675.0, 68565.0, 37387.0, 20296.0, 11235.0, 6120.0, 3581.0, 2081.0, 1226.0, 780.0, 459.0, 293.0, 180.0, 114.0, 72.0, 62.0, 39.0, 26.0, 14.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.262939453125, -0.25481414794921875, -0.2466888427734375, -0.23856353759765625, -0.230438232421875, -0.22231292724609375, -0.2141876220703125, -0.20606231689453125, -0.19793701171875, -0.18981170654296875, -0.1816864013671875, -0.17356109619140625, -0.165435791015625, -0.15731048583984375, -0.1491851806640625, -0.14105987548828125, -0.1329345703125, -0.12480926513671875, -0.1166839599609375, -0.10855865478515625, -0.100433349609375, -0.09230804443359375, -0.0841827392578125, -0.07605743408203125, -0.06793212890625, -0.05980682373046875, -0.0516815185546875, -0.04355621337890625, -0.035430908203125, -0.02730560302734375, -0.0191802978515625, -0.01105499267578125, -0.0029296875, 0.00519561767578125, 0.0133209228515625, 0.02144622802734375, 0.029571533203125, 0.03769683837890625, 0.0458221435546875, 0.05394744873046875, 0.06207275390625, 0.07019805908203125, 0.0783233642578125, 0.08644866943359375, 0.094573974609375, 0.10269927978515625, 0.1108245849609375, 0.11894989013671875, 0.1270751953125, 0.13520050048828125, 0.1433258056640625, 0.15145111083984375, 0.159576416015625, 0.16770172119140625, 0.1758270263671875, 0.18395233154296875, 0.19207763671875, 0.20020294189453125, 0.2083282470703125, 0.21645355224609375, 0.224578857421875, 0.23270416259765625, 0.2408294677734375, 0.24895477294921875, 0.257080078125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 10.0, 7.0, 6.0, 10.0, 10.0, 18.0, 17.0, 30.0, 14.0, 34.0, 34.0, 37.0, 40.0, 43.0, 42.0, 46.0, 41.0, 83.0, 890.0, 195.0, 44.0, 33.0, 31.0, 36.0, 36.0, 35.0, 36.0, 22.0, 31.0, 17.0, 19.0, 16.0, 13.0, 9.0, 10.0, 8.0, 5.0, 3.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.640625, -3.540985107421875, -3.44134521484375, -3.341705322265625, -3.2420654296875, -3.142425537109375, -3.04278564453125, -2.943145751953125, -2.843505859375, -2.743865966796875, -2.64422607421875, -2.544586181640625, -2.4449462890625, -2.345306396484375, -2.24566650390625, -2.146026611328125, -2.04638671875, -1.946746826171875, -1.84710693359375, -1.747467041015625, -1.6478271484375, -1.548187255859375, -1.44854736328125, -1.348907470703125, -1.249267578125, -1.149627685546875, -1.04998779296875, -0.950347900390625, -0.8507080078125, -0.751068115234375, -0.65142822265625, -0.551788330078125, -0.4521484375, -0.352508544921875, -0.25286865234375, -0.153228759765625, -0.0535888671875, 0.046051025390625, 0.14569091796875, 0.245330810546875, 0.344970703125, 0.444610595703125, 0.54425048828125, 0.643890380859375, 0.7435302734375, 0.843170166015625, 0.94281005859375, 1.042449951171875, 1.14208984375, 1.241729736328125, 1.34136962890625, 1.441009521484375, 1.5406494140625, 1.640289306640625, 1.73992919921875, 1.839569091796875, 1.939208984375, 2.038848876953125, 2.13848876953125, 2.238128662109375, 2.3377685546875, 2.437408447265625, 2.53704833984375, 2.636688232421875, 2.736328125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 8.0, 10.0, 10.0, 11.0, 19.0, 43.0, 34.0, 54.0, 82.0, 124.0, 162.0, 226.0, 325.0, 426.0, 663.0, 1023.0, 1681.0, 2782.0, 5326.0, 11682.0, 29766.0, 88490.0, 278136.0, 765019.0, 4161191.0, 616737.0, 214330.0, 68417.0, 24019.0, 9461.0, 4363.0, 2411.0, 1457.0, 935.0, 583.0, 414.0, 293.0, 211.0, 138.0, 89.0, 72.0, 52.0, 44.0, 27.0, 26.0, 18.0, 14.0, 9.0, 10.0, 6.0, 4.0, 4.0, 2.0, 5.0], "bins": [-0.5595703125, -0.5432968139648438, -0.5270233154296875, -0.5107498168945312, -0.494476318359375, -0.47820281982421875, -0.4619293212890625, -0.44565582275390625, -0.42938232421875, -0.41310882568359375, -0.3968353271484375, -0.38056182861328125, -0.364288330078125, -0.34801483154296875, -0.3317413330078125, -0.31546783447265625, -0.2991943359375, -0.28292083740234375, -0.2666473388671875, -0.25037384033203125, -0.234100341796875, -0.21782684326171875, -0.2015533447265625, -0.18527984619140625, -0.16900634765625, -0.15273284912109375, -0.1364593505859375, -0.12018585205078125, -0.103912353515625, -0.08763885498046875, -0.0713653564453125, -0.05509185791015625, -0.038818359375, -0.02254486083984375, -0.0062713623046875, 0.01000213623046875, 0.026275634765625, 0.04254913330078125, 0.0588226318359375, 0.07509613037109375, 0.09136962890625, 0.10764312744140625, 0.1239166259765625, 0.14019012451171875, 0.156463623046875, 0.17273712158203125, 0.1890106201171875, 0.20528411865234375, 0.2215576171875, 0.23783111572265625, 0.2541046142578125, 0.27037811279296875, 0.286651611328125, 0.30292510986328125, 0.3191986083984375, 0.33547210693359375, 0.35174560546875, 0.36801910400390625, 0.3842926025390625, 0.40056610107421875, 0.416839599609375, 0.43311309814453125, 0.4493865966796875, 0.46566009521484375, 0.48193359375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 10.0, 6.0, 4.0, 12.0, 8.0, 11.0, 19.0, 21.0, 21.0, 27.0, 25.0, 41.0, 24.0, 27.0, 45.0, 39.0, 30.0, 38.0, 40.0, 105.0, 923.0, 115.0, 49.0, 34.0, 39.0, 35.0, 24.0, 32.0, 24.0, 28.0, 25.0, 21.0, 21.0, 20.0, 21.0, 18.0, 9.0, 7.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.197265625, -3.095672607421875, -2.99407958984375, -2.892486572265625, -2.7908935546875, -2.689300537109375, -2.58770751953125, -2.486114501953125, -2.384521484375, -2.282928466796875, -2.18133544921875, -2.079742431640625, -1.9781494140625, -1.876556396484375, -1.77496337890625, -1.673370361328125, -1.57177734375, -1.470184326171875, -1.36859130859375, -1.266998291015625, -1.1654052734375, -1.063812255859375, -0.96221923828125, -0.860626220703125, -0.759033203125, -0.657440185546875, -0.55584716796875, -0.454254150390625, -0.3526611328125, -0.251068115234375, -0.14947509765625, -0.047882080078125, 0.0537109375, 0.155303955078125, 0.25689697265625, 0.358489990234375, 0.4600830078125, 0.561676025390625, 0.66326904296875, 0.764862060546875, 0.866455078125, 0.968048095703125, 1.06964111328125, 1.171234130859375, 1.2728271484375, 1.374420166015625, 1.47601318359375, 1.577606201171875, 1.67919921875, 1.780792236328125, 1.88238525390625, 1.983978271484375, 2.0855712890625, 2.187164306640625, 2.28875732421875, 2.390350341796875, 2.491943359375, 2.593536376953125, 2.69512939453125, 2.796722412109375, 2.8983154296875, 2.999908447265625, 3.10150146484375, 3.203094482421875, 3.3046875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 10.0, 11.0, 9.0, 35.0, 89.0, 331.0, 319.0, 117.0, 53.0, 16.0, 7.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.579322814941406, -19.090288162231445, -18.601253509521484, -18.112218856811523, -17.623184204101562, -17.13414764404297, -16.64511489868164, -16.156078338623047, -15.667043685913086, -15.178009033203125, -14.688974380493164, -14.199939727783203, -13.710904121398926, -13.221869468688965, -12.732834815979004, -12.243800163269043, -11.754765510559082, -11.265730857849121, -10.77669620513916, -10.287660598754883, -9.798625946044922, -9.309591293334961, -8.820556640625, -8.331521987915039, -7.84248685836792, -7.353452205657959, -6.86441707611084, -6.375382423400879, -5.886347770690918, -5.397312641143799, -4.908277988433838, -4.419242858886719, -3.9302072525024414, -3.4411723613739014, -2.9521374702453613, -2.4631028175354004, -1.9740679264068604, -1.4850330352783203, -0.9959983825683594, -0.5069634914398193, -0.017928600311279297, 0.47110623121261597, 0.9601410627365112, 1.4491758346557617, 1.9382107257843018, 2.427245616912842, 2.9162802696228027, 3.4053151607513428, 3.894350051879883, 4.383384704589844, 4.872419834136963, 5.361454486846924, 5.850489616394043, 6.339524269104004, 6.828558921813965, 7.317593574523926, 7.806628704071045, 8.295663833618164, 8.784698486328125, 9.273733139038086, 9.762767791748047, 10.251802444458008, 10.740837097167969, 11.229872703552246, 11.718907356262207]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 1.0, 3.0, 4.0, 9.0, 7.0, 7.0, 13.0, 19.0, 14.0, 25.0, 25.0, 27.0, 36.0, 31.0, 32.0, 48.0, 44.0, 45.0, 42.0, 40.0, 54.0, 57.0, 35.0, 46.0, 38.0, 38.0, 38.0, 30.0, 26.0, 35.0, 27.0, 19.0, 20.0, 11.0, 11.0, 10.0, 8.0, 7.0, 6.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.10011100769043, -9.768705368041992, -9.437298774719238, -9.1058931350708, -8.774486541748047, -8.44308090209961, -8.111675262451172, -7.780269145965576, -7.4488630294799805, -7.117456912994385, -6.786050796508789, -6.454645156860352, -6.123239040374756, -5.79183292388916, -5.460427284240723, -5.129021167755127, -4.797615051269531, -4.4662089347839355, -4.13480281829834, -3.8033971786499023, -3.4719910621643066, -3.140584945678711, -2.8091790676116943, -2.4777731895446777, -2.146367073059082, -1.8149610757827759, -1.4835550785064697, -1.1521490812301636, -0.8207430839538574, -0.48933708667755127, -0.15793108940124512, 0.17347478866577148, 0.5048809051513672, 0.8362869024276733, 1.1676928997039795, 1.4990988969802856, 1.8305048942565918, 2.1619110107421875, 2.493316888809204, 2.8247227668762207, 3.1561288833618164, 3.487534999847412, 3.8189408779144287, 4.150346755981445, 4.481752872467041, 4.813158988952637, 5.144564628601074, 5.47597074508667, 5.807376861572266, 6.138782978057861, 6.470189094543457, 6.8015947341918945, 7.13300085067749, 7.464406967163086, 7.795812606811523, 8.127218246459961, 8.458624839782715, 8.790030479431152, 9.121437072753906, 9.452842712402344, 9.784248352050781, 10.115654945373535, 10.447060585021973, 10.778467178344727, 11.109872817993164]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 5.0, 4.0, 6.0, 16.0, 21.0, 24.0, 29.0, 36.0, 57.0, 94.0, 110.0, 161.0, 290.0, 556.0, 1303.0, 3872.0, 14577.0, 112770.0, 3952287.0, 88110.0, 13562.0, 3976.0, 1258.0, 509.0, 218.0, 121.0, 72.0, 54.0, 40.0, 38.0, 31.0, 23.0, 18.0, 14.0, 15.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.234130859375, -0.22752952575683594, -0.22092819213867188, -0.2143268585205078, -0.20772552490234375, -0.2011241912841797, -0.19452285766601562, -0.18792152404785156, -0.1813201904296875, -0.17471885681152344, -0.16811752319335938, -0.1615161895751953, -0.15491485595703125, -0.1483135223388672, -0.14171218872070312, -0.13511085510253906, -0.128509521484375, -0.12190818786621094, -0.11530685424804688, -0.10870552062988281, -0.10210418701171875, -0.09550285339355469, -0.08890151977539062, -0.08230018615722656, -0.0756988525390625, -0.06909751892089844, -0.062496185302734375, -0.05589485168457031, -0.04929351806640625, -0.04269218444824219, -0.036090850830078125, -0.029489517211914062, -0.02288818359375, -0.016286849975585938, -0.009685516357421875, -0.0030841827392578125, 0.00351715087890625, 0.010118484497070312, 0.016719818115234375, 0.023321151733398438, 0.0299224853515625, 0.03652381896972656, 0.043125152587890625, 0.04972648620605469, 0.05632781982421875, 0.06292915344238281, 0.06953048706054688, 0.07613182067871094, 0.082733154296875, 0.08933448791503906, 0.09593582153320312, 0.10253715515136719, 0.10913848876953125, 0.11573982238769531, 0.12234115600585938, 0.12894248962402344, 0.1355438232421875, 0.14214515686035156, 0.14874649047851562, 0.1553478240966797, 0.16194915771484375, 0.1685504913330078, 0.17515182495117188, 0.18175315856933594, 0.1883544921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 9.0, 10.0, 9.0, 7.0, 14.0, 16.0, 25.0, 22.0, 19.0, 25.0, 33.0, 38.0, 46.0, 51.0, 58.0, 53.0, 61.0, 60.0, 53.0, 53.0, 50.0, 45.0, 40.0, 33.0, 22.0, 32.0, 16.0, 10.0, 16.0, 14.0, 15.0, 12.0, 10.0, 4.0, 8.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042877197265625, -0.04157590866088867, -0.040274620056152344, -0.038973331451416016, -0.03767204284667969, -0.03637075424194336, -0.03506946563720703, -0.0337681770324707, -0.032466888427734375, -0.031165599822998047, -0.02986431121826172, -0.02856302261352539, -0.027261734008789062, -0.025960445404052734, -0.024659156799316406, -0.023357868194580078, -0.02205657958984375, -0.020755290985107422, -0.019454002380371094, -0.018152713775634766, -0.016851425170898438, -0.01555013656616211, -0.014248847961425781, -0.012947559356689453, -0.011646270751953125, -0.010344982147216797, -0.009043693542480469, -0.007742404937744141, -0.0064411163330078125, -0.005139827728271484, -0.0038385391235351562, -0.002537250518798828, -0.0012359619140625, 6.532669067382812e-05, 0.0013666152954101562, 0.0026679039001464844, 0.0039691925048828125, 0.005270481109619141, 0.006571769714355469, 0.007873058319091797, 0.009174346923828125, 0.010475635528564453, 0.011776924133300781, 0.01307821273803711, 0.014379501342773438, 0.015680789947509766, 0.016982078552246094, 0.018283367156982422, 0.01958465576171875, 0.020885944366455078, 0.022187232971191406, 0.023488521575927734, 0.024789810180664062, 0.02609109878540039, 0.02739238739013672, 0.028693675994873047, 0.029994964599609375, 0.0312962532043457, 0.03259754180908203, 0.03389883041381836, 0.03520011901855469, 0.036501407623291016, 0.037802696228027344, 0.03910398483276367, 0.0404052734375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 7.0, 10.0, 17.0, 13.0, 31.0, 39.0, 59.0, 91.0, 270.0, 1474.0, 59622.0, 4122011.0, 9568.0, 703.0, 127.0, 62.0, 43.0, 23.0, 15.0, 15.0, 14.0, 5.0, 7.0, 8.0, 8.0, 6.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.279052734375, -0.2709197998046875, -0.262786865234375, -0.2546539306640625, -0.24652099609375, -0.2383880615234375, -0.230255126953125, -0.2221221923828125, -0.2139892578125, -0.2058563232421875, -0.197723388671875, -0.1895904541015625, -0.18145751953125, -0.1733245849609375, -0.165191650390625, -0.1570587158203125, -0.14892578125, -0.1407928466796875, -0.132659912109375, -0.1245269775390625, -0.11639404296875, -0.1082611083984375, -0.100128173828125, -0.0919952392578125, -0.0838623046875, -0.0757293701171875, -0.067596435546875, -0.0594635009765625, -0.05133056640625, -0.0431976318359375, -0.035064697265625, -0.0269317626953125, -0.018798828125, -0.0106658935546875, -0.002532958984375, 0.0055999755859375, 0.01373291015625, 0.0218658447265625, 0.029998779296875, 0.0381317138671875, 0.0462646484375, 0.0543975830078125, 0.062530517578125, 0.0706634521484375, 0.07879638671875, 0.0869293212890625, 0.095062255859375, 0.1031951904296875, 0.111328125, 0.1194610595703125, 0.127593994140625, 0.1357269287109375, 0.14385986328125, 0.1519927978515625, 0.160125732421875, 0.1682586669921875, 0.1763916015625, 0.1845245361328125, 0.192657470703125, 0.2007904052734375, 0.20892333984375, 0.2170562744140625, 0.225189208984375, 0.2333221435546875, 0.241455078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 8.0, 4.0, 2.0, 10.0, 14.0, 13.0, 27.0, 48.0, 77.0, 182.0, 441.0, 1107.0, 1181.0, 522.0, 196.0, 92.0, 46.0, 26.0, 25.0, 16.0, 8.0, 10.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0911865234375, -0.08833789825439453, -0.08548927307128906, -0.0826406478881836, -0.07979202270507812, -0.07694339752197266, -0.07409477233886719, -0.07124614715576172, -0.06839752197265625, -0.06554889678955078, -0.06270027160644531, -0.059851646423339844, -0.057003021240234375, -0.054154396057128906, -0.05130577087402344, -0.04845714569091797, -0.0456085205078125, -0.04275989532470703, -0.03991127014160156, -0.037062644958496094, -0.034214019775390625, -0.031365394592285156, -0.028516769409179688, -0.02566814422607422, -0.02281951904296875, -0.01997089385986328, -0.017122268676757812, -0.014273643493652344, -0.011425018310546875, -0.008576393127441406, -0.0057277679443359375, -0.0028791427612304688, -3.0517578125e-05, 0.0028181076049804688, 0.0056667327880859375, 0.008515357971191406, 0.011363983154296875, 0.014212608337402344, 0.017061233520507812, 0.01990985870361328, 0.02275848388671875, 0.02560710906982422, 0.028455734252929688, 0.031304359436035156, 0.034152984619140625, 0.037001609802246094, 0.03985023498535156, 0.04269886016845703, 0.0455474853515625, 0.04839611053466797, 0.05124473571777344, 0.054093360900878906, 0.056941986083984375, 0.059790611267089844, 0.06263923645019531, 0.06548786163330078, 0.06833648681640625, 0.07118511199951172, 0.07403373718261719, 0.07688236236572266, 0.07973098754882812, 0.0825796127319336, 0.08542823791503906, 0.08827686309814453, 0.09112548828125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 9.0, 793.0, 199.0, 10.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1575231552124023, -1.0923783779144287, -1.027233600616455, -0.9620888233184814, -0.8969440460205078, -0.8317992687225342, -0.7666545510292053, -0.7015097737312317, -0.6363649964332581, -0.5712202191352844, -0.5060754418373108, -0.44093069434165955, -0.3757859170436859, -0.3106411397457123, -0.24549639225006104, -0.1803516149520874, -0.11520683765411377, -0.050062067806720734, 0.015082702040672302, 0.08022746443748474, 0.14537224173545837, 0.210517019033432, 0.27566176652908325, 0.3408065438270569, 0.4059513211250305, 0.47109609842300415, 0.5362408757209778, 0.6013855934143066, 0.6665303707122803, 0.7316751480102539, 0.7968199253082275, 0.8619647026062012, 0.9271094799041748, 0.9922542572021484, 1.057399034500122, 1.1225438117980957, 1.1876885890960693, 1.252833366394043, 1.3179781436920166, 1.3831229209899902, 1.4482676982879639, 1.5134124755859375, 1.5785572528839111, 1.6437020301818848, 1.7088468074798584, 1.773991584777832, 1.8391363620758057, 1.9042811393737793, 1.9694257974624634, 2.0345704555511475, 2.099715232849121, 2.1648600101470947, 2.2300047874450684, 2.295149564743042, 2.3602943420410156, 2.4254391193389893, 2.490583896636963, 2.5557286739349365, 2.62087345123291, 2.686018228530884, 2.7511630058288574, 2.816307783126831, 2.8814525604248047, 2.9465973377227783, 3.011742115020752]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 2.0, 5.0, 4.0, 2.0, 9.0, 11.0, 11.0, 13.0, 18.0, 17.0, 31.0, 23.0, 26.0, 20.0, 31.0, 39.0, 39.0, 33.0, 31.0, 30.0, 50.0, 38.0, 39.0, 36.0, 37.0, 41.0, 57.0, 34.0, 36.0, 30.0, 22.0, 26.0, 26.0, 13.0, 19.0, 22.0, 13.0, 14.0, 14.0, 10.0, 6.0, 7.0, 1.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.15533310174942017, -0.15025539696216583, -0.1451776921749115, -0.14009998738765717, -0.13502228260040283, -0.1299445629119873, -0.12486685812473297, -0.11978915333747864, -0.1147114485502243, -0.10963374376296997, -0.10455603897571564, -0.0994783267378807, -0.09440062195062637, -0.08932291716337204, -0.08424520492553711, -0.07916750013828278, -0.07408979535102844, -0.06901209056377411, -0.06393438577651978, -0.058856673538684845, -0.05377896875143051, -0.04870126396417618, -0.043623555451631546, -0.038545846939086914, -0.03346814215183258, -0.028390435501933098, -0.023312728852033615, -0.018235022202134132, -0.01315731555223465, -0.008079608902335167, -0.003001902252435684, 0.0020758062601089478, 0.007153511047363281, 0.012231217697262764, 0.017308924347162247, 0.02238663099706173, 0.027464337646961212, 0.032542042434215546, 0.03761975094676018, 0.04269745945930481, 0.04777516424655914, 0.05285286903381348, 0.05793057754635811, 0.06300828605890274, 0.06808599084615707, 0.07316369563341141, 0.07824140787124634, 0.08331911265850067, 0.088396817445755, 0.09347452223300934, 0.09855222702026367, 0.1036299392580986, 0.10870764404535294, 0.11378534883260727, 0.1188630610704422, 0.12394076585769653, 0.12901847064495087, 0.1340961754322052, 0.13917388021945953, 0.14425158500671387, 0.1493293046951294, 0.15440700948238373, 0.15948471426963806, 0.1645624190568924, 0.16964012384414673]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 6.0, 7.0, 18.0, 14.0, 21.0, 23.0, 33.0, 42.0, 74.0, 93.0, 129.0, 191.0, 249.0, 442.0, 648.0, 1070.0, 1952.0, 3891.0, 9424.0, 40764.0, 808077.0, 152252.0, 16883.0, 5726.0, 2678.0, 1411.0, 872.0, 518.0, 320.0, 231.0, 143.0, 106.0, 65.0, 37.0, 32.0, 30.0, 21.0, 18.0, 14.0, 8.0, 6.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.20849609375, -0.20124053955078125, -0.1939849853515625, -0.18672943115234375, -0.179473876953125, -0.17221832275390625, -0.1649627685546875, -0.15770721435546875, -0.15045166015625, -0.14319610595703125, -0.1359405517578125, -0.12868499755859375, -0.121429443359375, -0.11417388916015625, -0.1069183349609375, -0.09966278076171875, -0.0924072265625, -0.08515167236328125, -0.0778961181640625, -0.07064056396484375, -0.063385009765625, -0.05612945556640625, -0.0488739013671875, -0.04161834716796875, -0.03436279296875, -0.02710723876953125, -0.0198516845703125, -0.01259613037109375, -0.005340576171875, 0.00191497802734375, 0.0091705322265625, 0.01642608642578125, 0.023681640625, 0.03093719482421875, 0.0381927490234375, 0.04544830322265625, 0.052703857421875, 0.05995941162109375, 0.0672149658203125, 0.07447052001953125, 0.08172607421875, 0.08898162841796875, 0.0962371826171875, 0.10349273681640625, 0.110748291015625, 0.11800384521484375, 0.1252593994140625, 0.13251495361328125, 0.1397705078125, 0.14702606201171875, 0.1542816162109375, 0.16153717041015625, 0.168792724609375, 0.17604827880859375, 0.1833038330078125, 0.19055938720703125, 0.19781494140625, 0.20507049560546875, 0.2123260498046875, 0.21958160400390625, 0.226837158203125, 0.23409271240234375, 0.2413482666015625, 0.24860382080078125, 0.255859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 7.0, 12.0, 9.0, 10.0, 19.0, 18.0, 16.0, 18.0, 28.0, 25.0, 32.0, 37.0, 42.0, 53.0, 51.0, 53.0, 57.0, 58.0, 47.0, 51.0, 44.0, 41.0, 29.0, 47.0, 26.0, 30.0, 22.0, 17.0, 13.0, 19.0, 11.0, 12.0, 8.0, 8.0, 7.0, 4.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.046173095703125, -0.04496145248413086, -0.04374980926513672, -0.04253816604614258, -0.04132652282714844, -0.0401148796081543, -0.038903236389160156, -0.037691593170166016, -0.036479949951171875, -0.035268306732177734, -0.034056663513183594, -0.03284502029418945, -0.03163337707519531, -0.030421733856201172, -0.02921009063720703, -0.02799844741821289, -0.02678680419921875, -0.02557516098022461, -0.02436351776123047, -0.023151874542236328, -0.021940231323242188, -0.020728588104248047, -0.019516944885253906, -0.018305301666259766, -0.017093658447265625, -0.015882015228271484, -0.014670372009277344, -0.013458728790283203, -0.012247085571289062, -0.011035442352294922, -0.009823799133300781, -0.00861215591430664, -0.0074005126953125, -0.006188869476318359, -0.004977226257324219, -0.003765583038330078, -0.0025539398193359375, -0.0013422966003417969, -0.00013065338134765625, 0.0010809898376464844, 0.002292633056640625, 0.0035042762756347656, 0.004715919494628906, 0.005927562713623047, 0.0071392059326171875, 0.008350849151611328, 0.009562492370605469, 0.01077413558959961, 0.01198577880859375, 0.01319742202758789, 0.014409065246582031, 0.015620708465576172, 0.016832351684570312, 0.018043994903564453, 0.019255638122558594, 0.020467281341552734, 0.021678924560546875, 0.022890567779541016, 0.024102210998535156, 0.025313854217529297, 0.026525497436523438, 0.027737140655517578, 0.02894878387451172, 0.03016042709350586, 0.0313720703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 7.0, 3.0, 8.0, 5.0, 16.0, 24.0, 28.0, 40.0, 44.0, 48.0, 68.0, 86.0, 162.0, 241.0, 658.0, 2375.0, 18089.0, 401264.0, 593738.0, 26963.0, 3081.0, 750.0, 322.0, 149.0, 86.0, 80.0, 38.0, 45.0, 35.0, 21.0, 13.0, 16.0, 13.0, 6.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1156005859375, -0.11199665069580078, -0.10839271545410156, -0.10478878021240234, -0.10118484497070312, -0.0975809097290039, -0.09397697448730469, -0.09037303924560547, -0.08676910400390625, -0.08316516876220703, -0.07956123352050781, -0.0759572982788086, -0.07235336303710938, -0.06874942779541016, -0.06514549255371094, -0.06154155731201172, -0.0579376220703125, -0.05433368682861328, -0.05072975158691406, -0.047125816345214844, -0.043521881103515625, -0.039917945861816406, -0.03631401062011719, -0.03271007537841797, -0.02910614013671875, -0.02550220489501953, -0.021898269653320312, -0.018294334411621094, -0.014690399169921875, -0.011086463928222656, -0.0074825286865234375, -0.0038785934448242188, -0.000274658203125, 0.0033292770385742188, 0.0069332122802734375, 0.010537147521972656, 0.014141082763671875, 0.017745018005371094, 0.021348953247070312, 0.02495288848876953, 0.02855682373046875, 0.03216075897216797, 0.03576469421386719, 0.039368629455566406, 0.042972564697265625, 0.046576499938964844, 0.05018043518066406, 0.05378437042236328, 0.0573883056640625, 0.06099224090576172, 0.06459617614746094, 0.06820011138916016, 0.07180404663085938, 0.0754079818725586, 0.07901191711425781, 0.08261585235595703, 0.08621978759765625, 0.08982372283935547, 0.09342765808105469, 0.0970315933227539, 0.10063552856445312, 0.10423946380615234, 0.10784339904785156, 0.11144733428955078, 0.11505126953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 10.0, 7.0, 12.0, 15.0, 10.0, 18.0, 31.0, 22.0, 26.0, 25.0, 34.0, 43.0, 37.0, 43.0, 46.0, 46.0, 48.0, 51.0, 45.0, 54.0, 43.0, 33.0, 33.0, 38.0, 33.0, 36.0, 15.0, 19.0, 21.0, 21.0, 15.0, 21.0, 17.0, 3.0, 9.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.10675048828125, -0.10381507873535156, -0.10087966918945312, -0.09794425964355469, -0.09500885009765625, -0.09207344055175781, -0.08913803100585938, -0.08620262145996094, -0.0832672119140625, -0.08033180236816406, -0.07739639282226562, -0.07446098327636719, -0.07152557373046875, -0.06859016418457031, -0.06565475463867188, -0.06271934509277344, -0.059783935546875, -0.05684852600097656, -0.053913116455078125, -0.05097770690917969, -0.04804229736328125, -0.04510688781738281, -0.042171478271484375, -0.03923606872558594, -0.0363006591796875, -0.03336524963378906, -0.030429840087890625, -0.027494430541992188, -0.02455902099609375, -0.021623611450195312, -0.018688201904296875, -0.015752792358398438, -0.0128173828125, -0.009881973266601562, -0.006946563720703125, -0.0040111541748046875, -0.00107574462890625, 0.0018596649169921875, 0.004795074462890625, 0.0077304840087890625, 0.0106658935546875, 0.013601303100585938, 0.016536712646484375, 0.019472122192382812, 0.02240753173828125, 0.025342941284179688, 0.028278350830078125, 0.031213760375976562, 0.034149169921875, 0.03708457946777344, 0.040019989013671875, 0.04295539855957031, 0.04589080810546875, 0.04882621765136719, 0.051761627197265625, 0.05469703674316406, 0.0576324462890625, 0.06056785583496094, 0.06350326538085938, 0.06643867492675781, 0.06937408447265625, 0.07230949401855469, 0.07524490356445312, 0.07818031311035156, 0.08111572265625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 9.0, 10.0, 6.0, 20.0, 15.0, 29.0, 50.0, 57.0, 77.0, 118.0, 193.0, 390.0, 811.0, 1921.0, 5057.0, 22955.0, 492696.0, 492391.0, 22950.0, 5021.0, 1929.0, 823.0, 399.0, 213.0, 120.0, 76.0, 60.0, 44.0, 29.0, 21.0, 20.0, 9.0, 10.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02484130859375, -0.02403998374938965, -0.023238658905029297, -0.022437334060668945, -0.021636009216308594, -0.020834684371948242, -0.02003335952758789, -0.01923203468322754, -0.018430709838867188, -0.017629384994506836, -0.016828060150146484, -0.016026735305786133, -0.015225410461425781, -0.01442408561706543, -0.013622760772705078, -0.012821435928344727, -0.012020111083984375, -0.011218786239624023, -0.010417461395263672, -0.00961613655090332, -0.008814811706542969, -0.008013486862182617, -0.007212162017822266, -0.006410837173461914, -0.0056095123291015625, -0.004808187484741211, -0.004006862640380859, -0.003205537796020508, -0.0024042129516601562, -0.0016028881072998047, -0.0008015632629394531, -2.384185791015625e-07, 0.00080108642578125, 0.0016024112701416016, 0.002403736114501953, 0.0032050609588623047, 0.004006385803222656, 0.004807710647583008, 0.005609035491943359, 0.006410360336303711, 0.0072116851806640625, 0.008013010025024414, 0.008814334869384766, 0.009615659713745117, 0.010416984558105469, 0.01121830940246582, 0.012019634246826172, 0.012820959091186523, 0.013622283935546875, 0.014423608779907227, 0.015224933624267578, 0.01602625846862793, 0.01682758331298828, 0.017628908157348633, 0.018430233001708984, 0.019231557846069336, 0.020032882690429688, 0.02083420753479004, 0.02163553237915039, 0.022436857223510742, 0.023238182067871094, 0.024039506912231445, 0.024840831756591797, 0.02564215660095215, 0.0264434814453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 3.0, 5.0, 11.0, 16.0, 15.0, 18.0, 15.0, 30.0, 40.0, 49.0, 58.0, 54.0, 82.0, 77.0, 84.0, 68.0, 53.0, 65.0, 53.0, 35.0, 47.0, 21.0, 26.0, 15.0, 17.0, 9.0, 12.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0728836059570312e-05, -1.044292002916336e-05, -1.0157003998756409e-05, -9.871087968349457e-06, -9.585171937942505e-06, -9.299255907535553e-06, -9.013339877128601e-06, -8.72742384672165e-06, -8.441507816314697e-06, -8.155591785907745e-06, -7.869675755500793e-06, -7.5837597250938416e-06, -7.29784369468689e-06, -7.011927664279938e-06, -6.726011633872986e-06, -6.440095603466034e-06, -6.154179573059082e-06, -5.86826354265213e-06, -5.582347512245178e-06, -5.296431481838226e-06, -5.010515451431274e-06, -4.7245994210243225e-06, -4.438683390617371e-06, -4.152767360210419e-06, -3.866851329803467e-06, -3.580935299396515e-06, -3.295019268989563e-06, -3.009103238582611e-06, -2.723187208175659e-06, -2.4372711777687073e-06, -2.1513551473617554e-06, -1.8654391169548035e-06, -1.5795230865478516e-06, -1.2936070561408997e-06, -1.0076910257339478e-06, -7.217749953269958e-07, -4.3585896492004395e-07, -1.4994293451309204e-07, 1.3597309589385986e-07, 4.2188912630081177e-07, 7.078051567077637e-07, 9.937211871147156e-07, 1.2796372175216675e-06, 1.5655532479286194e-06, 1.8514692783355713e-06, 2.137385308742523e-06, 2.423301339149475e-06, 2.709217369556427e-06, 2.995133399963379e-06, 3.281049430370331e-06, 3.5669654607772827e-06, 3.852881491184235e-06, 4.1387975215911865e-06, 4.4247135519981384e-06, 4.71062958240509e-06, 4.996545612812042e-06, 5.282461643218994e-06, 5.568377673625946e-06, 5.854293704032898e-06, 6.14020973443985e-06, 6.426125764846802e-06, 6.712041795253754e-06, 6.9979578256607056e-06, 7.2838738560676575e-06, 7.569789886474609e-06]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 11.0, 6.0, 15.0, 20.0, 40.0, 88.0, 196.0, 377.0, 739.0, 1592.0, 3579.0, 10678.0, 344021.0, 666267.0, 13428.0, 3943.0, 1773.0, 875.0, 419.0, 225.0, 101.0, 54.0, 32.0, 15.0, 11.0, 6.0, 6.0, 2.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.04595947265625, -0.04432201385498047, -0.04268455505371094, -0.041047096252441406, -0.039409637451171875, -0.037772178649902344, -0.03613471984863281, -0.03449726104736328, -0.03285980224609375, -0.03122234344482422, -0.029584884643554688, -0.027947425842285156, -0.026309967041015625, -0.024672508239746094, -0.023035049438476562, -0.02139759063720703, -0.0197601318359375, -0.01812267303466797, -0.016485214233398438, -0.014847755432128906, -0.013210296630859375, -0.011572837829589844, -0.009935379028320312, -0.008297920227050781, -0.00666046142578125, -0.005023002624511719, -0.0033855438232421875, -0.0017480850219726562, -0.000110626220703125, 0.0015268325805664062, 0.0031642913818359375, 0.004801750183105469, 0.006439208984375, 0.008076667785644531, 0.009714126586914062, 0.011351585388183594, 0.012989044189453125, 0.014626502990722656, 0.016263961791992188, 0.01790142059326172, 0.01953887939453125, 0.02117633819580078, 0.022813796997070312, 0.024451255798339844, 0.026088714599609375, 0.027726173400878906, 0.029363632202148438, 0.03100109100341797, 0.0326385498046875, 0.03427600860595703, 0.03591346740722656, 0.037550926208496094, 0.039188385009765625, 0.040825843811035156, 0.04246330261230469, 0.04410076141357422, 0.04573822021484375, 0.04737567901611328, 0.04901313781738281, 0.050650596618652344, 0.052288055419921875, 0.053925514221191406, 0.05556297302246094, 0.05720043182373047, 0.058837890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 6.0, 5.0, 9.0, 17.0, 24.0, 34.0, 52.0, 101.0, 130.0, 192.0, 147.0, 107.0, 45.0, 36.0, 24.0, 15.0, 12.0, 5.0, 7.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04559326171875, -0.04431343078613281, -0.043033599853515625, -0.04175376892089844, -0.04047393798828125, -0.03919410705566406, -0.037914276123046875, -0.03663444519042969, -0.0353546142578125, -0.03407478332519531, -0.032794952392578125, -0.03151512145996094, -0.03023529052734375, -0.028955459594726562, -0.027675628662109375, -0.026395797729492188, -0.025115966796875, -0.023836135864257812, -0.022556304931640625, -0.021276473999023438, -0.01999664306640625, -0.018716812133789062, -0.017436981201171875, -0.016157150268554688, -0.0148773193359375, -0.013597488403320312, -0.012317657470703125, -0.011037826538085938, -0.00975799560546875, -0.008478164672851562, -0.007198333740234375, -0.0059185028076171875, -0.004638671875, -0.0033588409423828125, -0.002079010009765625, -0.0007991790771484375, 0.00048065185546875, 0.0017604827880859375, 0.003040313720703125, 0.0043201446533203125, 0.0055999755859375, 0.0068798065185546875, 0.008159637451171875, 0.009439468383789062, 0.01071929931640625, 0.011999130249023438, 0.013278961181640625, 0.014558792114257812, 0.015838623046875, 0.017118453979492188, 0.018398284912109375, 0.019678115844726562, 0.02095794677734375, 0.022237777709960938, 0.023517608642578125, 0.024797439575195312, 0.0260772705078125, 0.027357101440429688, 0.028636932373046875, 0.029916763305664062, 0.03119659423828125, 0.03247642517089844, 0.033756256103515625, 0.03503608703613281, 0.03631591796875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 32.0, 240.0, 568.0, 135.0, 21.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7432074546813965, -1.6939830780029297, -1.644758701324463, -1.5955342054367065, -1.5463098287582397, -1.497085452079773, -1.4478610754013062, -1.3986365795135498, -1.349412202835083, -1.3001878261566162, -1.2509634494781494, -1.201738953590393, -1.1525145769119263, -1.1032902002334595, -1.0540658235549927, -1.0048413276672363, -0.9556170105934143, -0.9063926339149475, -0.8571681976318359, -0.8079438209533691, -0.7587193846702576, -0.7094950079917908, -0.6602705717086792, -0.6110461950302124, -0.5618218183517456, -0.5125974416732788, -0.46337300539016724, -0.41414862871170044, -0.36492419242858887, -0.31569981575012207, -0.2664754092693329, -0.2172510027885437, -0.16802656650543213, -0.11880216002464294, -0.06957776099443436, -0.02035336196422577, 0.028871044516563416, 0.0780954509973526, 0.1273198425769806, 0.17654424905776978, 0.22576865553855896, 0.27499306201934814, 0.32421746850013733, 0.3734418749809265, 0.4226662516593933, 0.4718906879425049, 0.5211150646209717, 0.5703394412994385, 0.61956387758255, 0.6687882542610168, 0.7180126905441284, 0.7672370672225952, 0.8164615035057068, 0.8656858801841736, 0.9149103164672852, 0.964134693145752, 1.0133590698242188, 1.0625834465026855, 1.1118078231811523, 1.1610323190689087, 1.2102566957473755, 1.2594810724258423, 1.308705449104309, 1.3579299449920654, 1.4071543216705322]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 4.0, 9.0, 6.0, 7.0, 7.0, 11.0, 10.0, 16.0, 16.0, 21.0, 15.0, 18.0, 26.0, 31.0, 22.0, 33.0, 35.0, 28.0, 39.0, 30.0, 38.0, 34.0, 38.0, 35.0, 35.0, 51.0, 32.0, 48.0, 34.0, 36.0, 36.0, 26.0, 25.0, 18.0, 22.0, 20.0, 16.0, 20.0, 7.0, 13.0, 10.0, 4.0, 4.0, 3.0, 4.0, 5.0, 0.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.49558281898498535, -0.4802844822406769, -0.464986115694046, -0.44968777894973755, -0.4343894124031067, -0.4190910756587982, -0.40379270911216736, -0.3884943723678589, -0.373196005821228, -0.35789766907691956, -0.3425993025302887, -0.3273009657859802, -0.31200259923934937, -0.2967042624950409, -0.28140589594841003, -0.26610755920410156, -0.2508091926574707, -0.23551084101200104, -0.22021248936653137, -0.2049141377210617, -0.18961578607559204, -0.17431744933128357, -0.1590190827846527, -0.14372074604034424, -0.12842240929603577, -0.1131240576505661, -0.09782570600509644, -0.08252735435962677, -0.0672290027141571, -0.051930658519268036, -0.03663230687379837, -0.021333955228328705, -0.006035596132278442, 0.009262754581868649, 0.02456110529601574, 0.039859455078840256, 0.05515780672430992, 0.07045615464448929, 0.08575450628995895, 0.10105285793542862, 0.11635120958089828, 0.13164955377578735, 0.14694790542125702, 0.16224625706672668, 0.17754460871219635, 0.19284296035766602, 0.20814131200313568, 0.22343966364860535, 0.238738015294075, 0.2540363669395447, 0.26933470368385315, 0.284633070230484, 0.2999314069747925, 0.31522977352142334, 0.3305281102657318, 0.34582647681236267, 0.36112481355667114, 0.3764231503009796, 0.3917215168476105, 0.40701985359191895, 0.4223182201385498, 0.4376165568828583, 0.45291492342948914, 0.4682132601737976, 0.48351162672042847]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 9.0, 10.0, 11.0, 17.0, 17.0, 9.0, 27.0, 36.0, 38.0, 48.0, 64.0, 102.0, 266.0, 1035.0, 5574.0, 4116116.0, 67274.0, 2579.0, 553.0, 156.0, 90.0, 45.0, 32.0, 24.0, 33.0, 21.0, 14.0, 18.0, 11.0, 9.0, 13.0, 8.0, 7.0, 1.0, 6.0, 4.0, 3.0, 1.0], "bins": [-0.63916015625, -0.6238632202148438, -0.6085662841796875, -0.5932693481445312, -0.577972412109375, -0.5626754760742188, -0.5473785400390625, -0.5320816040039062, -0.51678466796875, -0.5014877319335938, -0.4861907958984375, -0.47089385986328125, -0.455596923828125, -0.44029998779296875, -0.4250030517578125, -0.40970611572265625, -0.3944091796875, -0.37911224365234375, -0.3638153076171875, -0.34851837158203125, -0.333221435546875, -0.31792449951171875, -0.3026275634765625, -0.28733062744140625, -0.27203369140625, -0.25673675537109375, -0.2414398193359375, -0.22614288330078125, -0.210845947265625, -0.19554901123046875, -0.1802520751953125, -0.16495513916015625, -0.149658203125, -0.13436126708984375, -0.1190643310546875, -0.10376739501953125, -0.088470458984375, -0.07317352294921875, -0.0578765869140625, -0.04257965087890625, -0.02728271484375, -0.01198577880859375, 0.0033111572265625, 0.01860809326171875, 0.033905029296875, 0.04920196533203125, 0.0644989013671875, 0.07979583740234375, 0.0950927734375, 0.11038970947265625, 0.1256866455078125, 0.14098358154296875, 0.156280517578125, 0.17157745361328125, 0.1868743896484375, 0.20217132568359375, 0.21746826171875, 0.23276519775390625, 0.2480621337890625, 0.26335906982421875, 0.278656005859375, 0.29395294189453125, 0.3092498779296875, 0.32454681396484375, 0.33984375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 10.0, 5.0, 9.0, 19.0, 13.0, 11.0, 11.0, 26.0, 22.0, 27.0, 33.0, 31.0, 46.0, 51.0, 55.0, 58.0, 64.0, 43.0, 55.0, 52.0, 50.0, 41.0, 44.0, 31.0, 22.0, 35.0, 19.0, 20.0, 19.0, 15.0, 10.0, 18.0, 7.0, 7.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.04669189453125, -0.04546976089477539, -0.04424762725830078, -0.04302549362182617, -0.04180335998535156, -0.04058122634887695, -0.039359092712402344, -0.038136959075927734, -0.036914825439453125, -0.035692691802978516, -0.034470558166503906, -0.0332484245300293, -0.03202629089355469, -0.030804157257080078, -0.02958202362060547, -0.02835988998413086, -0.02713775634765625, -0.02591562271118164, -0.02469348907470703, -0.023471355438232422, -0.022249221801757812, -0.021027088165283203, -0.019804954528808594, -0.018582820892333984, -0.017360687255859375, -0.016138553619384766, -0.014916419982910156, -0.013694286346435547, -0.012472152709960938, -0.011250019073486328, -0.010027885437011719, -0.00880575180053711, -0.0075836181640625, -0.006361484527587891, -0.005139350891113281, -0.003917217254638672, -0.0026950836181640625, -0.0014729499816894531, -0.00025081634521484375, 0.0009713172912597656, 0.002193450927734375, 0.0034155845642089844, 0.004637718200683594, 0.005859851837158203, 0.0070819854736328125, 0.008304119110107422, 0.009526252746582031, 0.01074838638305664, 0.01197052001953125, 0.01319265365600586, 0.014414787292480469, 0.015636920928955078, 0.016859054565429688, 0.018081188201904297, 0.019303321838378906, 0.020525455474853516, 0.021747589111328125, 0.022969722747802734, 0.024191856384277344, 0.025413990020751953, 0.026636123657226562, 0.027858257293701172, 0.02908039093017578, 0.03030252456665039, 0.031524658203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 7.0, 5.0, 7.0, 18.0, 12.0, 43.0, 56.0, 142.0, 366.0, 1196.0, 7016.0, 92368.0, 3170474.0, 886178.0, 31586.0, 3556.0, 732.0, 260.0, 99.0, 61.0, 37.0, 25.0, 17.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10162353515625, -0.09752750396728516, -0.09343147277832031, -0.08933544158935547, -0.08523941040039062, -0.08114337921142578, -0.07704734802246094, -0.0729513168334961, -0.06885528564453125, -0.0647592544555664, -0.06066322326660156, -0.05656719207763672, -0.052471160888671875, -0.04837512969970703, -0.04427909851074219, -0.040183067321777344, -0.0360870361328125, -0.031991004943847656, -0.027894973754882812, -0.02379894256591797, -0.019702911376953125, -0.015606880187988281, -0.011510848999023438, -0.007414817810058594, -0.00331878662109375, 0.0007772445678710938, 0.0048732757568359375, 0.008969306945800781, 0.013065338134765625, 0.01716136932373047, 0.021257400512695312, 0.025353431701660156, 0.029449462890625, 0.033545494079589844, 0.03764152526855469, 0.04173755645751953, 0.045833587646484375, 0.04992961883544922, 0.05402565002441406, 0.058121681213378906, 0.06221771240234375, 0.0663137435913086, 0.07040977478027344, 0.07450580596923828, 0.07860183715820312, 0.08269786834716797, 0.08679389953613281, 0.09088993072509766, 0.0949859619140625, 0.09908199310302734, 0.10317802429199219, 0.10727405548095703, 0.11137008666992188, 0.11546611785888672, 0.11956214904785156, 0.1236581802368164, 0.12775421142578125, 0.1318502426147461, 0.13594627380371094, 0.14004230499267578, 0.14413833618164062, 0.14823436737060547, 0.1523303985595703, 0.15642642974853516, 0.1605224609375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 8.0, 13.0, 15.0, 9.0, 22.0, 52.0, 43.0, 68.0, 108.0, 172.0, 261.0, 459.0, 821.0, 734.0, 484.0, 277.0, 201.0, 128.0, 70.0, 36.0, 27.0, 21.0, 19.0, 7.0, 5.0, 2.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03729248046875, -0.0358123779296875, -0.034332275390625, -0.0328521728515625, -0.0313720703125, -0.0298919677734375, -0.028411865234375, -0.0269317626953125, -0.02545166015625, -0.0239715576171875, -0.022491455078125, -0.0210113525390625, -0.01953125, -0.0180511474609375, -0.016571044921875, -0.0150909423828125, -0.01361083984375, -0.0121307373046875, -0.010650634765625, -0.0091705322265625, -0.0076904296875, -0.0062103271484375, -0.004730224609375, -0.0032501220703125, -0.00177001953125, -0.0002899169921875, 0.001190185546875, 0.0026702880859375, 0.004150390625, 0.0056304931640625, 0.007110595703125, 0.0085906982421875, 0.01007080078125, 0.0115509033203125, 0.013031005859375, 0.0145111083984375, 0.0159912109375, 0.0174713134765625, 0.018951416015625, 0.0204315185546875, 0.02191162109375, 0.0233917236328125, 0.024871826171875, 0.0263519287109375, 0.02783203125, 0.0293121337890625, 0.030792236328125, 0.0322723388671875, 0.03375244140625, 0.0352325439453125, 0.036712646484375, 0.0381927490234375, 0.0396728515625, 0.0411529541015625, 0.042633056640625, 0.0441131591796875, 0.04559326171875, 0.0470733642578125, 0.048553466796875, 0.0500335693359375, 0.051513671875, 0.0529937744140625, 0.054473876953125, 0.0559539794921875, 0.05743408203125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 10.0, 39.0, 260.0, 492.0, 151.0, 45.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3368317484855652, -0.314841091632843, -0.29285046458244324, -0.27085983753204346, -0.2488691806793213, -0.22687853872776031, -0.20488789677619934, -0.18289725482463837, -0.1609066128730774, -0.13891597092151642, -0.11692532896995544, -0.09493468701839447, -0.0729440450668335, -0.05095340311527252, -0.028962761163711548, -0.006972119212150574, 0.0150185227394104, 0.037009164690971375, 0.05899980664253235, 0.08099044859409332, 0.1029810905456543, 0.12497173249721527, 0.14696237444877625, 0.16895301640033722, 0.1909436583518982, 0.21293430030345917, 0.23492494225502014, 0.2569155693054199, 0.2789062261581421, 0.30089688301086426, 0.32288751006126404, 0.3448781371116638, 0.36686885356903076, 0.38885951042175293, 0.4108501374721527, 0.4328407645225525, 0.45483142137527466, 0.4768220782279968, 0.4988127052783966, 0.5208033323287964, 0.5427939891815186, 0.5647846460342407, 0.5867753028869629, 0.6087659001350403, 0.6307565569877625, 0.6527472138404846, 0.674737811088562, 0.6967284679412842, 0.7187191247940063, 0.7407097816467285, 0.7627004384994507, 0.7846910357475281, 0.8066816926002502, 0.8286723494529724, 0.8506629467010498, 0.872653603553772, 0.8946442604064941, 0.9166349172592163, 0.9386255741119385, 0.9606161713600159, 0.982606828212738, 1.0045974254608154, 1.0265880823135376, 1.0485787391662598, 1.070569396018982]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 3.0, 10.0, 11.0, 17.0, 14.0, 18.0, 20.0, 27.0, 29.0, 28.0, 34.0, 41.0, 46.0, 46.0, 38.0, 40.0, 35.0, 49.0, 45.0, 55.0, 40.0, 32.0, 39.0, 32.0, 26.0, 36.0, 28.0, 21.0, 17.0, 10.0, 21.0, 17.0, 6.0, 12.0, 10.0, 4.0, 5.0, 2.0, 7.0, 2.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10927140712738037, -0.10571034252643585, -0.10214927047491074, -0.09858820587396622, -0.0950271338224411, -0.09146606922149658, -0.08790500462055206, -0.08434394001960754, -0.08078286796808243, -0.07722180336713791, -0.07366073131561279, -0.07009966671466827, -0.06653860211372375, -0.06297753006219864, -0.05941646546125412, -0.0558553971350193, -0.052294328808784485, -0.04873326048254967, -0.04517219215631485, -0.04161112755537033, -0.03805005922913551, -0.034488990902900696, -0.030927924439311028, -0.02736685797572136, -0.023805789649486542, -0.020244721323251724, -0.016683654859662056, -0.013122587464749813, -0.00956152006983757, -0.006000451743602753, -0.0024393852800130844, 0.0011216811835765839, 0.004682749509811401, 0.008243816904723644, 0.011804884299635887, 0.01536595169454813, 0.018927019089460373, 0.02248808741569519, 0.02604915387928486, 0.029610220342874527, 0.033171288669109344, 0.03673235699534416, 0.04029342532157898, 0.0438544899225235, 0.047415558248758316, 0.050976626574993134, 0.05453769117593765, 0.05809875950217247, 0.06165982782840729, 0.0652208924293518, 0.06878196448087692, 0.07234302908182144, 0.07590410113334656, 0.07946516573429108, 0.0830262303352356, 0.08658729493618011, 0.09014836698770523, 0.09370943158864975, 0.09727050364017487, 0.10083156824111938, 0.1043926328420639, 0.10795370489358902, 0.11151476949453354, 0.11507584154605865, 0.11863690614700317]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 11.0, 18.0, 12.0, 45.0, 76.0, 116.0, 195.0, 377.0, 722.0, 1807.0, 4766.0, 16212.0, 90575.0, 669365.0, 222942.0, 29224.0, 7425.0, 2499.0, 1046.0, 478.0, 256.0, 156.0, 87.0, 47.0, 42.0, 25.0, 10.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1844482421875, -0.17897415161132812, -0.17350006103515625, -0.16802597045898438, -0.1625518798828125, -0.15707778930664062, -0.15160369873046875, -0.14612960815429688, -0.140655517578125, -0.13518142700195312, -0.12970733642578125, -0.12423324584960938, -0.1187591552734375, -0.11328506469726562, -0.10781097412109375, -0.10233688354492188, -0.09686279296875, -0.09138870239257812, -0.08591461181640625, -0.08044052124023438, -0.0749664306640625, -0.06949234008789062, -0.06401824951171875, -0.058544158935546875, -0.053070068359375, -0.047595977783203125, -0.04212188720703125, -0.036647796630859375, -0.0311737060546875, -0.025699615478515625, -0.02022552490234375, -0.014751434326171875, -0.00927734375, -0.003803253173828125, 0.00167083740234375, 0.007144927978515625, 0.0126190185546875, 0.018093109130859375, 0.02356719970703125, 0.029041290283203125, 0.034515380859375, 0.039989471435546875, 0.04546356201171875, 0.050937652587890625, 0.0564117431640625, 0.061885833740234375, 0.06735992431640625, 0.07283401489257812, 0.07830810546875, 0.08378219604492188, 0.08925628662109375, 0.09473037719726562, 0.1002044677734375, 0.10567855834960938, 0.11115264892578125, 0.11662673950195312, 0.122100830078125, 0.12757492065429688, 0.13304901123046875, 0.13852310180664062, 0.1439971923828125, 0.14947128295898438, 0.15494537353515625, 0.16041946411132812, 0.1658935546875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 11.0, 9.0, 14.0, 11.0, 8.0, 14.0, 14.0, 20.0, 19.0, 28.0, 38.0, 26.0, 36.0, 46.0, 69.0, 46.0, 51.0, 50.0, 49.0, 53.0, 43.0, 43.0, 33.0, 45.0, 31.0, 24.0, 23.0, 26.0, 18.0, 19.0, 8.0, 14.0, 10.0, 7.0, 13.0, 11.0, 2.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03692626953125, -0.035797119140625, -0.03466796875, -0.033538818359375, -0.03240966796875, -0.031280517578125, -0.0301513671875, -0.029022216796875, -0.02789306640625, -0.026763916015625, -0.025634765625, -0.024505615234375, -0.02337646484375, -0.022247314453125, -0.0211181640625, -0.019989013671875, -0.01885986328125, -0.017730712890625, -0.0166015625, -0.015472412109375, -0.01434326171875, -0.013214111328125, -0.0120849609375, -0.010955810546875, -0.00982666015625, -0.008697509765625, -0.007568359375, -0.006439208984375, -0.00531005859375, -0.004180908203125, -0.0030517578125, -0.001922607421875, -0.00079345703125, 0.000335693359375, 0.00146484375, 0.002593994140625, 0.00372314453125, 0.004852294921875, 0.0059814453125, 0.007110595703125, 0.00823974609375, 0.009368896484375, 0.010498046875, 0.011627197265625, 0.01275634765625, 0.013885498046875, 0.0150146484375, 0.016143798828125, 0.01727294921875, 0.018402099609375, 0.01953125, 0.020660400390625, 0.02178955078125, 0.022918701171875, 0.0240478515625, 0.025177001953125, 0.02630615234375, 0.027435302734375, 0.028564453125, 0.029693603515625, 0.03082275390625, 0.031951904296875, 0.0330810546875, 0.034210205078125, 0.03533935546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 11.0, 8.0, 11.0, 13.0, 7.0, 16.0, 16.0, 25.0, 25.0, 23.0, 30.0, 28.0, 51.0, 62.0, 119.0, 225.0, 807.0, 5708.0, 204713.0, 806302.0, 27645.0, 1750.0, 373.0, 172.0, 97.0, 52.0, 46.0, 40.0, 33.0, 23.0, 21.0, 19.0, 11.0, 9.0, 16.0, 9.0, 11.0, 1.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.226318359375, -0.2195110321044922, -0.21270370483398438, -0.20589637756347656, -0.19908905029296875, -0.19228172302246094, -0.18547439575195312, -0.1786670684814453, -0.1718597412109375, -0.1650524139404297, -0.15824508666992188, -0.15143775939941406, -0.14463043212890625, -0.13782310485839844, -0.13101577758789062, -0.12420845031738281, -0.117401123046875, -0.11059379577636719, -0.10378646850585938, -0.09697914123535156, -0.09017181396484375, -0.08336448669433594, -0.07655715942382812, -0.06974983215332031, -0.0629425048828125, -0.05613517761230469, -0.049327850341796875, -0.04252052307128906, -0.03571319580078125, -0.028905868530273438, -0.022098541259765625, -0.015291213989257812, -0.00848388671875, -0.0016765594482421875, 0.005130767822265625, 0.011938095092773438, 0.01874542236328125, 0.025552749633789062, 0.032360076904296875, 0.03916740417480469, 0.0459747314453125, 0.05278205871582031, 0.059589385986328125, 0.06639671325683594, 0.07320404052734375, 0.08001136779785156, 0.08681869506835938, 0.09362602233886719, 0.100433349609375, 0.10724067687988281, 0.11404800415039062, 0.12085533142089844, 0.12766265869140625, 0.13446998596191406, 0.14127731323242188, 0.1480846405029297, 0.1548919677734375, 0.1616992950439453, 0.16850662231445312, 0.17531394958496094, 0.18212127685546875, 0.18892860412597656, 0.19573593139648438, 0.2025432586669922, 0.2093505859375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 6.0, 9.0, 8.0, 8.0, 30.0, 22.0, 29.0, 32.0, 36.0, 29.0, 32.0, 52.0, 46.0, 40.0, 48.0, 56.0, 51.0, 43.0, 47.0, 47.0, 46.0, 42.0, 50.0, 25.0, 33.0, 26.0, 26.0, 17.0, 17.0, 13.0, 7.0, 9.0, 2.0, 2.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08306884765625, -0.08063697814941406, -0.07820510864257812, -0.07577323913574219, -0.07334136962890625, -0.07090950012207031, -0.06847763061523438, -0.06604576110839844, -0.0636138916015625, -0.06118202209472656, -0.058750152587890625, -0.05631828308105469, -0.05388641357421875, -0.05145454406738281, -0.049022674560546875, -0.04659080505371094, -0.044158935546875, -0.04172706604003906, -0.039295196533203125, -0.03686332702636719, -0.03443145751953125, -0.03199958801269531, -0.029567718505859375, -0.027135848999023438, -0.0247039794921875, -0.022272109985351562, -0.019840240478515625, -0.017408370971679688, -0.01497650146484375, -0.012544631958007812, -0.010112762451171875, -0.0076808929443359375, -0.0052490234375, -0.0028171539306640625, -0.000385284423828125, 0.0020465850830078125, 0.00447845458984375, 0.0069103240966796875, 0.009342193603515625, 0.011774063110351562, 0.0142059326171875, 0.016637802124023438, 0.019069671630859375, 0.021501541137695312, 0.02393341064453125, 0.026365280151367188, 0.028797149658203125, 0.031229019165039062, 0.033660888671875, 0.03609275817871094, 0.038524627685546875, 0.04095649719238281, 0.04338836669921875, 0.04582023620605469, 0.048252105712890625, 0.05068397521972656, 0.0531158447265625, 0.05554771423339844, 0.057979583740234375, 0.06041145324707031, 0.06284332275390625, 0.06527519226074219, 0.06770706176757812, 0.07013893127441406, 0.07257080078125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 8.0, 6.0, 15.0, 26.0, 35.0, 68.0, 121.0, 216.0, 382.0, 676.0, 1332.0, 2773.0, 6607.0, 19841.0, 87252.0, 481732.0, 359943.0, 61747.0, 15584.0, 5338.0, 2380.0, 1111.0, 583.0, 328.0, 186.0, 104.0, 53.0, 39.0, 24.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030975341796875, -0.029903411865234375, -0.02883148193359375, -0.027759552001953125, -0.0266876220703125, -0.025615692138671875, -0.02454376220703125, -0.023471832275390625, -0.02239990234375, -0.021327972412109375, -0.02025604248046875, -0.019184112548828125, -0.0181121826171875, -0.017040252685546875, -0.01596832275390625, -0.014896392822265625, -0.013824462890625, -0.012752532958984375, -0.01168060302734375, -0.010608673095703125, -0.0095367431640625, -0.008464813232421875, -0.00739288330078125, -0.006320953369140625, -0.0052490234375, -0.004177093505859375, -0.00310516357421875, -0.002033233642578125, -0.0009613037109375, 0.000110626220703125, 0.00118255615234375, 0.002254486083984375, 0.003326416015625, 0.004398345947265625, 0.00547027587890625, 0.006542205810546875, 0.0076141357421875, 0.008686065673828125, 0.00975799560546875, 0.010829925537109375, 0.01190185546875, 0.012973785400390625, 0.01404571533203125, 0.015117645263671875, 0.0161895751953125, 0.017261505126953125, 0.01833343505859375, 0.019405364990234375, 0.020477294921875, 0.021549224853515625, 0.02262115478515625, 0.023693084716796875, 0.0247650146484375, 0.025836944580078125, 0.02690887451171875, 0.027980804443359375, 0.029052734375, 0.030124664306640625, 0.03119659423828125, 0.032268524169921875, 0.0333404541015625, 0.034412384033203125, 0.03548431396484375, 0.036556243896484375, 0.037628173828125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 9.0, 9.0, 7.0, 10.0, 14.0, 16.0, 12.0, 14.0, 30.0, 31.0, 34.0, 57.0, 52.0, 59.0, 72.0, 70.0, 68.0, 67.0, 61.0, 59.0, 36.0, 43.0, 35.0, 25.0, 17.0, 14.0, 14.0, 13.0, 5.0, 9.0, 3.0, 8.0, 7.0, 7.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3887882232666016e-05, -1.3440847396850586e-05, -1.2993812561035156e-05, -1.2546777725219727e-05, -1.2099742889404297e-05, -1.1652708053588867e-05, -1.1205673217773438e-05, -1.0758638381958008e-05, -1.0311603546142578e-05, -9.864568710327148e-06, -9.417533874511719e-06, -8.970499038696289e-06, -8.52346420288086e-06, -8.07642936706543e-06, -7.62939453125e-06, -7.18235969543457e-06, -6.735324859619141e-06, -6.288290023803711e-06, -5.841255187988281e-06, -5.3942203521728516e-06, -4.947185516357422e-06, -4.500150680541992e-06, -4.0531158447265625e-06, -3.606081008911133e-06, -3.159046173095703e-06, -2.7120113372802734e-06, -2.2649765014648438e-06, -1.817941665649414e-06, -1.3709068298339844e-06, -9.238719940185547e-07, -4.76837158203125e-07, -2.9802322387695312e-08, 4.172325134277344e-07, 8.642673492431641e-07, 1.3113021850585938e-06, 1.7583370208740234e-06, 2.205371856689453e-06, 2.652406692504883e-06, 3.0994415283203125e-06, 3.546476364135742e-06, 3.993511199951172e-06, 4.4405460357666016e-06, 4.887580871582031e-06, 5.334615707397461e-06, 5.781650543212891e-06, 6.22868537902832e-06, 6.67572021484375e-06, 7.12275505065918e-06, 7.569789886474609e-06, 8.016824722290039e-06, 8.463859558105469e-06, 8.910894393920898e-06, 9.357929229736328e-06, 9.804964065551758e-06, 1.0251998901367188e-05, 1.0699033737182617e-05, 1.1146068572998047e-05, 1.1593103408813477e-05, 1.2040138244628906e-05, 1.2487173080444336e-05, 1.2934207916259766e-05, 1.3381242752075195e-05, 1.3828277587890625e-05, 1.4275312423706055e-05, 1.4722347259521484e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 3.0, 7.0, 16.0, 14.0, 18.0, 26.0, 39.0, 43.0, 79.0, 160.0, 488.0, 4207.0, 159915.0, 852133.0, 29446.0, 1410.0, 237.0, 107.0, 55.0, 37.0, 24.0, 24.0, 18.0, 10.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0723876953125, -0.07039308547973633, -0.06839847564697266, -0.06640386581420898, -0.06440925598144531, -0.06241464614868164, -0.06042003631591797, -0.0584254264831543, -0.056430816650390625, -0.05443620681762695, -0.05244159698486328, -0.05044698715209961, -0.04845237731933594, -0.046457767486572266, -0.044463157653808594, -0.04246854782104492, -0.04047393798828125, -0.03847932815551758, -0.036484718322753906, -0.034490108489990234, -0.03249549865722656, -0.03050088882446289, -0.02850627899169922, -0.026511669158935547, -0.024517059326171875, -0.022522449493408203, -0.02052783966064453, -0.01853322982788086, -0.016538619995117188, -0.014544010162353516, -0.012549400329589844, -0.010554790496826172, -0.0085601806640625, -0.006565570831298828, -0.004570960998535156, -0.0025763511657714844, -0.0005817413330078125, 0.0014128684997558594, 0.0034074783325195312, 0.005402088165283203, 0.007396697998046875, 0.009391307830810547, 0.011385917663574219, 0.01338052749633789, 0.015375137329101562, 0.017369747161865234, 0.019364356994628906, 0.021358966827392578, 0.02335357666015625, 0.025348186492919922, 0.027342796325683594, 0.029337406158447266, 0.03133201599121094, 0.03332662582397461, 0.03532123565673828, 0.03731584548950195, 0.039310455322265625, 0.0413050651550293, 0.04329967498779297, 0.04529428482055664, 0.04728889465332031, 0.049283504486083984, 0.051278114318847656, 0.05327272415161133, 0.055267333984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 3.0, 8.0, 17.0, 18.0, 20.0, 25.0, 31.0, 29.0, 48.0, 59.0, 47.0, 76.0, 81.0, 87.0, 67.0, 72.0, 56.0, 52.0, 52.0, 28.0, 29.0, 30.0, 17.0, 11.0, 12.0, 5.0, 6.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.017730712890625, -0.017249584197998047, -0.016768455505371094, -0.01628732681274414, -0.015806198120117188, -0.015325069427490234, -0.014843940734863281, -0.014362812042236328, -0.013881683349609375, -0.013400554656982422, -0.012919425964355469, -0.012438297271728516, -0.011957168579101562, -0.01147603988647461, -0.010994911193847656, -0.010513782501220703, -0.01003265380859375, -0.009551525115966797, -0.009070396423339844, -0.00858926773071289, -0.008108139038085938, -0.007627010345458984, -0.007145881652832031, -0.006664752960205078, -0.006183624267578125, -0.005702495574951172, -0.005221366882324219, -0.004740238189697266, -0.0042591094970703125, -0.0037779808044433594, -0.0032968521118164062, -0.002815723419189453, -0.0023345947265625, -0.0018534660339355469, -0.0013723373413085938, -0.0008912086486816406, -0.0004100799560546875, 7.104873657226562e-05, 0.0005521774291992188, 0.0010333061218261719, 0.001514434814453125, 0.001995563507080078, 0.0024766921997070312, 0.0029578208923339844, 0.0034389495849609375, 0.003920078277587891, 0.004401206970214844, 0.004882335662841797, 0.00536346435546875, 0.005844593048095703, 0.006325721740722656, 0.006806850433349609, 0.0072879791259765625, 0.007769107818603516, 0.008250236511230469, 0.008731365203857422, 0.009212493896484375, 0.009693622589111328, 0.010174751281738281, 0.010655879974365234, 0.011137008666992188, 0.01161813735961914, 0.012099266052246094, 0.012580394744873047, 0.0130615234375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 35.0, 288.0, 518.0, 142.0, 17.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0957276821136475, -1.067823052406311, -1.039918303489685, -1.0120136737823486, -0.9841089248657227, -0.9562042951583862, -0.928299605846405, -0.9003949165344238, -0.8724902272224426, -0.8445855379104614, -0.8166808485984802, -0.788776159286499, -0.7608715295791626, -0.7329667806625366, -0.7050621509552002, -0.677157461643219, -0.6492527723312378, -0.6213480830192566, -0.5934433937072754, -0.5655387043952942, -0.537634015083313, -0.5097293853759766, -0.48182469606399536, -0.45392000675201416, -0.42601531744003296, -0.39811062812805176, -0.37020593881607056, -0.34230127930641174, -0.31439658999443054, -0.28649190068244934, -0.2585872411727905, -0.23068255186080933, -0.20277786254882812, -0.17487317323684692, -0.14696849882602692, -0.11906381696462631, -0.09115913510322571, -0.0632544457912445, -0.0353497713804245, -0.007445096969604492, 0.02045959234237671, 0.04836427420377731, 0.07626895606517792, 0.10417363792657852, 0.13207831978797913, 0.15998300909996033, 0.18788768351078033, 0.21579235792160034, 0.24369704723358154, 0.27160173654556274, 0.29950642585754395, 0.32741108536720276, 0.35531577467918396, 0.38322046399116516, 0.411125123500824, 0.4390298128128052, 0.4669345021247864, 0.4948391914367676, 0.5227438807487488, 0.55064857006073, 0.5785531997680664, 0.6064579486846924, 0.6343625783920288, 0.66226726770401, 0.6901719570159912]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 9.0, 9.0, 11.0, 8.0, 14.0, 9.0, 12.0, 21.0, 16.0, 27.0, 19.0, 30.0, 25.0, 31.0, 26.0, 42.0, 51.0, 42.0, 47.0, 42.0, 36.0, 42.0, 39.0, 37.0, 41.0, 32.0, 36.0, 35.0, 27.0, 20.0, 18.0, 26.0, 15.0, 16.0, 18.0, 11.0, 17.0, 8.0, 3.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0], "bins": [-0.262748122215271, -0.2552414536476135, -0.24773478507995605, -0.24022811651229858, -0.2327214479446411, -0.22521477937698364, -0.21770811080932617, -0.2102014422416687, -0.20269477367401123, -0.19518810510635376, -0.1876814365386963, -0.18017476797103882, -0.17266809940338135, -0.16516143083572388, -0.1576547622680664, -0.15014809370040894, -0.14264141023159027, -0.1351347416639328, -0.12762807309627533, -0.12012140452861786, -0.11261473596096039, -0.10510806739330292, -0.09760139137506485, -0.09009472280740738, -0.08258805423974991, -0.07508138567209244, -0.06757471710443497, -0.0600680448114872, -0.05256137624382973, -0.045054707676172256, -0.03754803538322449, -0.030041366815567017, -0.022534698247909546, -0.0150280287489295, -0.007521359249949455, -1.4688819646835327e-05, 0.007491979748010635, 0.014998648315668106, 0.022505320608615875, 0.030011989176273346, 0.03751865774393082, 0.04502532631158829, 0.05253199487924576, 0.06003866717219353, 0.0675453394651413, 0.07505200803279877, 0.08255867660045624, 0.09006534516811371, 0.09757201373577118, 0.10507868230342865, 0.11258535087108612, 0.12009201943874359, 0.12759868800640106, 0.13510535657405853, 0.1426120400428772, 0.15011870861053467, 0.15762537717819214, 0.1651320457458496, 0.17263871431350708, 0.18014538288116455, 0.18765205144882202, 0.1951587200164795, 0.20266538858413696, 0.21017205715179443, 0.2176787257194519]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 9.0, 11.0, 17.0, 29.0, 46.0, 50.0, 68.0, 111.0, 167.0, 231.0, 351.0, 637.0, 1271.0, 3239.0, 14912.0, 434914.0, 3637741.0, 88037.0, 7914.0, 2148.0, 868.0, 516.0, 343.0, 194.0, 126.0, 98.0, 63.0, 47.0, 34.0, 23.0, 18.0, 16.0, 10.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.1851806640625, -0.18069839477539062, -0.17621612548828125, -0.17173385620117188, -0.1672515869140625, -0.16276931762695312, -0.15828704833984375, -0.15380477905273438, -0.149322509765625, -0.14484024047851562, -0.14035797119140625, -0.13587570190429688, -0.1313934326171875, -0.12691116333007812, -0.12242889404296875, -0.11794662475585938, -0.11346435546875, -0.10898208618164062, -0.10449981689453125, -0.10001754760742188, -0.0955352783203125, -0.09105300903320312, -0.08657073974609375, -0.08208847045898438, -0.077606201171875, -0.07312393188476562, -0.06864166259765625, -0.06415939331054688, -0.0596771240234375, -0.055194854736328125, -0.05071258544921875, -0.046230316162109375, -0.041748046875, -0.037265777587890625, -0.03278350830078125, -0.028301239013671875, -0.0238189697265625, -0.019336700439453125, -0.01485443115234375, -0.010372161865234375, -0.005889892578125, -0.001407623291015625, 0.00307464599609375, 0.007556915283203125, 0.0120391845703125, 0.016521453857421875, 0.02100372314453125, 0.025485992431640625, 0.02996826171875, 0.034450531005859375, 0.03893280029296875, 0.043415069580078125, 0.0478973388671875, 0.052379608154296875, 0.05686187744140625, 0.061344146728515625, 0.065826416015625, 0.07030868530273438, 0.07479095458984375, 0.07927322387695312, 0.0837554931640625, 0.08823776245117188, 0.09272003173828125, 0.09720230102539062, 0.1016845703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 9.0, 6.0, 13.0, 7.0, 17.0, 21.0, 12.0, 22.0, 23.0, 24.0, 43.0, 39.0, 36.0, 53.0, 53.0, 68.0, 61.0, 49.0, 51.0, 45.0, 33.0, 37.0, 50.0, 29.0, 32.0, 26.0, 26.0, 13.0, 20.0, 18.0, 14.0, 7.0, 8.0, 5.0, 6.0, 4.0, 7.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04052734375, -0.03939962387084961, -0.03827190399169922, -0.03714418411254883, -0.03601646423339844, -0.03488874435424805, -0.033761024475097656, -0.032633304595947266, -0.031505584716796875, -0.030377864837646484, -0.029250144958496094, -0.028122425079345703, -0.026994705200195312, -0.025866985321044922, -0.02473926544189453, -0.02361154556274414, -0.02248382568359375, -0.02135610580444336, -0.02022838592529297, -0.019100666046142578, -0.017972946166992188, -0.016845226287841797, -0.015717506408691406, -0.014589786529541016, -0.013462066650390625, -0.012334346771240234, -0.011206626892089844, -0.010078907012939453, -0.008951187133789062, -0.007823467254638672, -0.006695747375488281, -0.005568027496337891, -0.0044403076171875, -0.0033125877380371094, -0.0021848678588867188, -0.0010571479797363281, 7.05718994140625e-05, 0.0011982917785644531, 0.0023260116577148438, 0.0034537315368652344, 0.004581451416015625, 0.005709171295166016, 0.006836891174316406, 0.007964611053466797, 0.009092330932617188, 0.010220050811767578, 0.011347770690917969, 0.01247549057006836, 0.01360321044921875, 0.01473093032836914, 0.01585865020751953, 0.016986370086669922, 0.018114089965820312, 0.019241809844970703, 0.020369529724121094, 0.021497249603271484, 0.022624969482421875, 0.023752689361572266, 0.024880409240722656, 0.026008129119873047, 0.027135848999023438, 0.028263568878173828, 0.02939128875732422, 0.03051900863647461, 0.031646728515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 13.0, 11.0, 20.0, 16.0, 39.0, 41.0, 90.0, 133.0, 227.0, 371.0, 762.0, 1775.0, 6799.0, 44816.0, 526271.0, 3007260.0, 547731.0, 47142.0, 7117.0, 1978.0, 746.0, 383.0, 199.0, 145.0, 62.0, 32.0, 35.0, 15.0, 17.0, 12.0, 3.0, 5.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1004638671875, -0.09705924987792969, -0.09365463256835938, -0.09025001525878906, -0.08684539794921875, -0.08344078063964844, -0.08003616333007812, -0.07663154602050781, -0.0732269287109375, -0.06982231140136719, -0.06641769409179688, -0.06301307678222656, -0.05960845947265625, -0.05620384216308594, -0.052799224853515625, -0.04939460754394531, -0.045989990234375, -0.04258537292480469, -0.039180755615234375, -0.03577613830566406, -0.03237152099609375, -0.028966903686523438, -0.025562286376953125, -0.022157669067382812, -0.0187530517578125, -0.015348434448242188, -0.011943817138671875, -0.008539199829101562, -0.00513458251953125, -0.0017299652099609375, 0.001674652099609375, 0.0050792694091796875, 0.00848388671875, 0.011888504028320312, 0.015293121337890625, 0.018697738647460938, 0.02210235595703125, 0.025506973266601562, 0.028911590576171875, 0.03231620788574219, 0.0357208251953125, 0.03912544250488281, 0.042530059814453125, 0.04593467712402344, 0.04933929443359375, 0.05274391174316406, 0.056148529052734375, 0.05955314636230469, 0.062957763671875, 0.06636238098144531, 0.06976699829101562, 0.07317161560058594, 0.07657623291015625, 0.07998085021972656, 0.08338546752929688, 0.08679008483886719, 0.0901947021484375, 0.09359931945800781, 0.09700393676757812, 0.10040855407714844, 0.10381317138671875, 0.10721778869628906, 0.11062240600585938, 0.11402702331542969, 0.117431640625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 12.0, 13.0, 10.0, 20.0, 22.0, 49.0, 48.0, 71.0, 110.0, 155.0, 213.0, 291.0, 404.0, 557.0, 628.0, 409.0, 292.0, 230.0, 186.0, 107.0, 71.0, 52.0, 37.0, 22.0, 27.0, 11.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.057373046875, -0.05578899383544922, -0.05420494079589844, -0.052620887756347656, -0.051036834716796875, -0.049452781677246094, -0.04786872863769531, -0.04628467559814453, -0.04470062255859375, -0.04311656951904297, -0.04153251647949219, -0.039948463439941406, -0.038364410400390625, -0.036780357360839844, -0.03519630432128906, -0.03361225128173828, -0.0320281982421875, -0.03044414520263672, -0.028860092163085938, -0.027276039123535156, -0.025691986083984375, -0.024107933044433594, -0.022523880004882812, -0.02093982696533203, -0.01935577392578125, -0.01777172088623047, -0.016187667846679688, -0.014603614807128906, -0.013019561767578125, -0.011435508728027344, -0.009851455688476562, -0.008267402648925781, -0.006683349609375, -0.005099296569824219, -0.0035152435302734375, -0.0019311904907226562, -0.000347137451171875, 0.0012369155883789062, 0.0028209686279296875, 0.004405021667480469, 0.00598907470703125, 0.007573127746582031, 0.009157180786132812, 0.010741233825683594, 0.012325286865234375, 0.013909339904785156, 0.015493392944335938, 0.01707744598388672, 0.0186614990234375, 0.02024555206298828, 0.021829605102539062, 0.023413658142089844, 0.024997711181640625, 0.026581764221191406, 0.028165817260742188, 0.02974987030029297, 0.03133392333984375, 0.03291797637939453, 0.03450202941894531, 0.036086082458496094, 0.037670135498046875, 0.039254188537597656, 0.04083824157714844, 0.04242229461669922, 0.04400634765625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 7.0, 11.0, 39.0, 183.0, 420.0, 267.0, 67.0, 17.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19105690717697144, -0.16678118705749512, -0.14250548183918, -0.11822976917028427, -0.09395405650138855, -0.06967834383249283, -0.04540263116359711, -0.021126925945281982, 0.003148794174194336, 0.027424506843090057, 0.05170021951198578, 0.0759759321808815, 0.10025164484977722, 0.12452735751867294, 0.14880307018756866, 0.1730787754058838, 0.1973544955253601, 0.22163021564483643, 0.24590592086315155, 0.2701816260814667, 0.294457346200943, 0.3187330663204193, 0.34300875663757324, 0.36728447675704956, 0.3915601968765259, 0.4158359169960022, 0.4401116371154785, 0.46438732743263245, 0.48866304755210876, 0.5129387378692627, 0.537214457988739, 0.5614901781082153, 0.5857658386230469, 0.6100415587425232, 0.6343172788619995, 0.6585929989814758, 0.6828687191009521, 0.7071443796157837, 0.73142009973526, 0.7556958198547363, 0.7799715399742126, 0.804247260093689, 0.8285229802131653, 0.8527987003326416, 0.8770743608474731, 0.9013500809669495, 0.9256258010864258, 0.9499015212059021, 0.9741772413253784, 0.9984529614448547, 1.022728681564331, 1.0470043420791626, 1.0712801218032837, 1.0955557823181152, 1.1198315620422363, 1.1441072225570679, 1.1683828830718994, 1.192658543586731, 1.216934323310852, 1.2412099838256836, 1.2654857635498047, 1.2897614240646362, 1.3140372037887573, 1.3383128643035889, 1.36258864402771]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 8.0, 11.0, 11.0, 14.0, 13.0, 19.0, 20.0, 24.0, 29.0, 43.0, 41.0, 38.0, 41.0, 33.0, 50.0, 44.0, 47.0, 40.0, 44.0, 46.0, 49.0, 34.0, 39.0, 25.0, 31.0, 42.0, 30.0, 27.0, 22.0, 16.0, 16.0, 18.0, 9.0, 5.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16983050107955933, -0.16446751356124878, -0.15910452604293823, -0.15374153852462769, -0.14837855100631714, -0.1430155485868454, -0.13765256106853485, -0.1322895735502243, -0.12692658603191376, -0.12156359851360321, -0.11620061099529266, -0.11083761602640152, -0.10547462850809097, -0.10011164098978043, -0.09474864602088928, -0.08938565850257874, -0.08402267098426819, -0.07865968346595764, -0.0732966959476471, -0.06793370097875595, -0.0625707134604454, -0.05720772594213486, -0.05184473469853401, -0.046481743454933167, -0.04111875593662262, -0.03575576841831207, -0.030392777174711227, -0.02502978779375553, -0.019666798412799835, -0.014303809031844139, -0.008940819650888443, -0.0035778284072875977, 0.0017851591110229492, 0.007148148491978645, 0.012511137872934341, 0.017874127253890038, 0.023237116634845734, 0.02860010601580143, 0.033963095396757126, 0.03932608664035797, 0.04468907415866852, 0.050052061676979065, 0.05541505292057991, 0.060778044164180756, 0.0661410316824913, 0.07150401920080185, 0.076867014169693, 0.08223000168800354, 0.08759298920631409, 0.09295597672462463, 0.09831896424293518, 0.10368195921182632, 0.10904494673013687, 0.11440793424844742, 0.11977092921733856, 0.1251339167356491, 0.13049690425395966, 0.1358598917722702, 0.14122287929058075, 0.1465858668088913, 0.15194886922836304, 0.15731185674667358, 0.16267484426498413, 0.16803783178329468, 0.17340081930160522]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 3.0, 6.0, 8.0, 10.0, 5.0, 21.0, 29.0, 39.0, 67.0, 80.0, 151.0, 231.0, 463.0, 1014.0, 2028.0, 4058.0, 9154.0, 22253.0, 69781.0, 289077.0, 455123.0, 133379.0, 36622.0, 13487.0, 5848.0, 2769.0, 1314.0, 644.0, 336.0, 192.0, 117.0, 78.0, 49.0, 28.0, 24.0, 13.0, 6.0, 10.0, 8.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.11053466796875, -0.10710525512695312, -0.10367584228515625, -0.10024642944335938, -0.0968170166015625, -0.09338760375976562, -0.08995819091796875, -0.08652877807617188, -0.083099365234375, -0.07966995239257812, -0.07624053955078125, -0.07281112670898438, -0.0693817138671875, -0.06595230102539062, -0.06252288818359375, -0.059093475341796875, -0.0556640625, -0.052234649658203125, -0.04880523681640625, -0.045375823974609375, -0.0419464111328125, -0.038516998291015625, -0.03508758544921875, -0.031658172607421875, -0.028228759765625, -0.024799346923828125, -0.02136993408203125, -0.017940521240234375, -0.0145111083984375, -0.011081695556640625, -0.00765228271484375, -0.004222869873046875, -0.00079345703125, 0.002635955810546875, 0.00606536865234375, 0.009494781494140625, 0.0129241943359375, 0.016353607177734375, 0.01978302001953125, 0.023212432861328125, 0.026641845703125, 0.030071258544921875, 0.03350067138671875, 0.036930084228515625, 0.0403594970703125, 0.043788909912109375, 0.04721832275390625, 0.050647735595703125, 0.0540771484375, 0.057506561279296875, 0.06093597412109375, 0.06436538696289062, 0.0677947998046875, 0.07122421264648438, 0.07465362548828125, 0.07808303833007812, 0.081512451171875, 0.08494186401367188, 0.08837127685546875, 0.09180068969726562, 0.0952301025390625, 0.09865951538085938, 0.10208892822265625, 0.10551834106445312, 0.10894775390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 9.0, 8.0, 10.0, 21.0, 26.0, 21.0, 15.0, 34.0, 29.0, 45.0, 50.0, 74.0, 63.0, 56.0, 62.0, 58.0, 52.0, 50.0, 55.0, 36.0, 34.0, 31.0, 33.0, 19.0, 22.0, 14.0, 14.0, 10.0, 8.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0419921875, -0.0407414436340332, -0.039490699768066406, -0.03823995590209961, -0.03698921203613281, -0.035738468170166016, -0.03448772430419922, -0.03323698043823242, -0.031986236572265625, -0.030735492706298828, -0.02948474884033203, -0.028234004974365234, -0.026983261108398438, -0.02573251724243164, -0.024481773376464844, -0.023231029510498047, -0.02198028564453125, -0.020729541778564453, -0.019478797912597656, -0.01822805404663086, -0.016977310180664062, -0.015726566314697266, -0.014475822448730469, -0.013225078582763672, -0.011974334716796875, -0.010723590850830078, -0.009472846984863281, -0.008222103118896484, -0.0069713592529296875, -0.005720615386962891, -0.004469871520996094, -0.003219127655029297, -0.0019683837890625, -0.0007176399230957031, 0.0005331039428710938, 0.0017838478088378906, 0.0030345916748046875, 0.004285335540771484, 0.005536079406738281, 0.006786823272705078, 0.008037567138671875, 0.009288311004638672, 0.010539054870605469, 0.011789798736572266, 0.013040542602539062, 0.01429128646850586, 0.015542030334472656, 0.016792774200439453, 0.01804351806640625, 0.019294261932373047, 0.020545005798339844, 0.02179574966430664, 0.023046493530273438, 0.024297237396240234, 0.02554798126220703, 0.026798725128173828, 0.028049468994140625, 0.029300212860107422, 0.03055095672607422, 0.031801700592041016, 0.03305244445800781, 0.03430318832397461, 0.035553932189941406, 0.0368046760559082, 0.038055419921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 8.0, 5.0, 8.0, 13.0, 16.0, 15.0, 22.0, 24.0, 33.0, 31.0, 61.0, 87.0, 159.0, 295.0, 714.0, 2356.0, 8325.0, 36680.0, 315039.0, 586801.0, 77761.0, 14192.0, 3767.0, 1132.0, 409.0, 199.0, 124.0, 75.0, 46.0, 34.0, 24.0, 19.0, 14.0, 16.0, 8.0, 8.0, 9.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15234375, -0.147125244140625, -0.14190673828125, -0.136688232421875, -0.1314697265625, -0.126251220703125, -0.12103271484375, -0.115814208984375, -0.110595703125, -0.105377197265625, -0.10015869140625, -0.094940185546875, -0.0897216796875, -0.084503173828125, -0.07928466796875, -0.074066162109375, -0.06884765625, -0.063629150390625, -0.05841064453125, -0.053192138671875, -0.0479736328125, -0.042755126953125, -0.03753662109375, -0.032318115234375, -0.027099609375, -0.021881103515625, -0.01666259765625, -0.011444091796875, -0.0062255859375, -0.001007080078125, 0.00421142578125, 0.009429931640625, 0.0146484375, 0.019866943359375, 0.02508544921875, 0.030303955078125, 0.0355224609375, 0.040740966796875, 0.04595947265625, 0.051177978515625, 0.056396484375, 0.061614990234375, 0.06683349609375, 0.072052001953125, 0.0772705078125, 0.082489013671875, 0.08770751953125, 0.092926025390625, 0.09814453125, 0.103363037109375, 0.10858154296875, 0.113800048828125, 0.1190185546875, 0.124237060546875, 0.12945556640625, 0.134674072265625, 0.139892578125, 0.145111083984375, 0.15032958984375, 0.155548095703125, 0.1607666015625, 0.165985107421875, 0.17120361328125, 0.176422119140625, 0.181640625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 9.0, 9.0, 4.0, 15.0, 10.0, 11.0, 12.0, 22.0, 27.0, 11.0, 31.0, 34.0, 34.0, 44.0, 41.0, 56.0, 32.0, 29.0, 41.0, 39.0, 39.0, 43.0, 43.0, 51.0, 32.0, 30.0, 40.0, 25.0, 20.0, 22.0, 19.0, 18.0, 10.0, 16.0, 17.0, 13.0, 10.0, 7.0, 12.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.0743408203125, -0.07210731506347656, -0.06987380981445312, -0.06764030456542969, -0.06540679931640625, -0.06317329406738281, -0.060939788818359375, -0.05870628356933594, -0.0564727783203125, -0.05423927307128906, -0.052005767822265625, -0.04977226257324219, -0.04753875732421875, -0.04530525207519531, -0.043071746826171875, -0.04083824157714844, -0.038604736328125, -0.03637123107910156, -0.034137725830078125, -0.03190422058105469, -0.02967071533203125, -0.027437210083007812, -0.025203704833984375, -0.022970199584960938, -0.0207366943359375, -0.018503189086914062, -0.016269683837890625, -0.014036178588867188, -0.01180267333984375, -0.009569168090820312, -0.007335662841796875, -0.0051021575927734375, -0.00286865234375, -0.0006351470947265625, 0.001598358154296875, 0.0038318634033203125, 0.00606536865234375, 0.008298873901367188, 0.010532379150390625, 0.012765884399414062, 0.0149993896484375, 0.017232894897460938, 0.019466400146484375, 0.021699905395507812, 0.02393341064453125, 0.026166915893554688, 0.028400421142578125, 0.030633926391601562, 0.032867431640625, 0.03510093688964844, 0.037334442138671875, 0.03956794738769531, 0.04180145263671875, 0.04403495788574219, 0.046268463134765625, 0.04850196838378906, 0.0507354736328125, 0.05296897888183594, 0.055202484130859375, 0.05743598937988281, 0.05966949462890625, 0.06190299987792969, 0.06413650512695312, 0.06637001037597656, 0.068603515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 4.0, 4.0, 11.0, 9.0, 10.0, 15.0, 25.0, 45.0, 78.0, 84.0, 195.0, 338.0, 584.0, 1026.0, 2014.0, 4627.0, 11250.0, 39170.0, 296047.0, 579611.0, 82696.0, 18099.0, 6507.0, 2925.0, 1485.0, 731.0, 392.0, 222.0, 126.0, 80.0, 51.0, 31.0, 25.0, 8.0, 14.0, 2.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.09588623046875, -0.09330940246582031, -0.09073257446289062, -0.08815574645996094, -0.08557891845703125, -0.08300209045410156, -0.08042526245117188, -0.07784843444824219, -0.0752716064453125, -0.07269477844238281, -0.07011795043945312, -0.06754112243652344, -0.06496429443359375, -0.06238746643066406, -0.059810638427734375, -0.05723381042480469, -0.054656982421875, -0.05208015441894531, -0.049503326416015625, -0.04692649841308594, -0.04434967041015625, -0.04177284240722656, -0.039196014404296875, -0.03661918640136719, -0.0340423583984375, -0.03146553039550781, -0.028888702392578125, -0.026311874389648438, -0.02373504638671875, -0.021158218383789062, -0.018581390380859375, -0.016004562377929688, -0.013427734375, -0.010850906372070312, -0.008274078369140625, -0.0056972503662109375, -0.00312042236328125, -0.0005435943603515625, 0.002033233642578125, 0.0046100616455078125, 0.0071868896484375, 0.009763717651367188, 0.012340545654296875, 0.014917373657226562, 0.01749420166015625, 0.020071029663085938, 0.022647857666015625, 0.025224685668945312, 0.027801513671875, 0.030378341674804688, 0.032955169677734375, 0.03553199768066406, 0.03810882568359375, 0.04068565368652344, 0.043262481689453125, 0.04583930969238281, 0.0484161376953125, 0.05099296569824219, 0.053569793701171875, 0.05614662170410156, 0.05872344970703125, 0.06130027770996094, 0.06387710571289062, 0.06645393371582031, 0.06903076171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 7.0, 9.0, 13.0, 22.0, 47.0, 71.0, 84.0, 122.0, 170.0, 133.0, 103.0, 80.0, 56.0, 28.0, 21.0, 12.0, 10.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7087669372558594e-05, -4.5933760702610016e-05, -4.477985203266144e-05, -4.362594336271286e-05, -4.247203469276428e-05, -4.1318126022815704e-05, -4.0164217352867126e-05, -3.901030868291855e-05, -3.785640001296997e-05, -3.670249134302139e-05, -3.5548582673072815e-05, -3.439467400312424e-05, -3.324076533317566e-05, -3.208685666322708e-05, -3.0932947993278503e-05, -2.9779039323329926e-05, -2.8625130653381348e-05, -2.747122198343277e-05, -2.6317313313484192e-05, -2.5163404643535614e-05, -2.4009495973587036e-05, -2.2855587303638458e-05, -2.170167863368988e-05, -2.0547769963741302e-05, -1.9393861293792725e-05, -1.8239952623844147e-05, -1.708604395389557e-05, -1.593213528394699e-05, -1.4778226613998413e-05, -1.3624317944049835e-05, -1.2470409274101257e-05, -1.131650060415268e-05, -1.0162591934204102e-05, -9.008683264255524e-06, -7.854774594306946e-06, -6.700865924358368e-06, -5.54695725440979e-06, -4.393048584461212e-06, -3.2391399145126343e-06, -2.0852312445640564e-06, -9.313225746154785e-07, 2.2258609533309937e-07, 1.3764947652816772e-06, 2.530403435230255e-06, 3.684312105178833e-06, 4.838220775127411e-06, 5.992129445075989e-06, 7.146038115024567e-06, 8.299946784973145e-06, 9.453855454921722e-06, 1.06077641248703e-05, 1.1761672794818878e-05, 1.2915581464767456e-05, 1.4069490134716034e-05, 1.5223398804664612e-05, 1.637730747461319e-05, 1.7531216144561768e-05, 1.8685124814510345e-05, 1.9839033484458923e-05, 2.09929421544075e-05, 2.214685082435608e-05, 2.3300759494304657e-05, 2.4454668164253235e-05, 2.5608576834201813e-05, 2.676248550415039e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 7.0, 8.0, 6.0, 21.0, 30.0, 66.0, 206.0, 743.0, 4271.0, 42220.0, 822281.0, 167389.0, 9401.0, 1389.0, 297.0, 104.0, 50.0, 27.0, 13.0, 5.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.126708984375, -0.122711181640625, -0.11871337890625, -0.114715576171875, -0.1107177734375, -0.106719970703125, -0.10272216796875, -0.098724365234375, -0.0947265625, -0.090728759765625, -0.08673095703125, -0.082733154296875, -0.0787353515625, -0.074737548828125, -0.07073974609375, -0.066741943359375, -0.062744140625, -0.058746337890625, -0.05474853515625, -0.050750732421875, -0.0467529296875, -0.042755126953125, -0.03875732421875, -0.034759521484375, -0.03076171875, -0.026763916015625, -0.02276611328125, -0.018768310546875, -0.0147705078125, -0.010772705078125, -0.00677490234375, -0.002777099609375, 0.001220703125, 0.005218505859375, 0.00921630859375, 0.013214111328125, 0.0172119140625, 0.021209716796875, 0.02520751953125, 0.029205322265625, 0.033203125, 0.037200927734375, 0.04119873046875, 0.045196533203125, 0.0491943359375, 0.053192138671875, 0.05718994140625, 0.061187744140625, 0.065185546875, 0.069183349609375, 0.07318115234375, 0.077178955078125, 0.0811767578125, 0.085174560546875, 0.08917236328125, 0.093170166015625, 0.09716796875, 0.101165771484375, 0.10516357421875, 0.109161376953125, 0.1131591796875, 0.117156982421875, 0.12115478515625, 0.125152587890625, 0.129150390625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 6.0, 2.0, 1.0, 4.0, 8.0, 13.0, 16.0, 34.0, 45.0, 64.0, 94.0, 121.0, 106.0, 136.0, 115.0, 84.0, 54.0, 30.0, 21.0, 17.0, 8.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0552978515625, -0.05375099182128906, -0.052204132080078125, -0.05065727233886719, -0.04911041259765625, -0.04756355285644531, -0.046016693115234375, -0.04446983337402344, -0.0429229736328125, -0.04137611389160156, -0.039829254150390625, -0.03828239440917969, -0.03673553466796875, -0.03518867492675781, -0.033641815185546875, -0.03209495544433594, -0.030548095703125, -0.029001235961914062, -0.027454376220703125, -0.025907516479492188, -0.02436065673828125, -0.022813796997070312, -0.021266937255859375, -0.019720077514648438, -0.0181732177734375, -0.016626358032226562, -0.015079498291015625, -0.013532638549804688, -0.01198577880859375, -0.010438919067382812, -0.008892059326171875, -0.0073451995849609375, -0.00579833984375, -0.0042514801025390625, -0.002704620361328125, -0.0011577606201171875, 0.00038909912109375, 0.0019359588623046875, 0.003482818603515625, 0.0050296783447265625, 0.0065765380859375, 0.008123397827148438, 0.009670257568359375, 0.011217117309570312, 0.01276397705078125, 0.014310836791992188, 0.015857696533203125, 0.017404556274414062, 0.018951416015625, 0.020498275756835938, 0.022045135498046875, 0.023591995239257812, 0.02513885498046875, 0.026685714721679688, 0.028232574462890625, 0.029779434204101562, 0.0313262939453125, 0.03287315368652344, 0.034420013427734375, 0.03596687316894531, 0.03751373291015625, 0.03906059265136719, 0.040607452392578125, 0.04215431213378906, 0.043701171875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 14.0, 20.0, 52.0, 106.0, 195.0, 228.0, 162.0, 118.0, 57.0, 20.0, 9.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21428444981575012, -0.19954802095890045, -0.18481160700321198, -0.1700751781463623, -0.15533876419067383, -0.14060233533382416, -0.1258659064769745, -0.11112948507070541, -0.09639306366443634, -0.08165664225816727, -0.0669202208518982, -0.05218379199504852, -0.03744737058877945, -0.022710949182510376, -0.007974520325660706, 0.006761901080608368, 0.02149832248687744, 0.036234743893146515, 0.05097116902470589, 0.06570759415626526, 0.08044401556253433, 0.0951804369688034, 0.10991686582565308, 0.12465328723192215, 0.13938970863819122, 0.1541261374950409, 0.16886255145072937, 0.18359898030757904, 0.1983354091644287, 0.2130718231201172, 0.22780825197696686, 0.24254468083381653, 0.2572811245918274, 0.27201753854751587, 0.28675398230552673, 0.3014903962612152, 0.3162268102169037, 0.33096325397491455, 0.345699667930603, 0.3604360818862915, 0.37517249584198, 0.38990890979766846, 0.4046453535556793, 0.4193817675113678, 0.4341181814670563, 0.44885462522506714, 0.4635910391807556, 0.4783274531364441, 0.49306389689445496, 0.5078003406524658, 0.5225367546081543, 0.5372731685638428, 0.5520095825195312, 0.5667459964752197, 0.5814824104309082, 0.5962188839912415, 0.6109552979469299, 0.6256917119026184, 0.6404281258583069, 0.6551645994186401, 0.6699010133743286, 0.6846374273300171, 0.6993738412857056, 0.714110255241394, 0.7288466691970825]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 3.0, 6.0, 12.0, 9.0, 4.0, 12.0, 17.0, 17.0, 19.0, 20.0, 22.0, 26.0, 28.0, 29.0, 25.0, 33.0, 34.0, 41.0, 38.0, 34.0, 49.0, 34.0, 34.0, 32.0, 39.0, 32.0, 37.0, 41.0, 35.0, 31.0, 28.0, 29.0, 33.0, 19.0, 15.0, 12.0, 11.0, 16.0, 9.0, 5.0, 7.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.20495587587356567, -0.19831247627735138, -0.1916690617799759, -0.1850256621837616, -0.1783822476863861, -0.17173884809017181, -0.16509544849395752, -0.15845203399658203, -0.15180861949920654, -0.14516521990299225, -0.13852180540561676, -0.13187840580940247, -0.12523499131202698, -0.11859159171581268, -0.11194818466901779, -0.1053047776222229, -0.0986613780260086, -0.09201797097921371, -0.08537456393241882, -0.07873116433620453, -0.07208774983882904, -0.06544435024261475, -0.058800943195819855, -0.05215753614902496, -0.04551412910223007, -0.03887072205543518, -0.03222731500864029, -0.025583911687135696, -0.018940504640340805, -0.012297097593545914, -0.005653694272041321, 0.0009897127747535706, 0.007633119821548462, 0.014276525937020779, 0.020919932052493095, 0.027563337236642838, 0.03420674428343773, 0.04085015133023262, 0.04749355465173721, 0.054136961698532104, 0.060780368745326996, 0.06742377579212189, 0.07406718283891678, 0.08071058988571167, 0.08735398948192596, 0.09399740397930145, 0.10064080357551575, 0.10728421062231064, 0.11392761766910553, 0.12057102471590042, 0.1272144317626953, 0.1338578313589096, 0.1405012458562851, 0.1471446454524994, 0.15378805994987488, 0.16043145954608917, 0.16707485914230347, 0.17371825873851776, 0.18036167323589325, 0.18700507283210754, 0.19364848732948303, 0.20029188692569733, 0.20693528652191162, 0.2135787010192871, 0.2202221155166626]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 4.0, 10.0, 15.0, 21.0, 29.0, 40.0, 46.0, 60.0, 73.0, 115.0, 161.0, 237.0, 377.0, 645.0, 1119.0, 2198.0, 4330.0, 10398.0, 31711.0, 158759.0, 1174488.0, 2233106.0, 471118.0, 71746.0, 19083.0, 7184.0, 3214.0, 1661.0, 872.0, 502.0, 324.0, 179.0, 142.0, 86.0, 47.0, 47.0, 36.0, 21.0, 15.0, 16.0, 8.0, 7.0, 3.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052581787109375, -0.050844669342041016, -0.04910755157470703, -0.04737043380737305, -0.04563331604003906, -0.04389619827270508, -0.042159080505371094, -0.04042196273803711, -0.038684844970703125, -0.03694772720336914, -0.035210609436035156, -0.03347349166870117, -0.03173637390136719, -0.029999256134033203, -0.02826213836669922, -0.026525020599365234, -0.02478790283203125, -0.023050785064697266, -0.02131366729736328, -0.019576549530029297, -0.017839431762695312, -0.016102313995361328, -0.014365196228027344, -0.01262807846069336, -0.010890960693359375, -0.00915384292602539, -0.007416725158691406, -0.005679607391357422, -0.0039424896240234375, -0.002205371856689453, -0.00046825408935546875, 0.0012688636779785156, 0.0030059814453125, 0.004743099212646484, 0.006480216979980469, 0.008217334747314453, 0.009954452514648438, 0.011691570281982422, 0.013428688049316406, 0.01516580581665039, 0.016902923583984375, 0.01864004135131836, 0.020377159118652344, 0.022114276885986328, 0.023851394653320312, 0.025588512420654297, 0.02732563018798828, 0.029062747955322266, 0.03079986572265625, 0.032536983489990234, 0.03427410125732422, 0.0360112190246582, 0.03774833679199219, 0.03948545455932617, 0.041222572326660156, 0.04295969009399414, 0.044696807861328125, 0.04643392562866211, 0.048171043395996094, 0.04990816116333008, 0.05164527893066406, 0.05338239669799805, 0.05511951446533203, 0.056856632232666016, 0.05859375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 3.0, 5.0, 8.0, 7.0, 14.0, 16.0, 24.0, 17.0, 19.0, 25.0, 32.0, 32.0, 44.0, 51.0, 66.0, 73.0, 59.0, 64.0, 72.0, 38.0, 53.0, 43.0, 35.0, 31.0, 41.0, 31.0, 29.0, 15.0, 12.0, 11.0, 12.0, 7.0, 5.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03973388671875, -0.03845643997192383, -0.037178993225097656, -0.035901546478271484, -0.03462409973144531, -0.03334665298461914, -0.03206920623779297, -0.030791759490966797, -0.029514312744140625, -0.028236865997314453, -0.02695941925048828, -0.02568197250366211, -0.024404525756835938, -0.023127079010009766, -0.021849632263183594, -0.020572185516357422, -0.01929473876953125, -0.018017292022705078, -0.016739845275878906, -0.015462398529052734, -0.014184951782226562, -0.01290750503540039, -0.011630058288574219, -0.010352611541748047, -0.009075164794921875, -0.007797718048095703, -0.006520271301269531, -0.005242824554443359, -0.0039653778076171875, -0.0026879310607910156, -0.0014104843139648438, -0.00013303756713867188, 0.0011444091796875, 0.002421855926513672, 0.0036993026733398438, 0.004976749420166016, 0.0062541961669921875, 0.007531642913818359, 0.008809089660644531, 0.010086536407470703, 0.011363983154296875, 0.012641429901123047, 0.013918876647949219, 0.01519632339477539, 0.016473770141601562, 0.017751216888427734, 0.019028663635253906, 0.020306110382080078, 0.02158355712890625, 0.022861003875732422, 0.024138450622558594, 0.025415897369384766, 0.026693344116210938, 0.02797079086303711, 0.02924823760986328, 0.030525684356689453, 0.031803131103515625, 0.0330805778503418, 0.03435802459716797, 0.03563547134399414, 0.03691291809082031, 0.038190364837646484, 0.039467811584472656, 0.04074525833129883, 0.042022705078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 8.0, 10.0, 23.0, 26.0, 61.0, 71.0, 124.0, 238.0, 555.0, 1871.0, 18183.0, 838869.0, 3232052.0, 95835.0, 4668.0, 931.0, 338.0, 169.0, 98.0, 50.0, 43.0, 17.0, 19.0, 7.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1566162109375, -0.15175819396972656, -0.14690017700195312, -0.1420421600341797, -0.13718414306640625, -0.1323261260986328, -0.12746810913085938, -0.12261009216308594, -0.1177520751953125, -0.11289405822753906, -0.10803604125976562, -0.10317802429199219, -0.09832000732421875, -0.09346199035644531, -0.08860397338867188, -0.08374595642089844, -0.078887939453125, -0.07402992248535156, -0.06917190551757812, -0.06431388854980469, -0.05945587158203125, -0.05459785461425781, -0.049739837646484375, -0.04488182067871094, -0.0400238037109375, -0.03516578674316406, -0.030307769775390625, -0.025449752807617188, -0.02059173583984375, -0.015733718872070312, -0.010875701904296875, -0.0060176849365234375, -0.00115966796875, 0.0036983489990234375, 0.008556365966796875, 0.013414382934570312, 0.01827239990234375, 0.023130416870117188, 0.027988433837890625, 0.03284645080566406, 0.0377044677734375, 0.04256248474121094, 0.047420501708984375, 0.05227851867675781, 0.05713653564453125, 0.06199455261230469, 0.06685256958007812, 0.07171058654785156, 0.076568603515625, 0.08142662048339844, 0.08628463745117188, 0.09114265441894531, 0.09600067138671875, 0.10085868835449219, 0.10571670532226562, 0.11057472229003906, 0.1154327392578125, 0.12029075622558594, 0.12514877319335938, 0.1300067901611328, 0.13486480712890625, 0.1397228240966797, 0.14458084106445312, 0.14943885803222656, 0.154296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 14.0, 11.0, 20.0, 24.0, 60.0, 82.0, 142.0, 228.0, 373.0, 488.0, 556.0, 623.0, 482.0, 330.0, 228.0, 154.0, 83.0, 67.0, 42.0, 28.0, 13.0, 10.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.077392578125, -0.07497119903564453, -0.07254981994628906, -0.0701284408569336, -0.06770706176757812, -0.06528568267822266, -0.06286430358886719, -0.06044292449951172, -0.05802154541015625, -0.05560016632080078, -0.05317878723144531, -0.050757408142089844, -0.048336029052734375, -0.045914649963378906, -0.04349327087402344, -0.04107189178466797, -0.0386505126953125, -0.03622913360595703, -0.03380775451660156, -0.031386375427246094, -0.028964996337890625, -0.026543617248535156, -0.024122238159179688, -0.02170085906982422, -0.01927947998046875, -0.01685810089111328, -0.014436721801757812, -0.012015342712402344, -0.009593963623046875, -0.007172584533691406, -0.0047512054443359375, -0.0023298263549804688, 9.1552734375e-05, 0.0025129318237304688, 0.0049343109130859375, 0.007355690002441406, 0.009777069091796875, 0.012198448181152344, 0.014619827270507812, 0.01704120635986328, 0.01946258544921875, 0.02188396453857422, 0.024305343627929688, 0.026726722717285156, 0.029148101806640625, 0.031569480895996094, 0.03399085998535156, 0.03641223907470703, 0.0388336181640625, 0.04125499725341797, 0.04367637634277344, 0.046097755432128906, 0.048519134521484375, 0.050940513610839844, 0.05336189270019531, 0.05578327178955078, 0.05820465087890625, 0.06062602996826172, 0.06304740905761719, 0.06546878814697266, 0.06789016723632812, 0.0703115463256836, 0.07273292541503906, 0.07515430450439453, 0.07757568359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 8.0, 173.0, 618.0, 204.0, 13.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1681140810251236, -0.1209784746170044, -0.0738428607583046, -0.026707246899604797, 0.020428359508514404, 0.0675639659166336, 0.114699587225914, 0.161835178732872, 0.2089708000421524, 0.2561064064502716, 0.303242027759552, 0.35037761926651, 0.3975132405757904, 0.4446488618850708, 0.4917844533920288, 0.5389200448989868, 0.5860556960105896, 0.6331912875175476, 0.6803269386291504, 0.7274625301361084, 0.7745981216430664, 0.8217337131500244, 0.8688693642616272, 0.9160049557685852, 0.9631405472755432, 1.010276198387146, 1.057411789894104, 1.104547381401062, 1.15168297290802, 1.198818564414978, 1.2459542751312256, 1.2930898666381836, 1.340225338935852, 1.38736093044281, 1.434496521949768, 1.4816322326660156, 1.5287678241729736, 1.5759034156799316, 1.6230390071868896, 1.6701745986938477, 1.7173101902008057, 1.7644457817077637, 1.8115813732147217, 1.8587169647216797, 1.9058526754379272, 1.9529882669448853, 2.000123977661133, 2.0472593307495117, 2.094395160675049, 2.141530752182007, 2.188666343688965, 2.235801935195923, 2.282937526702881, 2.330073118209839, 2.377208709716797, 2.424344539642334, 2.471479892730713, 2.518615484237671, 2.565751075744629, 2.612886667251587, 2.660022258758545, 2.707157850265503, 2.754293441772461, 2.801429271697998, 2.848564863204956]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 6.0, 10.0, 7.0, 17.0, 16.0, 17.0, 21.0, 29.0, 29.0, 33.0, 33.0, 28.0, 33.0, 53.0, 35.0, 39.0, 45.0, 49.0, 44.0, 28.0, 45.0, 53.0, 41.0, 31.0, 36.0, 31.0, 27.0, 26.0, 18.0, 18.0, 17.0, 23.0, 9.0, 12.0, 8.0, 7.0, 5.0, 9.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.17982804775238037, -0.17431052029132843, -0.1687929928302765, -0.16327545046806335, -0.1577579230070114, -0.15224039554595947, -0.14672285318374634, -0.1412053257226944, -0.13568779826164246, -0.13017027080059052, -0.12465273588895798, -0.11913520097732544, -0.1136176735162735, -0.10810014605522156, -0.10258261114358902, -0.09706507623195648, -0.09154754877090454, -0.0860300213098526, -0.08051248639822006, -0.07499495148658752, -0.06947742402553558, -0.06395989656448364, -0.058442361652851105, -0.052924830466508865, -0.047407299280166626, -0.04188976809382439, -0.03637223690748215, -0.030854705721139908, -0.02533717453479767, -0.01981964334845543, -0.01430211216211319, -0.00878458097577095, -0.003267049789428711, 0.0022504813969135284, 0.007768012583255768, 0.013285543769598007, 0.018803074955940247, 0.024320606142282486, 0.029838137328624725, 0.035355668514966965, 0.040873199701309204, 0.046390730887651443, 0.05190826207399368, 0.05742579326033592, 0.06294332444667816, 0.0684608519077301, 0.07397838681936264, 0.07949592173099518, 0.08501344919204712, 0.09053097665309906, 0.0960485115647316, 0.10156604647636414, 0.10708357393741608, 0.11260110139846802, 0.11811863631010056, 0.1236361712217331, 0.12915369868278503, 0.13467122614383698, 0.14018875360488892, 0.14570629596710205, 0.151223823428154, 0.15674135088920593, 0.16225889325141907, 0.167776420712471, 0.17329394817352295]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0, 5.0, 7.0, 6.0, 4.0, 10.0, 20.0, 20.0, 29.0, 50.0, 73.0, 105.0, 185.0, 293.0, 570.0, 1226.0, 2688.0, 6158.0, 15370.0, 41360.0, 118639.0, 306915.0, 336484.0, 139739.0, 47983.0, 17554.0, 7046.0, 2976.0, 1433.0, 705.0, 340.0, 170.0, 112.0, 95.0, 42.0, 36.0, 28.0, 24.0, 13.0, 15.0, 9.0, 3.0, 4.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08380126953125, -0.08081626892089844, -0.07783126831054688, -0.07484626770019531, -0.07186126708984375, -0.06887626647949219, -0.06589126586914062, -0.06290626525878906, -0.0599212646484375, -0.05693626403808594, -0.053951263427734375, -0.05096626281738281, -0.04798126220703125, -0.04499626159667969, -0.042011260986328125, -0.03902626037597656, -0.036041259765625, -0.03305625915527344, -0.030071258544921875, -0.027086257934570312, -0.02410125732421875, -0.021116256713867188, -0.018131256103515625, -0.015146255493164062, -0.0121612548828125, -0.009176254272460938, -0.006191253662109375, -0.0032062530517578125, -0.00022125244140625, 0.0027637481689453125, 0.005748748779296875, 0.008733749389648438, 0.01171875, 0.014703750610351562, 0.017688751220703125, 0.020673751831054688, 0.02365875244140625, 0.026643753051757812, 0.029628753662109375, 0.03261375427246094, 0.0355987548828125, 0.03858375549316406, 0.041568756103515625, 0.04455375671386719, 0.04753875732421875, 0.05052375793457031, 0.053508758544921875, 0.05649375915527344, 0.059478759765625, 0.06246376037597656, 0.06544876098632812, 0.06843376159667969, 0.07141876220703125, 0.07440376281738281, 0.07738876342773438, 0.08037376403808594, 0.0833587646484375, 0.08634376525878906, 0.08932876586914062, 0.09231376647949219, 0.09529876708984375, 0.09828376770019531, 0.10126876831054688, 0.10425376892089844, 0.10723876953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 4.0, 4.0, 13.0, 10.0, 17.0, 11.0, 24.0, 11.0, 17.0, 35.0, 35.0, 44.0, 44.0, 57.0, 71.0, 65.0, 61.0, 60.0, 56.0, 46.0, 54.0, 34.0, 40.0, 36.0, 30.0, 36.0, 17.0, 14.0, 9.0, 9.0, 9.0, 8.0, 6.0, 7.0, 3.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036773681640625, -0.03557634353637695, -0.034379005432128906, -0.03318166732788086, -0.03198432922363281, -0.030786991119384766, -0.02958965301513672, -0.028392314910888672, -0.027194976806640625, -0.025997638702392578, -0.02480030059814453, -0.023602962493896484, -0.022405624389648438, -0.02120828628540039, -0.020010948181152344, -0.018813610076904297, -0.01761627197265625, -0.016418933868408203, -0.015221595764160156, -0.01402425765991211, -0.012826919555664062, -0.011629581451416016, -0.010432243347167969, -0.009234905242919922, -0.008037567138671875, -0.006840229034423828, -0.005642890930175781, -0.004445552825927734, -0.0032482147216796875, -0.0020508766174316406, -0.0008535385131835938, 0.0003437995910644531, 0.0015411376953125, 0.002738475799560547, 0.003935813903808594, 0.005133152008056641, 0.0063304901123046875, 0.007527828216552734, 0.008725166320800781, 0.009922504425048828, 0.011119842529296875, 0.012317180633544922, 0.013514518737792969, 0.014711856842041016, 0.015909194946289062, 0.01710653305053711, 0.018303871154785156, 0.019501209259033203, 0.02069854736328125, 0.021895885467529297, 0.023093223571777344, 0.02429056167602539, 0.025487899780273438, 0.026685237884521484, 0.02788257598876953, 0.029079914093017578, 0.030277252197265625, 0.03147459030151367, 0.03267192840576172, 0.033869266510009766, 0.03506660461425781, 0.03626394271850586, 0.037461280822753906, 0.03865861892700195, 0.03985595703125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 14.0, 6.0, 10.0, 15.0, 23.0, 33.0, 61.0, 113.0, 170.0, 264.0, 643.0, 1706.0, 5596.0, 19651.0, 73882.0, 277564.0, 442791.0, 166361.0, 42778.0, 11391.0, 3295.0, 1104.0, 446.0, 260.0, 127.0, 73.0, 52.0, 38.0, 34.0, 12.0, 9.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11761474609375, -0.11345767974853516, -0.10930061340332031, -0.10514354705810547, -0.10098648071289062, -0.09682941436767578, -0.09267234802246094, -0.0885152816772461, -0.08435821533203125, -0.0802011489868164, -0.07604408264160156, -0.07188701629638672, -0.06772994995117188, -0.06357288360595703, -0.05941581726074219, -0.055258750915527344, -0.0511016845703125, -0.046944618225097656, -0.04278755187988281, -0.03863048553466797, -0.034473419189453125, -0.03031635284423828, -0.026159286499023438, -0.022002220153808594, -0.01784515380859375, -0.013688087463378906, -0.009531021118164062, -0.005373954772949219, -0.001216888427734375, 0.0029401779174804688, 0.0070972442626953125, 0.011254310607910156, 0.015411376953125, 0.019568443298339844, 0.023725509643554688, 0.02788257598876953, 0.032039642333984375, 0.03619670867919922, 0.04035377502441406, 0.044510841369628906, 0.04866790771484375, 0.052824974060058594, 0.05698204040527344, 0.06113910675048828, 0.06529617309570312, 0.06945323944091797, 0.07361030578613281, 0.07776737213134766, 0.0819244384765625, 0.08608150482177734, 0.09023857116699219, 0.09439563751220703, 0.09855270385742188, 0.10270977020263672, 0.10686683654785156, 0.1110239028930664, 0.11518096923828125, 0.1193380355834961, 0.12349510192871094, 0.12765216827392578, 0.13180923461914062, 0.13596630096435547, 0.1401233673095703, 0.14428043365478516, 0.1484375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 8.0, 10.0, 17.0, 19.0, 26.0, 25.0, 23.0, 33.0, 40.0, 26.0, 29.0, 37.0, 49.0, 46.0, 45.0, 37.0, 49.0, 49.0, 47.0, 49.0, 39.0, 44.0, 35.0, 25.0, 26.0, 31.0, 24.0, 32.0, 11.0, 8.0, 16.0, 8.0, 10.0, 9.0, 3.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.096435546875, -0.09363174438476562, -0.09082794189453125, -0.08802413940429688, -0.0852203369140625, -0.08241653442382812, -0.07961273193359375, -0.07680892944335938, -0.074005126953125, -0.07120132446289062, -0.06839752197265625, -0.06559371948242188, -0.0627899169921875, -0.059986114501953125, -0.05718231201171875, -0.054378509521484375, -0.05157470703125, -0.048770904541015625, -0.04596710205078125, -0.043163299560546875, -0.0403594970703125, -0.037555694580078125, -0.03475189208984375, -0.031948089599609375, -0.029144287109375, -0.026340484619140625, -0.02353668212890625, -0.020732879638671875, -0.0179290771484375, -0.015125274658203125, -0.01232147216796875, -0.009517669677734375, -0.0067138671875, -0.003910064697265625, -0.00110626220703125, 0.001697540283203125, 0.0045013427734375, 0.007305145263671875, 0.01010894775390625, 0.012912750244140625, 0.015716552734375, 0.018520355224609375, 0.02132415771484375, 0.024127960205078125, 0.0269317626953125, 0.029735565185546875, 0.03253936767578125, 0.035343170166015625, 0.03814697265625, 0.040950775146484375, 0.04375457763671875, 0.046558380126953125, 0.0493621826171875, 0.052165985107421875, 0.05496978759765625, 0.057773590087890625, 0.060577392578125, 0.06338119506835938, 0.06618499755859375, 0.06898880004882812, 0.0717926025390625, 0.07459640502929688, 0.07740020751953125, 0.08020401000976562, 0.0830078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 15.0, 19.0, 21.0, 46.0, 52.0, 85.0, 150.0, 321.0, 680.0, 1821.0, 6303.0, 26618.0, 136156.0, 468277.0, 320798.0, 67415.0, 13809.0, 3669.0, 1209.0, 510.0, 263.0, 130.0, 60.0, 49.0, 29.0, 16.0, 12.0, 11.0, 5.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.077392578125, -0.07503223419189453, -0.07267189025878906, -0.0703115463256836, -0.06795120239257812, -0.06559085845947266, -0.06323051452636719, -0.06087017059326172, -0.05850982666015625, -0.05614948272705078, -0.05378913879394531, -0.051428794860839844, -0.049068450927734375, -0.046708106994628906, -0.04434776306152344, -0.04198741912841797, -0.0396270751953125, -0.03726673126220703, -0.03490638732910156, -0.032546043395996094, -0.030185699462890625, -0.027825355529785156, -0.025465011596679688, -0.02310466766357422, -0.02074432373046875, -0.01838397979736328, -0.016023635864257812, -0.013663291931152344, -0.011302947998046875, -0.008942604064941406, -0.0065822601318359375, -0.004221916198730469, -0.001861572265625, 0.0004987716674804688, 0.0028591156005859375, 0.005219459533691406, 0.007579803466796875, 0.009940147399902344, 0.012300491333007812, 0.014660835266113281, 0.01702117919921875, 0.01938152313232422, 0.021741867065429688, 0.024102210998535156, 0.026462554931640625, 0.028822898864746094, 0.031183242797851562, 0.03354358673095703, 0.0359039306640625, 0.03826427459716797, 0.04062461853027344, 0.042984962463378906, 0.045345306396484375, 0.047705650329589844, 0.05006599426269531, 0.05242633819580078, 0.05478668212890625, 0.05714702606201172, 0.05950736999511719, 0.061867713928222656, 0.06422805786132812, 0.0665884017944336, 0.06894874572753906, 0.07130908966064453, 0.07366943359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 2.0, 3.0, 7.0, 7.0, 9.0, 12.0, 10.0, 12.0, 7.0, 18.0, 15.0, 21.0, 17.0, 24.0, 28.0, 30.0, 45.0, 48.0, 56.0, 65.0, 73.0, 66.0, 69.0, 60.0, 43.0, 42.0, 25.0, 19.0, 31.0, 24.0, 13.0, 16.0, 8.0, 11.0, 14.0, 7.0, 2.0, 11.0, 13.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9490718841552734e-05, -1.8914230167865753e-05, -1.8337741494178772e-05, -1.776125282049179e-05, -1.718476414680481e-05, -1.660827547311783e-05, -1.6031786799430847e-05, -1.5455298125743866e-05, -1.4878809452056885e-05, -1.4302320778369904e-05, -1.3725832104682922e-05, -1.3149343430995941e-05, -1.257285475730896e-05, -1.1996366083621979e-05, -1.1419877409934998e-05, -1.0843388736248016e-05, -1.0266900062561035e-05, -9.690411388874054e-06, -9.113922715187073e-06, -8.537434041500092e-06, -7.96094536781311e-06, -7.384456694126129e-06, -6.807968020439148e-06, -6.231479346752167e-06, -5.6549906730651855e-06, -5.078501999378204e-06, -4.502013325691223e-06, -3.925524652004242e-06, -3.3490359783172607e-06, -2.7725473046302795e-06, -2.1960586309432983e-06, -1.6195699572563171e-06, -1.043081283569336e-06, -4.6659260988235474e-07, 1.0989606380462646e-07, 6.863847374916077e-07, 1.2628734111785889e-06, 1.83936208486557e-06, 2.4158507585525513e-06, 2.9923394322395325e-06, 3.5688281059265137e-06, 4.145316779613495e-06, 4.721805453300476e-06, 5.298294126987457e-06, 5.8747828006744385e-06, 6.45127147436142e-06, 7.027760148048401e-06, 7.604248821735382e-06, 8.180737495422363e-06, 8.757226169109344e-06, 9.333714842796326e-06, 9.910203516483307e-06, 1.0486692190170288e-05, 1.106318086385727e-05, 1.163966953754425e-05, 1.2216158211231232e-05, 1.2792646884918213e-05, 1.3369135558605194e-05, 1.3945624232292175e-05, 1.4522112905979156e-05, 1.5098601579666138e-05, 1.567509025335312e-05, 1.62515789270401e-05, 1.682806760072708e-05, 1.7404556274414062e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 2.0, 3.0, 8.0, 17.0, 11.0, 15.0, 28.0, 44.0, 49.0, 70.0, 132.0, 215.0, 380.0, 753.0, 1626.0, 3938.0, 9887.0, 28053.0, 86919.0, 229679.0, 343255.0, 219690.0, 81205.0, 26329.0, 9255.0, 3709.0, 1572.0, 717.0, 382.0, 212.0, 141.0, 76.0, 45.0, 43.0, 30.0, 13.0, 11.0, 8.0, 11.0, 2.0, 2.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.037506103515625, -0.03623342514038086, -0.03496074676513672, -0.03368806838989258, -0.03241539001464844, -0.031142711639404297, -0.029870033264160156, -0.028597354888916016, -0.027324676513671875, -0.026051998138427734, -0.024779319763183594, -0.023506641387939453, -0.022233963012695312, -0.020961284637451172, -0.01968860626220703, -0.01841592788696289, -0.01714324951171875, -0.01587057113647461, -0.014597892761230469, -0.013325214385986328, -0.012052536010742188, -0.010779857635498047, -0.009507179260253906, -0.008234500885009766, -0.006961822509765625, -0.005689144134521484, -0.004416465759277344, -0.003143787384033203, -0.0018711090087890625, -0.0005984306335449219, 0.0006742477416992188, 0.0019469261169433594, 0.0032196044921875, 0.004492282867431641, 0.005764961242675781, 0.007037639617919922, 0.008310317993164062, 0.009582996368408203, 0.010855674743652344, 0.012128353118896484, 0.013401031494140625, 0.014673709869384766, 0.015946388244628906, 0.017219066619873047, 0.018491744995117188, 0.019764423370361328, 0.02103710174560547, 0.02230978012084961, 0.02358245849609375, 0.02485513687133789, 0.02612781524658203, 0.027400493621826172, 0.028673171997070312, 0.029945850372314453, 0.031218528747558594, 0.032491207122802734, 0.033763885498046875, 0.035036563873291016, 0.036309242248535156, 0.0375819206237793, 0.03885459899902344, 0.04012727737426758, 0.04139995574951172, 0.04267263412475586, 0.0439453125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 10.0, 6.0, 15.0, 15.0, 21.0, 25.0, 25.0, 37.0, 26.0, 46.0, 43.0, 48.0, 73.0, 62.0, 52.0, 62.0, 55.0, 62.0, 49.0, 37.0, 40.0, 39.0, 26.0, 23.0, 18.0, 14.0, 16.0, 11.0, 13.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0313720703125, -0.03046560287475586, -0.02955913543701172, -0.028652667999267578, -0.027746200561523438, -0.026839733123779297, -0.025933265686035156, -0.025026798248291016, -0.024120330810546875, -0.023213863372802734, -0.022307395935058594, -0.021400928497314453, -0.020494461059570312, -0.019587993621826172, -0.01868152618408203, -0.01777505874633789, -0.01686859130859375, -0.01596212387084961, -0.015055656433105469, -0.014149188995361328, -0.013242721557617188, -0.012336254119873047, -0.011429786682128906, -0.010523319244384766, -0.009616851806640625, -0.008710384368896484, -0.007803916931152344, -0.006897449493408203, -0.0059909820556640625, -0.005084514617919922, -0.004178047180175781, -0.0032715797424316406, -0.0023651123046875, -0.0014586448669433594, -0.0005521774291992188, 0.0003542900085449219, 0.0012607574462890625, 0.002167224884033203, 0.0030736923217773438, 0.003980159759521484, 0.004886627197265625, 0.005793094635009766, 0.006699562072753906, 0.007606029510498047, 0.008512496948242188, 0.009418964385986328, 0.010325431823730469, 0.01123189926147461, 0.01213836669921875, 0.01304483413696289, 0.013951301574707031, 0.014857769012451172, 0.015764236450195312, 0.016670703887939453, 0.017577171325683594, 0.018483638763427734, 0.019390106201171875, 0.020296573638916016, 0.021203041076660156, 0.022109508514404297, 0.023015975952148438, 0.023922443389892578, 0.02482891082763672, 0.02573537826538086, 0.026641845703125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 12.0, 44.0, 109.0, 243.0, 294.0, 188.0, 77.0, 28.0, 9.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7279870510101318, -0.7022101879119873, -0.6764333844184875, -0.650656521320343, -0.6248797178268433, -0.5991028547286987, -0.5733259916305542, -0.5475491881370544, -0.5217723250389099, -0.49599549174308777, -0.4702186584472656, -0.4444417953491211, -0.41866496205329895, -0.3928881287574768, -0.36711129546165466, -0.3413344621658325, -0.3155576288700104, -0.28978079557418823, -0.2640039622783661, -0.23822711408138275, -0.21245026588439941, -0.18667343258857727, -0.16089659929275513, -0.1351197510957718, -0.10934291779994965, -0.0835660770535469, -0.057789240032434464, -0.03201240301132202, -0.006235562264919281, 0.01954127848148346, 0.0453181117773056, 0.07109495997428894, 0.09687179327011108, 0.12264863401651382, 0.14842547476291656, 0.1742023080587387, 0.19997915625572205, 0.2257559895515442, 0.25153282284736633, 0.2773096561431885, 0.303086519241333, 0.32886335253715515, 0.3546401858329773, 0.3804170489311218, 0.40619388222694397, 0.4319707155227661, 0.45774754881858826, 0.4835243821144104, 0.5093011856079102, 0.5350780487060547, 0.5608548521995544, 0.586631715297699, 0.6124085187911987, 0.6381853818893433, 0.6639622449874878, 0.6897390484809875, 0.7155159115791321, 0.7412927746772766, 0.7670695781707764, 0.7928464412689209, 0.8186232447624207, 0.8444001078605652, 0.8701769113540649, 0.8959537744522095, 0.921730637550354]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 8.0, 4.0, 9.0, 9.0, 11.0, 15.0, 23.0, 29.0, 28.0, 33.0, 29.0, 35.0, 33.0, 48.0, 59.0, 45.0, 53.0, 49.0, 59.0, 46.0, 57.0, 35.0, 38.0, 38.0, 29.0, 31.0, 26.0, 20.0, 23.0, 19.0, 13.0, 9.0, 8.0, 9.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30393558740615845, -0.29411283135414124, -0.2842901051044464, -0.2744673490524292, -0.2646446228027344, -0.25482186675071716, -0.24499912559986115, -0.23517638444900513, -0.2253536432981491, -0.2155309021472931, -0.20570816099643707, -0.19588541984558105, -0.18606266379356384, -0.17623993754386902, -0.1664171814918518, -0.1565944403409958, -0.14677169919013977, -0.13694895803928375, -0.12712621688842773, -0.11730346828699112, -0.1074807271361351, -0.09765798598527908, -0.08783523738384247, -0.07801249623298645, -0.06818975508213043, -0.058367013931274414, -0.0485442690551281, -0.03872152417898178, -0.028898783028125763, -0.019076041877269745, -0.009253297001123428, 0.0005694478750228882, 0.010392189025878906, 0.020214932039380074, 0.03003767505288124, 0.03986041992902756, 0.049683161079883575, 0.059505902230739594, 0.06932865083217621, 0.07915139198303223, 0.08897413313388824, 0.09879687428474426, 0.10861961543560028, 0.1184423640370369, 0.1282651126384735, 0.13808783888816833, 0.14791059494018555, 0.15773333609104156, 0.16755607724189758, 0.1773788183927536, 0.18720155954360962, 0.19702430069446564, 0.20684704184532166, 0.21666979789733887, 0.22649253904819489, 0.2363152801990509, 0.24613802134990692, 0.25596076250076294, 0.26578351855278015, 0.275606244802475, 0.2854290008544922, 0.295251727104187, 0.3050744831562042, 0.31489723920822144, 0.32471996545791626]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 13.0, 8.0, 12.0, 19.0, 27.0, 41.0, 67.0, 64.0, 112.0, 128.0, 215.0, 411.0, 965.0, 4298.0, 51935.0, 2574796.0, 1525839.0, 30615.0, 3066.0, 707.0, 316.0, 199.0, 113.0, 89.0, 69.0, 59.0, 36.0, 19.0, 15.0, 10.0, 7.0, 5.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10498046875, -0.101348876953125, -0.09771728515625, -0.094085693359375, -0.0904541015625, -0.086822509765625, -0.08319091796875, -0.079559326171875, -0.075927734375, -0.072296142578125, -0.06866455078125, -0.065032958984375, -0.0614013671875, -0.057769775390625, -0.05413818359375, -0.050506591796875, -0.046875, -0.043243408203125, -0.03961181640625, -0.035980224609375, -0.0323486328125, -0.028717041015625, -0.02508544921875, -0.021453857421875, -0.017822265625, -0.014190673828125, -0.01055908203125, -0.006927490234375, -0.0032958984375, 0.000335693359375, 0.00396728515625, 0.007598876953125, 0.01123046875, 0.014862060546875, 0.01849365234375, 0.022125244140625, 0.0257568359375, 0.029388427734375, 0.03302001953125, 0.036651611328125, 0.040283203125, 0.043914794921875, 0.04754638671875, 0.051177978515625, 0.0548095703125, 0.058441162109375, 0.06207275390625, 0.065704345703125, 0.0693359375, 0.072967529296875, 0.07659912109375, 0.080230712890625, 0.0838623046875, 0.087493896484375, 0.09112548828125, 0.094757080078125, 0.098388671875, 0.102020263671875, 0.10565185546875, 0.109283447265625, 0.1129150390625, 0.116546630859375, 0.12017822265625, 0.123809814453125, 0.12744140625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 8.0, 11.0, 10.0, 14.0, 17.0, 31.0, 21.0, 23.0, 39.0, 44.0, 61.0, 57.0, 60.0, 57.0, 68.0, 61.0, 72.0, 44.0, 45.0, 43.0, 35.0, 24.0, 38.0, 33.0, 21.0, 16.0, 12.0, 7.0, 12.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0423583984375, -0.04105567932128906, -0.039752960205078125, -0.03845024108886719, -0.03714752197265625, -0.03584480285644531, -0.034542083740234375, -0.03323936462402344, -0.0319366455078125, -0.030633926391601562, -0.029331207275390625, -0.028028488159179688, -0.02672576904296875, -0.025423049926757812, -0.024120330810546875, -0.022817611694335938, -0.021514892578125, -0.020212173461914062, -0.018909454345703125, -0.017606735229492188, -0.01630401611328125, -0.015001296997070312, -0.013698577880859375, -0.012395858764648438, -0.0110931396484375, -0.009790420532226562, -0.008487701416015625, -0.0071849822998046875, -0.00588226318359375, -0.0045795440673828125, -0.003276824951171875, -0.0019741058349609375, -0.00067138671875, 0.0006313323974609375, 0.001934051513671875, 0.0032367706298828125, 0.00453948974609375, 0.0058422088623046875, 0.007144927978515625, 0.008447647094726562, 0.0097503662109375, 0.011053085327148438, 0.012355804443359375, 0.013658523559570312, 0.01496124267578125, 0.016263961791992188, 0.017566680908203125, 0.018869400024414062, 0.020172119140625, 0.021474838256835938, 0.022777557373046875, 0.024080276489257812, 0.02538299560546875, 0.026685714721679688, 0.027988433837890625, 0.029291152954101562, 0.0305938720703125, 0.03189659118652344, 0.033199310302734375, 0.03450202941894531, 0.03580474853515625, 0.03710746765136719, 0.038410186767578125, 0.03971290588378906, 0.041015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 9.0, 12.0, 22.0, 37.0, 42.0, 65.0, 104.0, 155.0, 301.0, 664.0, 2203.0, 12934.0, 171943.0, 2570892.0, 1355762.0, 69728.0, 6822.0, 1381.0, 505.0, 286.0, 150.0, 117.0, 48.0, 27.0, 22.0, 14.0, 13.0, 5.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1270751953125, -0.1237173080444336, -0.12035942077636719, -0.11700153350830078, -0.11364364624023438, -0.11028575897216797, -0.10692787170410156, -0.10356998443603516, -0.10021209716796875, -0.09685420989990234, -0.09349632263183594, -0.09013843536376953, -0.08678054809570312, -0.08342266082763672, -0.08006477355957031, -0.0767068862915039, -0.0733489990234375, -0.0699911117553711, -0.06663322448730469, -0.06327533721923828, -0.059917449951171875, -0.05655956268310547, -0.05320167541503906, -0.049843788146972656, -0.04648590087890625, -0.043128013610839844, -0.03977012634277344, -0.03641223907470703, -0.033054351806640625, -0.02969646453857422, -0.026338577270507812, -0.022980690002441406, -0.019622802734375, -0.016264915466308594, -0.012907028198242188, -0.009549140930175781, -0.006191253662109375, -0.0028333663940429688, 0.0005245208740234375, 0.0038824081420898438, 0.00724029541015625, 0.010598182678222656, 0.013956069946289062, 0.01731395721435547, 0.020671844482421875, 0.02402973175048828, 0.027387619018554688, 0.030745506286621094, 0.0341033935546875, 0.037461280822753906, 0.04081916809082031, 0.04417705535888672, 0.047534942626953125, 0.05089282989501953, 0.05425071716308594, 0.057608604431152344, 0.06096649169921875, 0.06432437896728516, 0.06768226623535156, 0.07104015350341797, 0.07439804077148438, 0.07775592803955078, 0.08111381530761719, 0.0844717025756836, 0.08782958984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 5.0, 7.0, 8.0, 18.0, 12.0, 36.0, 26.0, 54.0, 61.0, 91.0, 144.0, 149.0, 195.0, 247.0, 301.0, 325.0, 338.0, 354.0, 350.0, 293.0, 271.0, 186.0, 162.0, 110.0, 80.0, 59.0, 55.0, 41.0, 26.0, 22.0, 16.0, 10.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.036149024963378906, -0.03470039367675781, -0.03325176239013672, -0.031803131103515625, -0.03035449981689453, -0.028905868530273438, -0.027457237243652344, -0.02600860595703125, -0.024559974670410156, -0.023111343383789062, -0.02166271209716797, -0.020214080810546875, -0.01876544952392578, -0.017316818237304688, -0.015868186950683594, -0.0144195556640625, -0.012970924377441406, -0.011522293090820312, -0.010073661804199219, -0.008625030517578125, -0.007176399230957031, -0.0057277679443359375, -0.004279136657714844, -0.00283050537109375, -0.0013818740844726562, 6.67572021484375e-05, 0.0015153884887695312, 0.002964019775390625, 0.004412651062011719, 0.0058612823486328125, 0.007309913635253906, 0.008758544921875, 0.010207176208496094, 0.011655807495117188, 0.013104438781738281, 0.014553070068359375, 0.01600170135498047, 0.017450332641601562, 0.018898963928222656, 0.02034759521484375, 0.021796226501464844, 0.023244857788085938, 0.02469348907470703, 0.026142120361328125, 0.02759075164794922, 0.029039382934570312, 0.030488014221191406, 0.0319366455078125, 0.033385276794433594, 0.03483390808105469, 0.03628253936767578, 0.037731170654296875, 0.03917980194091797, 0.04062843322753906, 0.042077064514160156, 0.04352569580078125, 0.044974327087402344, 0.04642295837402344, 0.04787158966064453, 0.049320220947265625, 0.05076885223388672, 0.05221748352050781, 0.053666114807128906, 0.05511474609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 13.0, 37.0, 111.0, 224.0, 279.0, 185.0, 105.0, 35.0, 12.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5911338925361633, -0.5739768147468567, -0.5568197965621948, -0.5396627187728882, -0.5225057005882263, -0.5053486227989197, -0.4881915748119354, -0.47103452682495117, -0.4538774788379669, -0.43672043085098267, -0.4195633828639984, -0.40240633487701416, -0.3852492570877075, -0.36809223890304565, -0.350935161113739, -0.33377811312675476, -0.3166210651397705, -0.29946401715278625, -0.282306969165802, -0.26514992117881775, -0.2479928582906723, -0.23083581030368805, -0.2136787474155426, -0.19652169942855835, -0.1793646514415741, -0.16220760345458984, -0.1450505554676056, -0.12789349257946014, -0.11073644459247589, -0.09357939660549164, -0.07642234116792679, -0.05926528573036194, -0.042108237743377686, -0.024951186031103134, -0.007794134318828583, 0.009362917393445969, 0.02651996910572052, 0.04367701709270477, 0.06083407253026962, 0.07799112796783447, 0.09514817595481873, 0.11230522394180298, 0.12946227192878723, 0.14661933481693268, 0.16377638280391693, 0.18093343079090118, 0.19809049367904663, 0.21524754166603088, 0.23240458965301514, 0.2495616376399994, 0.26671868562698364, 0.2838757336139679, 0.30103278160095215, 0.3181898593902588, 0.33534690737724304, 0.3525039553642273, 0.36966100335121155, 0.3868180513381958, 0.40397509932518005, 0.4211321473121643, 0.43828922510147095, 0.4554462432861328, 0.47260332107543945, 0.4897603690624237, 0.506917417049408]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 5.0, 4.0, 8.0, 7.0, 11.0, 11.0, 18.0, 24.0, 20.0, 25.0, 26.0, 28.0, 28.0, 33.0, 36.0, 41.0, 44.0, 55.0, 50.0, 47.0, 49.0, 44.0, 53.0, 39.0, 31.0, 49.0, 32.0, 30.0, 18.0, 27.0, 28.0, 16.0, 18.0, 8.0, 11.0, 14.0, 8.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.180620014667511, -0.17485976219177246, -0.16909950971603394, -0.1633392572402954, -0.15757900476455688, -0.15181876718997955, -0.14605851471424103, -0.1402982622385025, -0.13453800976276398, -0.12877775728702545, -0.12301750481128693, -0.117257259786129, -0.11149700731039047, -0.10573675483465195, -0.09997650980949402, -0.0942162573337555, -0.08845600485801697, -0.08269575238227844, -0.07693549990653992, -0.07117525488138199, -0.06541500240564346, -0.05965474992990494, -0.05389450117945671, -0.048134252429008484, -0.04237399995326996, -0.03661374747753143, -0.030853498727083206, -0.02509324811398983, -0.019332997500896454, -0.013572746887803078, -0.0078124962747097015, -0.0020522475242614746, 0.0037080049514770508, 0.009468255564570427, 0.015228506177663803, 0.02098875679075718, 0.026749007403850555, 0.03250925987958908, 0.03826950863003731, 0.044029757380485535, 0.04979000985622406, 0.055550262331962585, 0.06131051108241081, 0.06707075983285904, 0.07283101230859756, 0.07859126478433609, 0.08435150980949402, 0.09011176228523254, 0.09587201476097107, 0.1016322672367096, 0.10739251971244812, 0.11315276473760605, 0.11891301721334457, 0.1246732696890831, 0.13043351471424103, 0.13619376718997955, 0.14195401966571808, 0.1477142721414566, 0.15347452461719513, 0.15923477709293365, 0.164995014667511, 0.1707552671432495, 0.17651551961898804, 0.18227577209472656, 0.1880360245704651]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 14.0, 15.0, 21.0, 29.0, 43.0, 53.0, 96.0, 171.0, 309.0, 595.0, 1316.0, 2913.0, 6647.0, 15957.0, 42577.0, 136695.0, 379477.0, 309513.0, 97661.0, 31962.0, 12537.0, 5425.0, 2320.0, 995.0, 510.0, 277.0, 153.0, 91.0, 52.0, 28.0, 28.0, 22.0, 10.0, 9.0, 7.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0985107421875, -0.09521198272705078, -0.09191322326660156, -0.08861446380615234, -0.08531570434570312, -0.0820169448852539, -0.07871818542480469, -0.07541942596435547, -0.07212066650390625, -0.06882190704345703, -0.06552314758300781, -0.062224388122558594, -0.058925628662109375, -0.055626869201660156, -0.05232810974121094, -0.04902935028076172, -0.0457305908203125, -0.04243183135986328, -0.03913307189941406, -0.035834312438964844, -0.032535552978515625, -0.029236793518066406, -0.025938034057617188, -0.02263927459716797, -0.01934051513671875, -0.01604175567626953, -0.012742996215820312, -0.009444236755371094, -0.006145477294921875, -0.0028467178344726562, 0.0004520416259765625, 0.0037508010864257812, 0.007049560546875, 0.010348320007324219, 0.013647079467773438, 0.016945838928222656, 0.020244598388671875, 0.023543357849121094, 0.026842117309570312, 0.03014087677001953, 0.03343963623046875, 0.03673839569091797, 0.04003715515136719, 0.043335914611816406, 0.046634674072265625, 0.049933433532714844, 0.05323219299316406, 0.05653095245361328, 0.0598297119140625, 0.06312847137451172, 0.06642723083496094, 0.06972599029541016, 0.07302474975585938, 0.0763235092163086, 0.07962226867675781, 0.08292102813720703, 0.08621978759765625, 0.08951854705810547, 0.09281730651855469, 0.0961160659790039, 0.09941482543945312, 0.10271358489990234, 0.10601234436035156, 0.10931110382080078, 0.11260986328125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 7.0, 12.0, 13.0, 31.0, 31.0, 21.0, 39.0, 44.0, 59.0, 71.0, 76.0, 69.0, 82.0, 85.0, 59.0, 43.0, 52.0, 45.0, 37.0, 30.0, 29.0, 18.0, 20.0, 8.0, 5.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04791259765625, -0.04642343521118164, -0.04493427276611328, -0.04344511032104492, -0.04195594787597656, -0.0404667854309082, -0.038977622985839844, -0.037488460540771484, -0.035999298095703125, -0.034510135650634766, -0.033020973205566406, -0.03153181076049805, -0.030042648315429688, -0.028553485870361328, -0.02706432342529297, -0.02557516098022461, -0.02408599853515625, -0.02259683609008789, -0.02110767364501953, -0.019618511199951172, -0.018129348754882812, -0.016640186309814453, -0.015151023864746094, -0.013661861419677734, -0.012172698974609375, -0.010683536529541016, -0.009194374084472656, -0.007705211639404297, -0.0062160491943359375, -0.004726886749267578, -0.0032377243041992188, -0.0017485618591308594, -0.0002593994140625, 0.0012297630310058594, 0.0027189254760742188, 0.004208087921142578, 0.0056972503662109375, 0.007186412811279297, 0.008675575256347656, 0.010164737701416016, 0.011653900146484375, 0.013143062591552734, 0.014632225036621094, 0.016121387481689453, 0.017610549926757812, 0.019099712371826172, 0.02058887481689453, 0.02207803726196289, 0.02356719970703125, 0.02505636215209961, 0.02654552459716797, 0.028034687042236328, 0.029523849487304688, 0.031013011932373047, 0.032502174377441406, 0.033991336822509766, 0.035480499267578125, 0.036969661712646484, 0.038458824157714844, 0.0399479866027832, 0.04143714904785156, 0.04292631149291992, 0.04441547393798828, 0.04590463638305664, 0.047393798828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 10.0, 5.0, 7.0, 15.0, 14.0, 18.0, 25.0, 40.0, 50.0, 64.0, 104.0, 131.0, 158.0, 240.0, 480.0, 891.0, 1811.0, 4066.0, 10197.0, 26194.0, 69384.0, 177505.0, 323421.0, 254750.0, 109509.0, 41692.0, 15890.0, 6309.0, 2608.0, 1214.0, 608.0, 337.0, 233.0, 157.0, 119.0, 86.0, 56.0, 35.0, 26.0, 26.0, 14.0, 12.0, 14.0, 9.0, 11.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0894775390625, -0.08690166473388672, -0.08432579040527344, -0.08174991607666016, -0.07917404174804688, -0.0765981674194336, -0.07402229309082031, -0.07144641876220703, -0.06887054443359375, -0.06629467010498047, -0.06371879577636719, -0.061142921447753906, -0.058567047119140625, -0.055991172790527344, -0.05341529846191406, -0.05083942413330078, -0.0482635498046875, -0.04568767547607422, -0.04311180114746094, -0.040535926818847656, -0.037960052490234375, -0.035384178161621094, -0.03280830383300781, -0.03023242950439453, -0.02765655517578125, -0.02508068084716797, -0.022504806518554688, -0.019928932189941406, -0.017353057861328125, -0.014777183532714844, -0.012201309204101562, -0.009625434875488281, -0.007049560546875, -0.004473686218261719, -0.0018978118896484375, 0.0006780624389648438, 0.003253936767578125, 0.005829811096191406, 0.008405685424804688, 0.010981559753417969, 0.01355743408203125, 0.01613330841064453, 0.018709182739257812, 0.021285057067871094, 0.023860931396484375, 0.026436805725097656, 0.029012680053710938, 0.03158855438232422, 0.0341644287109375, 0.03674030303955078, 0.03931617736816406, 0.041892051696777344, 0.044467926025390625, 0.047043800354003906, 0.04961967468261719, 0.05219554901123047, 0.05477142333984375, 0.05734729766845703, 0.05992317199707031, 0.062499046325683594, 0.06507492065429688, 0.06765079498291016, 0.07022666931152344, 0.07280254364013672, 0.07537841796875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 11.0, 10.0, 15.0, 10.0, 16.0, 18.0, 21.0, 28.0, 35.0, 27.0, 47.0, 31.0, 41.0, 35.0, 42.0, 41.0, 42.0, 50.0, 48.0, 38.0, 43.0, 43.0, 39.0, 31.0, 24.0, 28.0, 24.0, 30.0, 29.0, 16.0, 16.0, 8.0, 11.0, 9.0, 6.0, 5.0, 3.0, 7.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0743408203125, -0.07181644439697266, -0.06929206848144531, -0.06676769256591797, -0.06424331665039062, -0.06171894073486328, -0.05919456481933594, -0.056670188903808594, -0.05414581298828125, -0.051621437072753906, -0.04909706115722656, -0.04657268524169922, -0.044048309326171875, -0.04152393341064453, -0.03899955749511719, -0.036475181579589844, -0.0339508056640625, -0.031426429748535156, -0.028902053833007812, -0.02637767791748047, -0.023853302001953125, -0.02132892608642578, -0.018804550170898438, -0.016280174255371094, -0.01375579833984375, -0.011231422424316406, -0.008707046508789062, -0.006182670593261719, -0.003658294677734375, -0.0011339187622070312, 0.0013904571533203125, 0.003914833068847656, 0.006439208984375, 0.008963584899902344, 0.011487960815429688, 0.014012336730957031, 0.016536712646484375, 0.01906108856201172, 0.021585464477539062, 0.024109840393066406, 0.02663421630859375, 0.029158592224121094, 0.03168296813964844, 0.03420734405517578, 0.036731719970703125, 0.03925609588623047, 0.04178047180175781, 0.044304847717285156, 0.0468292236328125, 0.049353599548339844, 0.05187797546386719, 0.05440235137939453, 0.056926727294921875, 0.05945110321044922, 0.06197547912597656, 0.0644998550415039, 0.06702423095703125, 0.0695486068725586, 0.07207298278808594, 0.07459735870361328, 0.07712173461914062, 0.07964611053466797, 0.08217048645019531, 0.08469486236572266, 0.08721923828125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 9.0, 10.0, 10.0, 13.0, 22.0, 37.0, 53.0, 81.0, 118.0, 195.0, 282.0, 466.0, 859.0, 1329.0, 2158.0, 3531.0, 5902.0, 10179.0, 17289.0, 31390.0, 59094.0, 109642.0, 178666.0, 216322.0, 174659.0, 106569.0, 57045.0, 30835.0, 17144.0, 9747.0, 5808.0, 3502.0, 2099.0, 1314.0, 766.0, 502.0, 318.0, 208.0, 126.0, 83.0, 60.0, 44.0, 27.0, 12.0, 10.0, 13.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0218353271484375, -0.021162986755371094, -0.020490646362304688, -0.01981830596923828, -0.019145965576171875, -0.01847362518310547, -0.017801284790039062, -0.017128944396972656, -0.01645660400390625, -0.015784263610839844, -0.015111923217773438, -0.014439582824707031, -0.013767242431640625, -0.013094902038574219, -0.012422561645507812, -0.011750221252441406, -0.011077880859375, -0.010405540466308594, -0.009733200073242188, -0.009060859680175781, -0.008388519287109375, -0.007716178894042969, -0.0070438385009765625, -0.006371498107910156, -0.00569915771484375, -0.005026817321777344, -0.0043544769287109375, -0.0036821365356445312, -0.003009796142578125, -0.0023374557495117188, -0.0016651153564453125, -0.0009927749633789062, -0.0003204345703125, 0.00035190582275390625, 0.0010242462158203125, 0.0016965866088867188, 0.002368927001953125, 0.0030412673950195312, 0.0037136077880859375, 0.004385948181152344, 0.00505828857421875, 0.005730628967285156, 0.0064029693603515625, 0.007075309753417969, 0.007747650146484375, 0.008419990539550781, 0.009092330932617188, 0.009764671325683594, 0.01043701171875, 0.011109352111816406, 0.011781692504882812, 0.012454032897949219, 0.013126373291015625, 0.013798713684082031, 0.014471054077148438, 0.015143394470214844, 0.01581573486328125, 0.016488075256347656, 0.017160415649414062, 0.01783275604248047, 0.018505096435546875, 0.01917743682861328, 0.019849777221679688, 0.020522117614746094, 0.0211944580078125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 7.0, 5.0, 12.0, 22.0, 17.0, 9.0, 16.0, 22.0, 24.0, 35.0, 28.0, 35.0, 53.0, 58.0, 57.0, 54.0, 47.0, 69.0, 55.0, 47.0, 58.0, 35.0, 37.0, 34.0, 24.0, 26.0, 18.0, 17.0, 19.0, 7.0, 12.0, 7.0, 10.0, 5.0, 7.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1861324310302734e-05, -1.1422671377658844e-05, -1.0984018445014954e-05, -1.0545365512371063e-05, -1.0106712579727173e-05, -9.668059647083282e-06, -9.229406714439392e-06, -8.790753781795502e-06, -8.352100849151611e-06, -7.913447916507721e-06, -7.4747949838638306e-06, -7.03614205121994e-06, -6.59748911857605e-06, -6.1588361859321594e-06, -5.720183253288269e-06, -5.281530320644379e-06, -4.842877388000488e-06, -4.404224455356598e-06, -3.9655715227127075e-06, -3.526918590068817e-06, -3.0882656574249268e-06, -2.6496127247810364e-06, -2.210959792137146e-06, -1.7723068594932556e-06, -1.3336539268493652e-06, -8.950009942054749e-07, -4.5634806156158447e-07, -1.7695128917694092e-08, 4.209578037261963e-07, 8.596107363700867e-07, 1.298263669013977e-06, 1.7369166016578674e-06, 2.175569534301758e-06, 2.614222466945648e-06, 3.0528753995895386e-06, 3.491528332233429e-06, 3.930181264877319e-06, 4.36883419752121e-06, 4.8074871301651e-06, 5.2461400628089905e-06, 5.684792995452881e-06, 6.123445928096771e-06, 6.562098860740662e-06, 7.000751793384552e-06, 7.439404726028442e-06, 7.878057658672333e-06, 8.316710591316223e-06, 8.755363523960114e-06, 9.194016456604004e-06, 9.632669389247894e-06, 1.0071322321891785e-05, 1.0509975254535675e-05, 1.0948628187179565e-05, 1.1387281119823456e-05, 1.1825934052467346e-05, 1.2264586985111237e-05, 1.2703239917755127e-05, 1.3141892850399017e-05, 1.3580545783042908e-05, 1.4019198715686798e-05, 1.4457851648330688e-05, 1.4896504580974579e-05, 1.533515751361847e-05, 1.577381044626236e-05, 1.621246337890625e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 13.0, 10.0, 15.0, 21.0, 26.0, 48.0, 52.0, 66.0, 111.0, 188.0, 251.0, 428.0, 703.0, 1211.0, 2015.0, 3760.0, 7063.0, 13620.0, 28705.0, 68020.0, 155851.0, 264503.0, 251840.0, 138730.0, 59052.0, 25629.0, 12304.0, 6199.0, 3341.0, 1863.0, 1120.0, 634.0, 370.0, 235.0, 147.0, 110.0, 73.0, 54.0, 40.0, 31.0, 25.0, 23.0, 12.0, 10.0, 7.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0253753662109375, -0.024554729461669922, -0.023734092712402344, -0.022913455963134766, -0.022092819213867188, -0.02127218246459961, -0.02045154571533203, -0.019630908966064453, -0.018810272216796875, -0.017989635467529297, -0.01716899871826172, -0.01634836196899414, -0.015527725219726562, -0.014707088470458984, -0.013886451721191406, -0.013065814971923828, -0.01224517822265625, -0.011424541473388672, -0.010603904724121094, -0.009783267974853516, -0.008962631225585938, -0.00814199447631836, -0.007321357727050781, -0.006500720977783203, -0.005680084228515625, -0.004859447479248047, -0.004038810729980469, -0.0032181739807128906, -0.0023975372314453125, -0.0015769004821777344, -0.0007562637329101562, 6.437301635742188e-05, 0.000885009765625, 0.0017056465148925781, 0.0025262832641601562, 0.0033469200134277344, 0.0041675567626953125, 0.004988193511962891, 0.005808830261230469, 0.006629467010498047, 0.007450103759765625, 0.008270740509033203, 0.009091377258300781, 0.00991201400756836, 0.010732650756835938, 0.011553287506103516, 0.012373924255371094, 0.013194561004638672, 0.01401519775390625, 0.014835834503173828, 0.015656471252441406, 0.016477108001708984, 0.017297744750976562, 0.01811838150024414, 0.01893901824951172, 0.019759654998779297, 0.020580291748046875, 0.021400928497314453, 0.02222156524658203, 0.02304220199584961, 0.023862838745117188, 0.024683475494384766, 0.025504112243652344, 0.026324748992919922, 0.0271453857421875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 5.0, 5.0, 10.0, 7.0, 12.0, 11.0, 18.0, 20.0, 23.0, 26.0, 32.0, 38.0, 47.0, 62.0, 51.0, 54.0, 57.0, 53.0, 42.0, 60.0, 59.0, 46.0, 46.0, 47.0, 32.0, 26.0, 21.0, 14.0, 10.0, 11.0, 10.0, 15.0, 3.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0229339599609375, -0.022223472595214844, -0.021512985229492188, -0.02080249786376953, -0.020092010498046875, -0.01938152313232422, -0.018671035766601562, -0.017960548400878906, -0.01725006103515625, -0.016539573669433594, -0.015829086303710938, -0.015118598937988281, -0.014408111572265625, -0.013697624206542969, -0.012987136840820312, -0.012276649475097656, -0.011566162109375, -0.010855674743652344, -0.010145187377929688, -0.009434700012207031, -0.008724212646484375, -0.008013725280761719, -0.0073032379150390625, -0.006592750549316406, -0.00588226318359375, -0.005171775817871094, -0.0044612884521484375, -0.0037508010864257812, -0.003040313720703125, -0.0023298263549804688, -0.0016193389892578125, -0.0009088516235351562, -0.0001983642578125, 0.0005121231079101562, 0.0012226104736328125, 0.0019330978393554688, 0.002643585205078125, 0.0033540725708007812, 0.0040645599365234375, 0.004775047302246094, 0.00548553466796875, 0.006196022033691406, 0.0069065093994140625, 0.007616996765136719, 0.008327484130859375, 0.009037971496582031, 0.009748458862304688, 0.010458946228027344, 0.01116943359375, 0.011879920959472656, 0.012590408325195312, 0.013300895690917969, 0.014011383056640625, 0.014721870422363281, 0.015432357788085938, 0.016142845153808594, 0.01685333251953125, 0.017563819885253906, 0.018274307250976562, 0.01898479461669922, 0.019695281982421875, 0.02040576934814453, 0.021116256713867188, 0.021826744079589844, 0.0225372314453125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 34.0, 122.0, 278.0, 321.0, 169.0, 56.0, 19.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8447647094726562, -0.8157989382743835, -0.7868331670761108, -0.7578673958778381, -0.7289016246795654, -0.699935793876648, -0.67097008228302, -0.6420042514801025, -0.6130384802818298, -0.5840727090835571, -0.5551069378852844, -0.5261411666870117, -0.4971753656864166, -0.4682095944881439, -0.4392438232898712, -0.4102780222892761, -0.3813122808933258, -0.3523465096950531, -0.3233807384967804, -0.2944149374961853, -0.2654491662979126, -0.2364833950996399, -0.2075176239013672, -0.1785518378019333, -0.14958606660366058, -0.12062028795480728, -0.09165450930595398, -0.06268873810768127, -0.03372295945882797, -0.00475718080997467, 0.024208590388298035, 0.053174376487731934, 0.08214014768600464, 0.11110592633485794, 0.14007170498371124, 0.16903747618198395, 0.19800326228141785, 0.22696903347969055, 0.25593480467796326, 0.28490060567855835, 0.31386637687683105, 0.34283214807510376, 0.37179791927337646, 0.40076369047164917, 0.42972949147224426, 0.45869526267051697, 0.4876610338687897, 0.5166268348693848, 0.5455925464630127, 0.5745583176612854, 0.6035240888595581, 0.6324898600578308, 0.6614556312561035, 0.690421462059021, 0.7193871736526489, 0.7483530044555664, 0.7773187756538391, 0.8062845468521118, 0.8352503180503845, 0.8642160892486572, 0.8931818604469299, 0.9221476316452026, 0.9511134624481201, 0.9800792336463928, 1.0090450048446655]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 7.0, 7.0, 13.0, 11.0, 8.0, 16.0, 14.0, 32.0, 38.0, 27.0, 29.0, 35.0, 31.0, 57.0, 48.0, 49.0, 56.0, 38.0, 47.0, 42.0, 36.0, 41.0, 41.0, 50.0, 29.0, 26.0, 26.0, 24.0, 24.0, 21.0, 16.0, 11.0, 14.0, 8.0, 11.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.32525014877319336, -0.31658703088760376, -0.30792391300201416, -0.29926082491874695, -0.29059770703315735, -0.28193458914756775, -0.27327150106430054, -0.26460838317871094, -0.25594526529312134, -0.24728214740753174, -0.23861904442310333, -0.22995594143867493, -0.22129282355308533, -0.21262970566749573, -0.20396660268306732, -0.19530349969863892, -0.18664038181304932, -0.17797726392745972, -0.1693141609430313, -0.1606510579586029, -0.1519879400730133, -0.1433248221874237, -0.1346617192029953, -0.1259986162185669, -0.1173354983329773, -0.10867238789796829, -0.10000927746295929, -0.09134616702795029, -0.08268305659294128, -0.07401994615793228, -0.06535683572292328, -0.056693725287914276, -0.04803061485290527, -0.03936750441789627, -0.030704393982887268, -0.022041283547878265, -0.013378173112869263, -0.00471506267786026, 0.003948047757148743, 0.012611158192157745, 0.021274268627166748, 0.02993737906217575, 0.03860048949718475, 0.047263599932193756, 0.05592671036720276, 0.06458982080221176, 0.07325293123722076, 0.08191604167222977, 0.09057915210723877, 0.09924226254224777, 0.10790537297725677, 0.11656848341226578, 0.12523159384727478, 0.13389471173286438, 0.14255781471729279, 0.1512209177017212, 0.1598840355873108, 0.1685471534729004, 0.1772102564573288, 0.1858733594417572, 0.1945364773273468, 0.2031995952129364, 0.2118626981973648, 0.2205258011817932, 0.2291889190673828]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 11.0, 13.0, 26.0, 29.0, 44.0, 93.0, 154.0, 325.0, 600.0, 1381.0, 4174.0, 16024.0, 106255.0, 1421999.0, 2381849.0, 224435.0, 27405.0, 6181.0, 1869.0, 727.0, 305.0, 159.0, 83.0, 51.0, 34.0, 24.0, 10.0, 13.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0711669921875, -0.06880664825439453, -0.06644630432128906, -0.0640859603881836, -0.061725616455078125, -0.059365272521972656, -0.05700492858886719, -0.05464458465576172, -0.05228424072265625, -0.04992389678955078, -0.04756355285644531, -0.045203208923339844, -0.042842864990234375, -0.040482521057128906, -0.03812217712402344, -0.03576183319091797, -0.0334014892578125, -0.03104114532470703, -0.028680801391601562, -0.026320457458496094, -0.023960113525390625, -0.021599769592285156, -0.019239425659179688, -0.01687908172607422, -0.01451873779296875, -0.012158393859863281, -0.009798049926757812, -0.007437705993652344, -0.005077362060546875, -0.0027170181274414062, -0.0003566741943359375, 0.0020036697387695312, 0.004364013671875, 0.006724357604980469, 0.009084701538085938, 0.011445045471191406, 0.013805389404296875, 0.016165733337402344, 0.018526077270507812, 0.02088642120361328, 0.02324676513671875, 0.02560710906982422, 0.027967453002929688, 0.030327796936035156, 0.032688140869140625, 0.035048484802246094, 0.03740882873535156, 0.03976917266845703, 0.0421295166015625, 0.04448986053466797, 0.04685020446777344, 0.049210548400878906, 0.051570892333984375, 0.053931236267089844, 0.05629158020019531, 0.05865192413330078, 0.06101226806640625, 0.06337261199951172, 0.06573295593261719, 0.06809329986572266, 0.07045364379882812, 0.0728139877319336, 0.07517433166503906, 0.07753467559814453, 0.07989501953125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 7.0, 16.0, 20.0, 20.0, 15.0, 24.0, 29.0, 35.0, 60.0, 49.0, 56.0, 73.0, 68.0, 79.0, 77.0, 48.0, 60.0, 46.0, 48.0, 28.0, 34.0, 25.0, 21.0, 16.0, 14.0, 11.0, 2.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037841796875, -0.036448001861572266, -0.03505420684814453, -0.0336604118347168, -0.03226661682128906, -0.030872821807861328, -0.029479026794433594, -0.02808523178100586, -0.026691436767578125, -0.02529764175415039, -0.023903846740722656, -0.022510051727294922, -0.021116256713867188, -0.019722461700439453, -0.01832866668701172, -0.016934871673583984, -0.01554107666015625, -0.014147281646728516, -0.012753486633300781, -0.011359691619873047, -0.009965896606445312, -0.008572101593017578, -0.007178306579589844, -0.005784511566162109, -0.004390716552734375, -0.0029969215393066406, -0.0016031265258789062, -0.00020933151245117188, 0.0011844635009765625, 0.002578258514404297, 0.003972053527832031, 0.005365848541259766, 0.0067596435546875, 0.008153438568115234, 0.009547233581542969, 0.010941028594970703, 0.012334823608398438, 0.013728618621826172, 0.015122413635253906, 0.01651620864868164, 0.017910003662109375, 0.01930379867553711, 0.020697593688964844, 0.022091388702392578, 0.023485183715820312, 0.024878978729248047, 0.02627277374267578, 0.027666568756103516, 0.02906036376953125, 0.030454158782958984, 0.03184795379638672, 0.03324174880981445, 0.03463554382324219, 0.03602933883666992, 0.037423133850097656, 0.03881692886352539, 0.040210723876953125, 0.04160451889038086, 0.042998313903808594, 0.04439210891723633, 0.04578590393066406, 0.0471796989440918, 0.04857349395751953, 0.049967288970947266, 0.051361083984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 8.0, 15.0, 15.0, 18.0, 32.0, 40.0, 73.0, 150.0, 237.0, 633.0, 1620.0, 7387.0, 76988.0, 1916373.0, 2094500.0, 85550.0, 7795.0, 1646.0, 584.0, 260.0, 128.0, 72.0, 49.0, 26.0, 23.0, 17.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1402587890625, -0.13646984100341797, -0.13268089294433594, -0.1288919448852539, -0.12510299682617188, -0.12131404876708984, -0.11752510070800781, -0.11373615264892578, -0.10994720458984375, -0.10615825653076172, -0.10236930847167969, -0.09858036041259766, -0.09479141235351562, -0.0910024642944336, -0.08721351623535156, -0.08342456817626953, -0.0796356201171875, -0.07584667205810547, -0.07205772399902344, -0.0682687759399414, -0.06447982788085938, -0.060690879821777344, -0.05690193176269531, -0.05311298370361328, -0.04932403564453125, -0.04553508758544922, -0.04174613952636719, -0.037957191467285156, -0.034168243408203125, -0.030379295349121094, -0.026590347290039062, -0.02280139923095703, -0.019012451171875, -0.015223503112792969, -0.011434555053710938, -0.007645606994628906, -0.003856658935546875, -6.771087646484375e-05, 0.0037212371826171875, 0.007510185241699219, 0.01129913330078125, 0.015088081359863281, 0.018877029418945312, 0.022665977478027344, 0.026454925537109375, 0.030243873596191406, 0.03403282165527344, 0.03782176971435547, 0.0416107177734375, 0.04539966583251953, 0.04918861389160156, 0.052977561950683594, 0.056766510009765625, 0.060555458068847656, 0.06434440612792969, 0.06813335418701172, 0.07192230224609375, 0.07571125030517578, 0.07950019836425781, 0.08328914642333984, 0.08707809448242188, 0.0908670425415039, 0.09465599060058594, 0.09844493865966797, 0.10223388671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 16.0, 18.0, 31.0, 35.0, 58.0, 62.0, 105.0, 167.0, 185.0, 307.0, 386.0, 440.0, 456.0, 438.0, 346.0, 295.0, 190.0, 152.0, 90.0, 85.0, 56.0, 32.0, 36.0, 18.0, 13.0, 12.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0416259765625, -0.03992176055908203, -0.03821754455566406, -0.036513328552246094, -0.034809112548828125, -0.033104896545410156, -0.03140068054199219, -0.02969646453857422, -0.02799224853515625, -0.02628803253173828, -0.024583816528320312, -0.022879600524902344, -0.021175384521484375, -0.019471168518066406, -0.017766952514648438, -0.01606273651123047, -0.0143585205078125, -0.012654304504394531, -0.010950088500976562, -0.009245872497558594, -0.007541656494140625, -0.005837440490722656, -0.0041332244873046875, -0.0024290084838867188, -0.00072479248046875, 0.0009794235229492188, 0.0026836395263671875, 0.004387855529785156, 0.006092071533203125, 0.007796287536621094, 0.009500503540039062, 0.011204719543457031, 0.012908935546875, 0.014613151550292969, 0.016317367553710938, 0.018021583557128906, 0.019725799560546875, 0.021430015563964844, 0.023134231567382812, 0.02483844757080078, 0.02654266357421875, 0.02824687957763672, 0.029951095581054688, 0.031655311584472656, 0.033359527587890625, 0.035063743591308594, 0.03676795959472656, 0.03847217559814453, 0.0401763916015625, 0.04188060760498047, 0.04358482360839844, 0.045289039611816406, 0.046993255615234375, 0.048697471618652344, 0.05040168762207031, 0.05210590362548828, 0.05381011962890625, 0.05551433563232422, 0.05721855163574219, 0.058922767639160156, 0.060626983642578125, 0.062331199645996094, 0.06403541564941406, 0.06573963165283203, 0.06744384765625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 7.0, 16.0, 23.0, 49.0, 102.0, 165.0, 163.0, 173.0, 120.0, 86.0, 49.0, 28.0, 15.0, 12.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5891666412353516, -0.5762376189231873, -0.563308596611023, -0.5503795742988586, -0.5374505519866943, -0.52452152967453, -0.5115925073623657, -0.4986635148525238, -0.4857344925403595, -0.4728054702281952, -0.4598764479160309, -0.4469474256038666, -0.43401840329170227, -0.42108941078186035, -0.40816038846969604, -0.39523136615753174, -0.38230234384536743, -0.3693733215332031, -0.3564442992210388, -0.3435152769088745, -0.3305862545967102, -0.3176572322845459, -0.3047282099723816, -0.2917992174625397, -0.278870165348053, -0.26594114303588867, -0.25301212072372437, -0.24008309841156006, -0.22715409100055695, -0.21422506868839264, -0.20129604637622833, -0.18836703896522522, -0.1754380166530609, -0.1625089943408966, -0.1495799720287323, -0.136650949716568, -0.12372194230556488, -0.11079291999340057, -0.09786389768123627, -0.08493488281965256, -0.07200586050748825, -0.05907684192061424, -0.046147823333740234, -0.03321880102157593, -0.02028978243470192, -0.007360763847827911, 0.005568258464336395, 0.018497273325920105, 0.03142629563808441, 0.04435531422495842, 0.05728433281183243, 0.07021335512399673, 0.08314236998558044, 0.09607139229774475, 0.10900041460990906, 0.12192942947149277, 0.13485845923423767, 0.14778748154640198, 0.16071650385856628, 0.1736455261707306, 0.1865745335817337, 0.199503555893898, 0.21243257820606232, 0.22536158561706543, 0.23829060792922974]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 5.0, 12.0, 18.0, 19.0, 20.0, 17.0, 23.0, 28.0, 33.0, 21.0, 30.0, 28.0, 31.0, 34.0, 41.0, 46.0, 40.0, 35.0, 35.0, 45.0, 41.0, 36.0, 35.0, 39.0, 28.0, 29.0, 25.0, 26.0, 22.0, 23.0, 29.0, 15.0, 12.0, 15.0, 9.0, 10.0, 3.0, 14.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.16827094554901123, -0.16324302554130554, -0.15821510553359985, -0.15318717062473297, -0.14815925061702728, -0.1431313306093216, -0.1381033957004547, -0.13307547569274902, -0.12804755568504333, -0.12301963567733765, -0.11799170821905136, -0.11296378076076508, -0.10793586075305939, -0.1029079407453537, -0.09788001328706741, -0.09285208582878113, -0.08782416582107544, -0.08279624581336975, -0.07776831835508347, -0.07274039089679718, -0.06771247088909149, -0.0626845508813858, -0.05765662342309952, -0.05262869969010353, -0.047600775957107544, -0.04257285222411156, -0.03754492849111557, -0.03251700475811958, -0.027489081025123596, -0.02246115729212761, -0.017433233559131622, -0.012405309826135635, -0.0073773860931396484, -0.0023494623601436615, 0.0026784613728523254, 0.007706385105848312, 0.0127343088388443, 0.017762232571840286, 0.022790156304836273, 0.02781808003783226, 0.03284600377082825, 0.037873927503824234, 0.04290185123682022, 0.04792977496981621, 0.052957698702812195, 0.05798562243580818, 0.06301354616880417, 0.06804147362709045, 0.07306939363479614, 0.07809731364250183, 0.08312524110078812, 0.0881531685590744, 0.09318108856678009, 0.09820900857448578, 0.10323693603277206, 0.10826486349105835, 0.11329278349876404, 0.11832070350646973, 0.12334863096475601, 0.1283765584230423, 0.13340447843074799, 0.13843239843845367, 0.14346033334732056, 0.14848825335502625, 0.15351617336273193]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 8.0, 4.0, 16.0, 15.0, 29.0, 35.0, 57.0, 93.0, 188.0, 348.0, 690.0, 1570.0, 3984.0, 10791.0, 30928.0, 96468.0, 304231.0, 390091.0, 140717.0, 44117.0, 14804.0, 5393.0, 2112.0, 941.0, 413.0, 209.0, 113.0, 57.0, 45.0, 24.0, 23.0, 13.0, 11.0, 2.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.131591796875, -0.12831497192382812, -0.12503814697265625, -0.12176132202148438, -0.1184844970703125, -0.11520767211914062, -0.11193084716796875, -0.10865402221679688, -0.105377197265625, -0.10210037231445312, -0.09882354736328125, -0.09554672241210938, -0.0922698974609375, -0.08899307250976562, -0.08571624755859375, -0.08243942260742188, -0.07916259765625, -0.07588577270507812, -0.07260894775390625, -0.06933212280273438, -0.0660552978515625, -0.06277847290039062, -0.05950164794921875, -0.056224822998046875, -0.052947998046875, -0.049671173095703125, -0.04639434814453125, -0.043117523193359375, -0.0398406982421875, -0.036563873291015625, -0.03328704833984375, -0.030010223388671875, -0.0267333984375, -0.023456573486328125, -0.02017974853515625, -0.016902923583984375, -0.0136260986328125, -0.010349273681640625, -0.00707244873046875, -0.003795623779296875, -0.000518798828125, 0.002758026123046875, 0.00603485107421875, 0.009311676025390625, 0.0125885009765625, 0.015865325927734375, 0.01914215087890625, 0.022418975830078125, 0.02569580078125, 0.028972625732421875, 0.03224945068359375, 0.035526275634765625, 0.0388031005859375, 0.042079925537109375, 0.04535675048828125, 0.048633575439453125, 0.051910400390625, 0.055187225341796875, 0.05846405029296875, 0.061740875244140625, 0.0650177001953125, 0.06829452514648438, 0.07157135009765625, 0.07484817504882812, 0.078125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 6.0, 6.0, 8.0, 17.0, 22.0, 22.0, 24.0, 30.0, 38.0, 39.0, 49.0, 67.0, 59.0, 62.0, 66.0, 75.0, 55.0, 64.0, 54.0, 33.0, 44.0, 44.0, 31.0, 15.0, 18.0, 13.0, 16.0, 10.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04296875, -0.04165077209472656, -0.040332794189453125, -0.03901481628417969, -0.03769683837890625, -0.03637886047363281, -0.035060882568359375, -0.03374290466308594, -0.0324249267578125, -0.031106948852539062, -0.029788970947265625, -0.028470993041992188, -0.02715301513671875, -0.025835037231445312, -0.024517059326171875, -0.023199081420898438, -0.021881103515625, -0.020563125610351562, -0.019245147705078125, -0.017927169799804688, -0.01660919189453125, -0.015291213989257812, -0.013973236083984375, -0.012655258178710938, -0.0113372802734375, -0.010019302368164062, -0.008701324462890625, -0.0073833465576171875, -0.00606536865234375, -0.0047473907470703125, -0.003429412841796875, -0.0021114349365234375, -0.00079345703125, 0.0005245208740234375, 0.001842498779296875, 0.0031604766845703125, 0.00447845458984375, 0.0057964324951171875, 0.007114410400390625, 0.008432388305664062, 0.0097503662109375, 0.011068344116210938, 0.012386322021484375, 0.013704299926757812, 0.01502227783203125, 0.016340255737304688, 0.017658233642578125, 0.018976211547851562, 0.020294189453125, 0.021612167358398438, 0.022930145263671875, 0.024248123168945312, 0.02556610107421875, 0.026884078979492188, 0.028202056884765625, 0.029520034790039062, 0.0308380126953125, 0.03215599060058594, 0.033473968505859375, 0.03479194641113281, 0.03610992431640625, 0.03742790222167969, 0.038745880126953125, 0.04006385803222656, 0.0413818359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 7.0, 5.0, 5.0, 14.0, 12.0, 13.0, 12.0, 9.0, 18.0, 28.0, 32.0, 42.0, 62.0, 84.0, 178.0, 323.0, 824.0, 2198.0, 5862.0, 16586.0, 46223.0, 122305.0, 289946.0, 324370.0, 150181.0, 56765.0, 20611.0, 7348.0, 2610.0, 969.0, 410.0, 173.0, 86.0, 70.0, 39.0, 26.0, 23.0, 19.0, 17.0, 14.0, 6.0, 11.0, 5.0, 8.0, 4.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0892333984375, -0.08636474609375, -0.08349609375, -0.08062744140625, -0.0777587890625, -0.07489013671875, -0.072021484375, -0.06915283203125, -0.0662841796875, -0.06341552734375, -0.060546875, -0.05767822265625, -0.0548095703125, -0.05194091796875, -0.049072265625, -0.04620361328125, -0.0433349609375, -0.04046630859375, -0.03759765625, -0.03472900390625, -0.0318603515625, -0.02899169921875, -0.026123046875, -0.02325439453125, -0.0203857421875, -0.01751708984375, -0.0146484375, -0.01177978515625, -0.0089111328125, -0.00604248046875, -0.003173828125, -0.00030517578125, 0.0025634765625, 0.00543212890625, 0.00830078125, 0.01116943359375, 0.0140380859375, 0.01690673828125, 0.019775390625, 0.02264404296875, 0.0255126953125, 0.02838134765625, 0.03125, 0.03411865234375, 0.0369873046875, 0.03985595703125, 0.042724609375, 0.04559326171875, 0.0484619140625, 0.05133056640625, 0.05419921875, 0.05706787109375, 0.0599365234375, 0.06280517578125, 0.065673828125, 0.06854248046875, 0.0714111328125, 0.07427978515625, 0.0771484375, 0.08001708984375, 0.0828857421875, 0.08575439453125, 0.088623046875, 0.09149169921875, 0.0943603515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 6.0, 6.0, 8.0, 10.0, 6.0, 16.0, 11.0, 12.0, 17.0, 17.0, 19.0, 28.0, 21.0, 28.0, 21.0, 25.0, 30.0, 33.0, 34.0, 27.0, 46.0, 47.0, 41.0, 48.0, 19.0, 39.0, 39.0, 33.0, 33.0, 25.0, 27.0, 29.0, 23.0, 30.0, 25.0, 17.0, 23.0, 20.0, 8.0, 5.0, 12.0, 14.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.078125, -0.07583045959472656, -0.07353591918945312, -0.07124137878417969, -0.06894683837890625, -0.06665229797363281, -0.06435775756835938, -0.06206321716308594, -0.0597686767578125, -0.05747413635253906, -0.055179595947265625, -0.05288505554199219, -0.05059051513671875, -0.04829597473144531, -0.046001434326171875, -0.04370689392089844, -0.041412353515625, -0.03911781311035156, -0.036823272705078125, -0.03452873229980469, -0.03223419189453125, -0.029939651489257812, -0.027645111083984375, -0.025350570678710938, -0.0230560302734375, -0.020761489868164062, -0.018466949462890625, -0.016172409057617188, -0.01387786865234375, -0.011583328247070312, -0.009288787841796875, -0.0069942474365234375, -0.00469970703125, -0.0024051666259765625, -0.000110626220703125, 0.0021839141845703125, 0.00447845458984375, 0.0067729949951171875, 0.009067535400390625, 0.011362075805664062, 0.0136566162109375, 0.015951156616210938, 0.018245697021484375, 0.020540237426757812, 0.02283477783203125, 0.025129318237304688, 0.027423858642578125, 0.029718399047851562, 0.032012939453125, 0.03430747985839844, 0.036602020263671875, 0.03889656066894531, 0.04119110107421875, 0.04348564147949219, 0.045780181884765625, 0.04807472229003906, 0.0503692626953125, 0.05266380310058594, 0.054958343505859375, 0.05725288391113281, 0.05954742431640625, 0.06184196472167969, 0.06413650512695312, 0.06643104553222656, 0.0687255859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 11.0, 8.0, 11.0, 14.0, 18.0, 28.0, 62.0, 58.0, 84.0, 163.0, 214.0, 348.0, 571.0, 996.0, 1661.0, 2743.0, 4686.0, 8425.0, 15118.0, 28022.0, 51620.0, 92884.0, 156676.0, 213101.0, 191897.0, 123294.0, 69395.0, 38615.0, 20834.0, 11466.0, 6395.0, 3695.0, 2188.0, 1252.0, 741.0, 454.0, 288.0, 165.0, 104.0, 82.0, 48.0, 34.0, 24.0, 22.0, 12.0, 10.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0211639404296875, -0.02045273780822754, -0.019741535186767578, -0.019030332565307617, -0.018319129943847656, -0.017607927322387695, -0.016896724700927734, -0.016185522079467773, -0.015474319458007812, -0.014763116836547852, -0.01405191421508789, -0.01334071159362793, -0.012629508972167969, -0.011918306350708008, -0.011207103729248047, -0.010495901107788086, -0.009784698486328125, -0.009073495864868164, -0.008362293243408203, -0.007651090621948242, -0.006939888000488281, -0.00622868537902832, -0.005517482757568359, -0.0048062801361083984, -0.0040950775146484375, -0.0033838748931884766, -0.0026726722717285156, -0.0019614696502685547, -0.0012502670288085938, -0.0005390644073486328, 0.00017213821411132812, 0.0008833408355712891, 0.00159454345703125, 0.002305746078491211, 0.003016948699951172, 0.003728151321411133, 0.004439353942871094, 0.005150556564331055, 0.005861759185791016, 0.0065729618072509766, 0.0072841644287109375, 0.007995367050170898, 0.00870656967163086, 0.00941777229309082, 0.010128974914550781, 0.010840177536010742, 0.011551380157470703, 0.012262582778930664, 0.012973785400390625, 0.013684988021850586, 0.014396190643310547, 0.015107393264770508, 0.01581859588623047, 0.01652979850769043, 0.01724100112915039, 0.01795220375061035, 0.018663406372070312, 0.019374608993530273, 0.020085811614990234, 0.020797014236450195, 0.021508216857910156, 0.022219419479370117, 0.022930622100830078, 0.02364182472229004, 0.02435302734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 2.0, 6.0, 2.0, 10.0, 6.0, 12.0, 12.0, 13.0, 15.0, 20.0, 26.0, 29.0, 36.0, 37.0, 58.0, 62.0, 54.0, 75.0, 72.0, 39.0, 65.0, 56.0, 52.0, 27.0, 34.0, 31.0, 21.0, 20.0, 23.0, 9.0, 11.0, 13.0, 7.0, 10.0, 7.0, 6.0, 2.0, 4.0, 6.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.519918441772461e-05, -1.4643184840679169e-05, -1.4087185263633728e-05, -1.3531185686588287e-05, -1.2975186109542847e-05, -1.2419186532497406e-05, -1.1863186955451965e-05, -1.1307187378406525e-05, -1.0751187801361084e-05, -1.0195188224315643e-05, -9.639188647270203e-06, -9.083189070224762e-06, -8.527189493179321e-06, -7.97118991613388e-06, -7.41519033908844e-06, -6.859190762042999e-06, -6.303191184997559e-06, -5.747191607952118e-06, -5.191192030906677e-06, -4.6351924538612366e-06, -4.079192876815796e-06, -3.5231932997703552e-06, -2.9671937227249146e-06, -2.411194145679474e-06, -1.8551945686340332e-06, -1.2991949915885925e-06, -7.431954145431519e-07, -1.8719583749771118e-07, 3.688037395477295e-07, 9.248033165931702e-07, 1.4808028936386108e-06, 2.0368024706840515e-06, 2.592802047729492e-06, 3.148801624774933e-06, 3.7048012018203735e-06, 4.260800778865814e-06, 4.816800355911255e-06, 5.3727999329566956e-06, 5.928799510002136e-06, 6.484799087047577e-06, 7.040798664093018e-06, 7.596798241138458e-06, 8.152797818183899e-06, 8.70879739522934e-06, 9.26479697227478e-06, 9.820796549320221e-06, 1.0376796126365662e-05, 1.0932795703411102e-05, 1.1488795280456543e-05, 1.2044794857501984e-05, 1.2600794434547424e-05, 1.3156794011592865e-05, 1.3712793588638306e-05, 1.4268793165683746e-05, 1.4824792742729187e-05, 1.5380792319774628e-05, 1.593679189682007e-05, 1.649279147386551e-05, 1.704879105091095e-05, 1.760479062795639e-05, 1.816079020500183e-05, 1.8716789782047272e-05, 1.9272789359092712e-05, 1.9828788936138153e-05, 2.0384788513183594e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 4.0, 5.0, 12.0, 7.0, 17.0, 26.0, 53.0, 81.0, 146.0, 259.0, 522.0, 1056.0, 2157.0, 4538.0, 9685.0, 21872.0, 47050.0, 101655.0, 196151.0, 264486.0, 200862.0, 106177.0, 49889.0, 22483.0, 10180.0, 4636.0, 2236.0, 1035.0, 571.0, 257.0, 154.0, 97.0, 60.0, 25.0, 25.0, 14.0, 13.0, 7.0, 6.0, 9.0, 8.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0241851806640625, -0.023392915725708008, -0.022600650787353516, -0.021808385848999023, -0.02101612091064453, -0.02022385597229004, -0.019431591033935547, -0.018639326095581055, -0.017847061157226562, -0.01705479621887207, -0.016262531280517578, -0.015470266342163086, -0.014678001403808594, -0.013885736465454102, -0.01309347152709961, -0.012301206588745117, -0.011508941650390625, -0.010716676712036133, -0.00992441177368164, -0.009132146835327148, -0.008339881896972656, -0.007547616958618164, -0.006755352020263672, -0.00596308708190918, -0.0051708221435546875, -0.004378557205200195, -0.003586292266845703, -0.002794027328491211, -0.0020017623901367188, -0.0012094974517822266, -0.0004172325134277344, 0.0003750324249267578, 0.00116729736328125, 0.001959562301635742, 0.0027518272399902344, 0.0035440921783447266, 0.004336357116699219, 0.005128622055053711, 0.005920886993408203, 0.006713151931762695, 0.0075054168701171875, 0.00829768180847168, 0.009089946746826172, 0.009882211685180664, 0.010674476623535156, 0.011466741561889648, 0.01225900650024414, 0.013051271438598633, 0.013843536376953125, 0.014635801315307617, 0.01542806625366211, 0.0162203311920166, 0.017012596130371094, 0.017804861068725586, 0.018597126007080078, 0.01938939094543457, 0.020181655883789062, 0.020973920822143555, 0.021766185760498047, 0.02255845069885254, 0.02335071563720703, 0.024142980575561523, 0.024935245513916016, 0.025727510452270508, 0.026519775390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 7.0, 6.0, 5.0, 8.0, 7.0, 9.0, 6.0, 4.0, 14.0, 15.0, 8.0, 12.0, 15.0, 18.0, 31.0, 33.0, 31.0, 28.0, 34.0, 56.0, 52.0, 61.0, 51.0, 58.0, 53.0, 55.0, 47.0, 35.0, 39.0, 40.0, 30.0, 19.0, 23.0, 19.0, 14.0, 9.0, 5.0, 6.0, 11.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.0222930908203125, -0.02165079116821289, -0.02100849151611328, -0.020366191864013672, -0.019723892211914062, -0.019081592559814453, -0.018439292907714844, -0.017796993255615234, -0.017154693603515625, -0.016512393951416016, -0.015870094299316406, -0.015227794647216797, -0.014585494995117188, -0.013943195343017578, -0.013300895690917969, -0.01265859603881836, -0.01201629638671875, -0.01137399673461914, -0.010731697082519531, -0.010089397430419922, -0.009447097778320312, -0.008804798126220703, -0.008162498474121094, -0.007520198822021484, -0.006877899169921875, -0.006235599517822266, -0.005593299865722656, -0.004951000213623047, -0.0043087005615234375, -0.003666400909423828, -0.0030241012573242188, -0.0023818016052246094, -0.001739501953125, -0.0010972023010253906, -0.00045490264892578125, 0.00018739700317382812, 0.0008296966552734375, 0.0014719963073730469, 0.0021142959594726562, 0.0027565956115722656, 0.003398895263671875, 0.004041194915771484, 0.004683494567871094, 0.005325794219970703, 0.0059680938720703125, 0.006610393524169922, 0.007252693176269531, 0.00789499282836914, 0.00853729248046875, 0.00917959213256836, 0.009821891784667969, 0.010464191436767578, 0.011106491088867188, 0.011748790740966797, 0.012391090393066406, 0.013033390045166016, 0.013675689697265625, 0.014317989349365234, 0.014960289001464844, 0.015602588653564453, 0.016244888305664062, 0.016887187957763672, 0.01752948760986328, 0.01817178726196289, 0.0188140869140625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 3.0, 7.0, 14.0, 15.0, 27.0, 20.0, 45.0, 52.0, 49.0, 61.0, 86.0, 85.0, 81.0, 69.0, 74.0, 71.0, 52.0, 53.0, 34.0, 24.0, 25.0, 7.0, 16.0, 8.0, 10.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21301813423633575, -0.20575805008411407, -0.1984979808330536, -0.1912378966808319, -0.18397781252861023, -0.17671772837638855, -0.16945765912532806, -0.16219757497310638, -0.1549375057220459, -0.14767742156982422, -0.14041735231876373, -0.13315726816654205, -0.12589718401432037, -0.11863710731267929, -0.11137703061103821, -0.10411694645881653, -0.09685686230659485, -0.08959678560495377, -0.08233670145273209, -0.075076624751091, -0.06781654059886932, -0.06055646389722824, -0.05329638719558716, -0.04603630676865578, -0.038776226341724396, -0.031516145914793015, -0.024256067350506783, -0.01699598878622055, -0.00973590835928917, -0.002475827932357788, 0.004784248769283295, 0.012044329196214676, 0.01930442452430725, 0.026564504951238632, 0.03382458537817001, 0.041084662079811096, 0.04834474250674248, 0.05560482293367386, 0.06286489963531494, 0.07012498378753662, 0.0773850604891777, 0.08464513719081879, 0.09190522134304047, 0.09916529804468155, 0.10642537474632263, 0.11368545889854431, 0.1209455356001854, 0.12820561230182648, 0.13546569645404816, 0.14272578060626984, 0.14998584985733032, 0.157245934009552, 0.16450601816177368, 0.17176610231399536, 0.17902617156505585, 0.18628625571727753, 0.193546324968338, 0.2008064091205597, 0.20806647837162018, 0.21532656252384186, 0.22258664667606354, 0.22984671592712402, 0.2371068000793457, 0.24436688423156738, 0.25162696838378906]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 5.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 12.0, 10.0, 13.0, 13.0, 17.0, 24.0, 27.0, 26.0, 31.0, 31.0, 39.0, 33.0, 35.0, 52.0, 42.0, 43.0, 42.0, 41.0, 58.0, 36.0, 42.0, 44.0, 44.0, 41.0, 24.0, 24.0, 22.0, 22.0, 27.0, 12.0, 13.0, 10.0, 5.0, 1.0, 8.0, 5.0, 3.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2907903790473938, -0.2819488048553467, -0.27310723066329956, -0.26426562666893005, -0.25542405247688293, -0.24658247828483582, -0.2377409040927887, -0.22889931499958038, -0.22005772590637207, -0.21121615171432495, -0.20237456262111664, -0.19353298842906952, -0.1846913993358612, -0.1758498251438141, -0.16700825095176697, -0.15816666185855865, -0.14932508766651154, -0.14048351347446442, -0.1316419243812561, -0.12280035018920898, -0.11395876109600067, -0.10511718690395355, -0.09627560526132584, -0.08743402361869812, -0.0785924419760704, -0.06975086033344269, -0.06090927869081497, -0.052067700773477554, -0.04322611913084984, -0.03438453748822212, -0.025542959570884705, -0.01670137792825699, -0.007859796285629272, 0.000981784425675869, 0.00982336513698101, 0.018664944916963577, 0.027506526559591293, 0.03634810820221901, 0.04518968611955643, 0.05403126776218414, 0.06287284940481186, 0.07171443104743958, 0.08055601269006729, 0.08939759433269501, 0.09823916852474213, 0.10708075761795044, 0.11592233180999756, 0.12476391345262527, 0.133605495095253, 0.1424470692873001, 0.15128865838050842, 0.16013023257255554, 0.16897182166576385, 0.17781339585781097, 0.1866549849510193, 0.1954965591430664, 0.20433813333511353, 0.21317970752716064, 0.22202129662036896, 0.23086287081241608, 0.2397044599056244, 0.2485460340976715, 0.25738760828971863, 0.26622921228408813, 0.27507078647613525]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 5.0, 10.0, 23.0, 33.0, 44.0, 72.0, 129.0, 222.0, 487.0, 1334.0, 4798.0, 24569.0, 294424.0, 3254168.0, 567447.0, 37528.0, 6345.0, 1584.0, 526.0, 229.0, 123.0, 70.0, 43.0, 25.0, 12.0, 13.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0897216796875, -0.0864706039428711, -0.08321952819824219, -0.07996845245361328, -0.07671737670898438, -0.07346630096435547, -0.07021522521972656, -0.06696414947509766, -0.06371307373046875, -0.060461997985839844, -0.05721092224121094, -0.05395984649658203, -0.050708770751953125, -0.04745769500732422, -0.04420661926269531, -0.040955543518066406, -0.0377044677734375, -0.034453392028808594, -0.031202316284179688, -0.02795124053955078, -0.024700164794921875, -0.02144908905029297, -0.018198013305664062, -0.014946937561035156, -0.01169586181640625, -0.008444786071777344, -0.0051937103271484375, -0.0019426345825195312, 0.001308441162109375, 0.004559516906738281, 0.0078105926513671875, 0.011061668395996094, 0.014312744140625, 0.017563819885253906, 0.020814895629882812, 0.02406597137451172, 0.027317047119140625, 0.03056812286376953, 0.03381919860839844, 0.037070274353027344, 0.04032135009765625, 0.043572425842285156, 0.04682350158691406, 0.05007457733154297, 0.053325653076171875, 0.05657672882080078, 0.05982780456542969, 0.0630788803100586, 0.0663299560546875, 0.0695810317993164, 0.07283210754394531, 0.07608318328857422, 0.07933425903320312, 0.08258533477783203, 0.08583641052246094, 0.08908748626708984, 0.09233856201171875, 0.09558963775634766, 0.09884071350097656, 0.10209178924560547, 0.10534286499023438, 0.10859394073486328, 0.11184501647949219, 0.1150960922241211, 0.11834716796875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 11.0, 12.0, 11.0, 24.0, 29.0, 23.0, 35.0, 49.0, 48.0, 61.0, 63.0, 66.0, 68.0, 66.0, 68.0, 62.0, 55.0, 53.0, 45.0, 37.0, 26.0, 22.0, 23.0, 12.0, 10.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044586181640625, -0.04314374923706055, -0.041701316833496094, -0.04025888442993164, -0.03881645202636719, -0.037374019622802734, -0.03593158721923828, -0.03448915481567383, -0.033046722412109375, -0.03160429000854492, -0.03016185760498047, -0.028719425201416016, -0.027276992797851562, -0.02583456039428711, -0.024392127990722656, -0.022949695587158203, -0.02150726318359375, -0.020064830780029297, -0.018622398376464844, -0.01717996597290039, -0.015737533569335938, -0.014295101165771484, -0.012852668762207031, -0.011410236358642578, -0.009967803955078125, -0.008525371551513672, -0.007082939147949219, -0.005640506744384766, -0.0041980743408203125, -0.0027556419372558594, -0.0013132095336914062, 0.00012922286987304688, 0.0015716552734375, 0.003014087677001953, 0.004456520080566406, 0.005898952484130859, 0.0073413848876953125, 0.008783817291259766, 0.010226249694824219, 0.011668682098388672, 0.013111114501953125, 0.014553546905517578, 0.01599597930908203, 0.017438411712646484, 0.018880844116210938, 0.02032327651977539, 0.021765708923339844, 0.023208141326904297, 0.02465057373046875, 0.026093006134033203, 0.027535438537597656, 0.02897787094116211, 0.030420303344726562, 0.031862735748291016, 0.03330516815185547, 0.03474760055541992, 0.036190032958984375, 0.03763246536254883, 0.03907489776611328, 0.040517330169677734, 0.04195976257324219, 0.04340219497680664, 0.044844627380371094, 0.04628705978393555, 0.0477294921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 6.0, 5.0, 6.0, 9.0, 25.0, 20.0, 50.0, 41.0, 70.0, 110.0, 213.0, 405.0, 1042.0, 3419.0, 20232.0, 279823.0, 3138989.0, 702508.0, 39479.0, 5363.0, 1342.0, 518.0, 208.0, 135.0, 90.0, 55.0, 35.0, 24.0, 23.0, 16.0, 9.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.137451171875, -0.13370037078857422, -0.12994956970214844, -0.12619876861572266, -0.12244796752929688, -0.1186971664428711, -0.11494636535644531, -0.11119556427001953, -0.10744476318359375, -0.10369396209716797, -0.09994316101074219, -0.0961923599243164, -0.09244155883789062, -0.08869075775146484, -0.08493995666503906, -0.08118915557861328, -0.0774383544921875, -0.07368755340576172, -0.06993675231933594, -0.06618595123291016, -0.062435150146484375, -0.058684349060058594, -0.05493354797363281, -0.05118274688720703, -0.04743194580078125, -0.04368114471435547, -0.03993034362792969, -0.036179542541503906, -0.032428741455078125, -0.028677940368652344, -0.024927139282226562, -0.02117633819580078, -0.017425537109375, -0.013674736022949219, -0.009923934936523438, -0.006173133850097656, -0.002422332763671875, 0.0013284683227539062, 0.0050792694091796875, 0.008830070495605469, 0.01258087158203125, 0.01633167266845703, 0.020082473754882812, 0.023833274841308594, 0.027584075927734375, 0.031334877014160156, 0.03508567810058594, 0.03883647918701172, 0.0425872802734375, 0.04633808135986328, 0.05008888244628906, 0.053839683532714844, 0.057590484619140625, 0.061341285705566406, 0.06509208679199219, 0.06884288787841797, 0.07259368896484375, 0.07634449005126953, 0.08009529113769531, 0.0838460922241211, 0.08759689331054688, 0.09134769439697266, 0.09509849548339844, 0.09884929656982422, 0.10260009765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 3.0, 12.0, 14.0, 18.0, 15.0, 28.0, 48.0, 65.0, 77.0, 119.0, 171.0, 221.0, 313.0, 365.0, 462.0, 448.0, 422.0, 324.0, 267.0, 210.0, 127.0, 88.0, 69.0, 43.0, 34.0, 22.0, 25.0, 16.0, 15.0, 9.0, 5.0, 1.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039703369140625, -0.03806161880493164, -0.03641986846923828, -0.03477811813354492, -0.03313636779785156, -0.0314946174621582, -0.029852867126464844, -0.028211116790771484, -0.026569366455078125, -0.024927616119384766, -0.023285865783691406, -0.021644115447998047, -0.020002365112304688, -0.018360614776611328, -0.01671886444091797, -0.01507711410522461, -0.01343536376953125, -0.01179361343383789, -0.010151863098144531, -0.008510112762451172, -0.0068683624267578125, -0.005226612091064453, -0.0035848617553710938, -0.0019431114196777344, -0.000301361083984375, 0.0013403892517089844, 0.0029821395874023438, 0.004623889923095703, 0.0062656402587890625, 0.007907390594482422, 0.009549140930175781, 0.01119089126586914, 0.0128326416015625, 0.01447439193725586, 0.01611614227294922, 0.017757892608642578, 0.019399642944335938, 0.021041393280029297, 0.022683143615722656, 0.024324893951416016, 0.025966644287109375, 0.027608394622802734, 0.029250144958496094, 0.030891895294189453, 0.03253364562988281, 0.03417539596557617, 0.03581714630126953, 0.03745889663696289, 0.03910064697265625, 0.04074239730834961, 0.04238414764404297, 0.04402589797973633, 0.04566764831542969, 0.04730939865112305, 0.048951148986816406, 0.050592899322509766, 0.052234649658203125, 0.053876399993896484, 0.055518150329589844, 0.0571599006652832, 0.05880165100097656, 0.06044340133666992, 0.06208515167236328, 0.06372690200805664, 0.06536865234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 9.0, 16.0, 24.0, 31.0, 39.0, 75.0, 75.0, 91.0, 96.0, 113.0, 110.0, 89.0, 71.0, 57.0, 34.0, 22.0, 18.0, 13.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35860559344291687, -0.34958165884017944, -0.340557724237442, -0.3315337896347046, -0.32250985503196716, -0.31348592042922974, -0.3044620156288147, -0.29543808102607727, -0.28641414642333984, -0.2773902118206024, -0.268366277217865, -0.25934234261512756, -0.25031840801239014, -0.2412944883108139, -0.23227055370807648, -0.22324663400650024, -0.21422268450260162, -0.2051987498998642, -0.19617481529712677, -0.18715089559555054, -0.1781269609928131, -0.16910302639007568, -0.16007909178733826, -0.15105515718460083, -0.1420312225818634, -0.13300728797912598, -0.12398336082696915, -0.11495942622423172, -0.10593549907207489, -0.09691156446933746, -0.08788762986660004, -0.0788637027144432, -0.06983977556228638, -0.06081584468483925, -0.05179191380739212, -0.042767979204654694, -0.033744048327207565, -0.024720117449760437, -0.01569618284702301, -0.00667225569486618, 0.0023516789078712463, 0.01137561071664095, 0.020399542525410652, 0.02942347526550293, 0.03844740614295006, 0.047471337020397186, 0.05649527162313461, 0.06551919877529144, 0.07454313337802887, 0.0835670679807663, 0.09259099513292313, 0.10161492973566055, 0.11063885688781738, 0.11966279149055481, 0.12868672609329224, 0.13771066069602966, 0.1467345952987671, 0.15575852990150452, 0.16478246450424194, 0.17380639910697937, 0.1828303188085556, 0.19185425341129303, 0.20087818801403046, 0.2099021077156067, 0.21892604231834412]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 3.0, 3.0, 11.0, 9.0, 8.0, 10.0, 20.0, 23.0, 18.0, 24.0, 31.0, 27.0, 26.0, 26.0, 24.0, 37.0, 44.0, 41.0, 35.0, 30.0, 31.0, 35.0, 41.0, 47.0, 44.0, 34.0, 34.0, 32.0, 41.0, 18.0, 31.0, 19.0, 17.0, 16.0, 24.0, 12.0, 11.0, 6.0, 9.0, 9.0, 11.0, 6.0, 3.0, 7.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1703234314918518, -0.16501012444496155, -0.1596968173980713, -0.15438351035118103, -0.14907020330429077, -0.14375688135623932, -0.13844357430934906, -0.1331302672624588, -0.12781696021556854, -0.12250365316867828, -0.11719034612178802, -0.11187703162431717, -0.10656372457742691, -0.10125041753053665, -0.0959371030330658, -0.09062379598617554, -0.08531048893928528, -0.07999718189239502, -0.07468387484550476, -0.0693705603480339, -0.06405725330114365, -0.05874394625425339, -0.05343063548207283, -0.04811732470989227, -0.042804017663002014, -0.037490710616111755, -0.0321773998439312, -0.02686409093439579, -0.021550782024860382, -0.016237473115324974, -0.010924164205789566, -0.005610853433609009, -0.00029754638671875, 0.005015762522816658, 0.010329071432352066, 0.015642380341887474, 0.020955689251422882, 0.02626899816095829, 0.0315823070704937, 0.036895617842674255, 0.042208924889564514, 0.04752223193645477, 0.05283554270863533, 0.05814885348081589, 0.06346216052770615, 0.0687754675745964, 0.07408878207206726, 0.07940208911895752, 0.08471539616584778, 0.09002870321273804, 0.0953420102596283, 0.10065532475709915, 0.10596863180398941, 0.11128193885087967, 0.11659525334835052, 0.12190856039524078, 0.12722186744213104, 0.1325351744890213, 0.13784848153591156, 0.14316178858280182, 0.14847511053085327, 0.15378841757774353, 0.1591017246246338, 0.16441503167152405, 0.1697283387184143]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 6.0, 3.0, 9.0, 11.0, 10.0, 15.0, 18.0, 23.0, 27.0, 43.0, 66.0, 95.0, 187.0, 282.0, 557.0, 1106.0, 2232.0, 4546.0, 10306.0, 23842.0, 59755.0, 155246.0, 324251.0, 274249.0, 114511.0, 43832.0, 18113.0, 7766.0, 3666.0, 1769.0, 863.0, 451.0, 266.0, 133.0, 83.0, 69.0, 44.0, 36.0, 23.0, 11.0, 8.0, 8.0, 5.0, 2.0, 4.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.142578125, -0.1379547119140625, -0.133331298828125, -0.1287078857421875, -0.12408447265625, -0.1194610595703125, -0.114837646484375, -0.1102142333984375, -0.1055908203125, -0.1009674072265625, -0.096343994140625, -0.0917205810546875, -0.08709716796875, -0.0824737548828125, -0.077850341796875, -0.0732269287109375, -0.068603515625, -0.0639801025390625, -0.059356689453125, -0.0547332763671875, -0.05010986328125, -0.0454864501953125, -0.040863037109375, -0.0362396240234375, -0.0316162109375, -0.0269927978515625, -0.022369384765625, -0.0177459716796875, -0.01312255859375, -0.0084991455078125, -0.003875732421875, 0.0007476806640625, 0.00537109375, 0.0099945068359375, 0.014617919921875, 0.0192413330078125, 0.02386474609375, 0.0284881591796875, 0.033111572265625, 0.0377349853515625, 0.0423583984375, 0.0469818115234375, 0.051605224609375, 0.0562286376953125, 0.06085205078125, 0.0654754638671875, 0.070098876953125, 0.0747222900390625, 0.079345703125, 0.0839691162109375, 0.088592529296875, 0.0932159423828125, 0.09783935546875, 0.1024627685546875, 0.107086181640625, 0.1117095947265625, 0.1163330078125, 0.1209564208984375, 0.125579833984375, 0.1302032470703125, 0.13482666015625, 0.1394500732421875, 0.144073486328125, 0.1486968994140625, 0.1533203125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 10.0, 5.0, 13.0, 13.0, 18.0, 23.0, 30.0, 32.0, 31.0, 31.0, 44.0, 52.0, 71.0, 60.0, 72.0, 76.0, 51.0, 47.0, 52.0, 61.0, 42.0, 31.0, 35.0, 31.0, 19.0, 18.0, 11.0, 9.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042388916015625, -0.04110145568847656, -0.039813995361328125, -0.03852653503417969, -0.03723907470703125, -0.03595161437988281, -0.034664154052734375, -0.03337669372558594, -0.0320892333984375, -0.030801773071289062, -0.029514312744140625, -0.028226852416992188, -0.02693939208984375, -0.025651931762695312, -0.024364471435546875, -0.023077011108398438, -0.02178955078125, -0.020502090454101562, -0.019214630126953125, -0.017927169799804688, -0.01663970947265625, -0.015352249145507812, -0.014064788818359375, -0.012777328491210938, -0.0114898681640625, -0.010202407836914062, -0.008914947509765625, -0.0076274871826171875, -0.00634002685546875, -0.0050525665283203125, -0.003765106201171875, -0.0024776458740234375, -0.001190185546875, 9.72747802734375e-05, 0.001384735107421875, 0.0026721954345703125, 0.00395965576171875, 0.0052471160888671875, 0.006534576416015625, 0.007822036743164062, 0.0091094970703125, 0.010396957397460938, 0.011684417724609375, 0.012971878051757812, 0.01425933837890625, 0.015546798706054688, 0.016834259033203125, 0.018121719360351562, 0.0194091796875, 0.020696640014648438, 0.021984100341796875, 0.023271560668945312, 0.02455902099609375, 0.025846481323242188, 0.027133941650390625, 0.028421401977539062, 0.0297088623046875, 0.030996322631835938, 0.032283782958984375, 0.03357124328613281, 0.03485870361328125, 0.03614616394042969, 0.037433624267578125, 0.03872108459472656, 0.040008544921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 8.0, 5.0, 5.0, 7.0, 10.0, 7.0, 20.0, 17.0, 33.0, 41.0, 67.0, 83.0, 121.0, 176.0, 288.0, 518.0, 845.0, 1443.0, 2541.0, 4738.0, 9358.0, 19102.0, 43937.0, 99899.0, 202219.0, 274672.0, 203150.0, 101202.0, 44062.0, 19680.0, 9415.0, 4643.0, 2521.0, 1507.0, 794.0, 510.0, 292.0, 187.0, 142.0, 94.0, 60.0, 42.0, 24.0, 30.0, 13.0, 9.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09136962890625, -0.0881643295288086, -0.08495903015136719, -0.08175373077392578, -0.07854843139648438, -0.07534313201904297, -0.07213783264160156, -0.06893253326416016, -0.06572723388671875, -0.06252193450927734, -0.05931663513183594, -0.05611133575439453, -0.052906036376953125, -0.04970073699951172, -0.04649543762207031, -0.043290138244628906, -0.0400848388671875, -0.036879539489746094, -0.03367424011230469, -0.03046894073486328, -0.027263641357421875, -0.02405834197998047, -0.020853042602539062, -0.017647743225097656, -0.01444244384765625, -0.011237144470214844, -0.008031845092773438, -0.004826545715332031, -0.001621246337890625, 0.0015840530395507812, 0.0047893524169921875, 0.007994651794433594, 0.011199951171875, 0.014405250549316406, 0.017610549926757812, 0.02081584930419922, 0.024021148681640625, 0.02722644805908203, 0.030431747436523438, 0.033637046813964844, 0.03684234619140625, 0.040047645568847656, 0.04325294494628906, 0.04645824432373047, 0.049663543701171875, 0.05286884307861328, 0.05607414245605469, 0.059279441833496094, 0.0624847412109375, 0.0656900405883789, 0.06889533996582031, 0.07210063934326172, 0.07530593872070312, 0.07851123809814453, 0.08171653747558594, 0.08492183685302734, 0.08812713623046875, 0.09133243560791016, 0.09453773498535156, 0.09774303436279297, 0.10094833374023438, 0.10415363311767578, 0.10735893249511719, 0.1105642318725586, 0.11376953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 9.0, 13.0, 18.0, 16.0, 21.0, 33.0, 15.0, 22.0, 29.0, 39.0, 47.0, 43.0, 61.0, 49.0, 53.0, 42.0, 64.0, 52.0, 52.0, 47.0, 38.0, 46.0, 37.0, 23.0, 27.0, 23.0, 13.0, 9.0, 9.0, 15.0, 8.0, 4.0, 6.0, 1.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09259033203125, -0.08933639526367188, -0.08608245849609375, -0.08282852172851562, -0.0795745849609375, -0.07632064819335938, -0.07306671142578125, -0.06981277465820312, -0.066558837890625, -0.06330490112304688, -0.06005096435546875, -0.056797027587890625, -0.0535430908203125, -0.050289154052734375, -0.04703521728515625, -0.043781280517578125, -0.04052734375, -0.037273406982421875, -0.03401947021484375, -0.030765533447265625, -0.0275115966796875, -0.024257659912109375, -0.02100372314453125, -0.017749786376953125, -0.014495849609375, -0.011241912841796875, -0.00798797607421875, -0.004734039306640625, -0.0014801025390625, 0.001773834228515625, 0.00502777099609375, 0.008281707763671875, 0.01153564453125, 0.014789581298828125, 0.01804351806640625, 0.021297454833984375, 0.0245513916015625, 0.027805328369140625, 0.03105926513671875, 0.034313201904296875, 0.037567138671875, 0.040821075439453125, 0.04407501220703125, 0.047328948974609375, 0.0505828857421875, 0.053836822509765625, 0.05709075927734375, 0.060344696044921875, 0.0635986328125, 0.06685256958007812, 0.07010650634765625, 0.07336044311523438, 0.0766143798828125, 0.07986831665039062, 0.08312225341796875, 0.08637619018554688, 0.089630126953125, 0.09288406372070312, 0.09613800048828125, 0.09939193725585938, 0.1026458740234375, 0.10589981079101562, 0.10915374755859375, 0.11240768432617188, 0.11566162109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 6.0, 6.0, 8.0, 16.0, 16.0, 37.0, 49.0, 67.0, 111.0, 141.0, 214.0, 353.0, 518.0, 790.0, 1248.0, 1740.0, 2879.0, 4813.0, 8514.0, 16032.0, 33851.0, 79949.0, 200075.0, 328820.0, 209552.0, 84402.0, 35345.0, 16812.0, 8783.0, 5022.0, 3060.0, 1870.0, 1145.0, 761.0, 513.0, 354.0, 212.0, 161.0, 78.0, 72.0, 45.0, 39.0, 31.0, 12.0, 13.0, 8.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.056121826171875, -0.054341793060302734, -0.05256175994873047, -0.0507817268371582, -0.04900169372558594, -0.04722166061401367, -0.045441627502441406, -0.04366159439086914, -0.041881561279296875, -0.04010152816772461, -0.038321495056152344, -0.03654146194458008, -0.03476142883300781, -0.03298139572143555, -0.03120136260986328, -0.029421329498291016, -0.02764129638671875, -0.025861263275146484, -0.02408123016357422, -0.022301197052001953, -0.020521163940429688, -0.018741130828857422, -0.016961097717285156, -0.01518106460571289, -0.013401031494140625, -0.01162099838256836, -0.009840965270996094, -0.008060932159423828, -0.0062808990478515625, -0.004500865936279297, -0.0027208328247070312, -0.0009407997131347656, 0.0008392333984375, 0.0026192665100097656, 0.004399299621582031, 0.006179332733154297, 0.007959365844726562, 0.009739398956298828, 0.011519432067871094, 0.01329946517944336, 0.015079498291015625, 0.01685953140258789, 0.018639564514160156, 0.020419597625732422, 0.022199630737304688, 0.023979663848876953, 0.02575969696044922, 0.027539730072021484, 0.02931976318359375, 0.031099796295166016, 0.03287982940673828, 0.03465986251831055, 0.03643989562988281, 0.03821992874145508, 0.039999961853027344, 0.04177999496459961, 0.043560028076171875, 0.04534006118774414, 0.047120094299316406, 0.04890012741088867, 0.05068016052246094, 0.0524601936340332, 0.05424022674560547, 0.056020259857177734, 0.05780029296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 4.0, 11.0, 9.0, 12.0, 18.0, 29.0, 30.0, 38.0, 53.0, 71.0, 67.0, 85.0, 70.0, 81.0, 87.0, 72.0, 66.0, 41.0, 35.0, 25.0, 27.0, 15.0, 13.0, 10.0, 8.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.62396240234375e-05, -3.532692790031433e-05, -3.441423177719116e-05, -3.350153565406799e-05, -3.2588839530944824e-05, -3.1676143407821655e-05, -3.0763447284698486e-05, -2.9850751161575317e-05, -2.893805503845215e-05, -2.802535891532898e-05, -2.711266279220581e-05, -2.619996666908264e-05, -2.5287270545959473e-05, -2.4374574422836304e-05, -2.3461878299713135e-05, -2.2549182176589966e-05, -2.1636486053466797e-05, -2.0723789930343628e-05, -1.981109380722046e-05, -1.889839768409729e-05, -1.798570156097412e-05, -1.7073005437850952e-05, -1.6160309314727783e-05, -1.5247613191604614e-05, -1.4334917068481445e-05, -1.3422220945358276e-05, -1.2509524822235107e-05, -1.1596828699111938e-05, -1.068413257598877e-05, -9.7714364528656e-06, -8.858740329742432e-06, -7.946044206619263e-06, -7.033348083496094e-06, -6.120651960372925e-06, -5.207955837249756e-06, -4.295259714126587e-06, -3.382563591003418e-06, -2.469867467880249e-06, -1.55717134475708e-06, -6.444752216339111e-07, 2.682209014892578e-07, 1.1809170246124268e-06, 2.0936131477355957e-06, 3.0063092708587646e-06, 3.919005393981934e-06, 4.8317015171051025e-06, 5.7443976402282715e-06, 6.6570937633514404e-06, 7.569789886474609e-06, 8.482486009597778e-06, 9.395182132720947e-06, 1.0307878255844116e-05, 1.1220574378967285e-05, 1.2133270502090454e-05, 1.3045966625213623e-05, 1.3958662748336792e-05, 1.4871358871459961e-05, 1.578405499458313e-05, 1.66967511177063e-05, 1.7609447240829468e-05, 1.8522143363952637e-05, 1.9434839487075806e-05, 2.0347535610198975e-05, 2.1260231733322144e-05, 2.2172927856445312e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 2.0, 4.0, 8.0, 16.0, 11.0, 23.0, 33.0, 50.0, 73.0, 129.0, 229.0, 357.0, 707.0, 1238.0, 2254.0, 5083.0, 12562.0, 37163.0, 155998.0, 504557.0, 244669.0, 53912.0, 16704.0, 6487.0, 2969.0, 1454.0, 745.0, 400.0, 267.0, 151.0, 100.0, 58.0, 51.0, 25.0, 13.0, 15.0, 7.0, 4.0, 4.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.072998046875, -0.0703573226928711, -0.06771659851074219, -0.06507587432861328, -0.062435150146484375, -0.05979442596435547, -0.05715370178222656, -0.054512977600097656, -0.05187225341796875, -0.049231529235839844, -0.04659080505371094, -0.04395008087158203, -0.041309356689453125, -0.03866863250732422, -0.03602790832519531, -0.033387184143066406, -0.0307464599609375, -0.028105735778808594, -0.025465011596679688, -0.02282428741455078, -0.020183563232421875, -0.01754283905029297, -0.014902114868164062, -0.012261390686035156, -0.00962066650390625, -0.006979942321777344, -0.0043392181396484375, -0.0016984939575195312, 0.000942230224609375, 0.0035829544067382812, 0.0062236785888671875, 0.008864402770996094, 0.011505126953125, 0.014145851135253906, 0.016786575317382812, 0.01942729949951172, 0.022068023681640625, 0.02470874786376953, 0.027349472045898438, 0.029990196228027344, 0.03263092041015625, 0.035271644592285156, 0.03791236877441406, 0.04055309295654297, 0.043193817138671875, 0.04583454132080078, 0.04847526550292969, 0.051115989685058594, 0.0537567138671875, 0.056397438049316406, 0.05903816223144531, 0.06167888641357422, 0.06431961059570312, 0.06696033477783203, 0.06960105895996094, 0.07224178314208984, 0.07488250732421875, 0.07752323150634766, 0.08016395568847656, 0.08280467987060547, 0.08544540405273438, 0.08808612823486328, 0.09072685241699219, 0.0933675765991211, 0.09600830078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 2.0, 5.0, 7.0, 13.0, 9.0, 14.0, 30.0, 53.0, 69.0, 100.0, 153.0, 142.0, 109.0, 100.0, 62.0, 35.0, 28.0, 25.0, 7.0, 9.0, 10.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0787353515625, -0.07645606994628906, -0.07417678833007812, -0.07189750671386719, -0.06961822509765625, -0.06733894348144531, -0.06505966186523438, -0.06278038024902344, -0.0605010986328125, -0.05822181701660156, -0.055942535400390625, -0.05366325378417969, -0.05138397216796875, -0.04910469055175781, -0.046825408935546875, -0.04454612731933594, -0.042266845703125, -0.03998756408691406, -0.037708282470703125, -0.03542900085449219, -0.03314971923828125, -0.030870437622070312, -0.028591156005859375, -0.026311874389648438, -0.0240325927734375, -0.021753311157226562, -0.019474029541015625, -0.017194747924804688, -0.01491546630859375, -0.012636184692382812, -0.010356903076171875, -0.008077621459960938, -0.00579833984375, -0.0035190582275390625, -0.001239776611328125, 0.0010395050048828125, 0.00331878662109375, 0.0055980682373046875, 0.007877349853515625, 0.010156631469726562, 0.0124359130859375, 0.014715194702148438, 0.016994476318359375, 0.019273757934570312, 0.02155303955078125, 0.023832321166992188, 0.026111602783203125, 0.028390884399414062, 0.030670166015625, 0.03294944763183594, 0.035228729248046875, 0.03750801086425781, 0.03978729248046875, 0.04206657409667969, 0.044345855712890625, 0.04662513732910156, 0.0489044189453125, 0.05118370056152344, 0.053462982177734375, 0.05574226379394531, 0.05802154541015625, 0.06030082702636719, 0.06258010864257812, 0.06485939025878906, 0.067138671875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 4.0, 11.0, 12.0, 42.0, 67.0, 78.0, 98.0, 129.0, 132.0, 94.0, 108.0, 73.0, 51.0, 39.0, 34.0, 18.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.1436989307403564, -1.1205778121948242, -1.0974565744400024, -1.0743354558944702, -1.0512142181396484, -1.0280930995941162, -1.0049718618392944, -0.9818507432937622, -0.9587295055389404, -0.9356083273887634, -0.9124871492385864, -0.8893659710884094, -0.8662447929382324, -0.8431236147880554, -0.8200024366378784, -0.7968813180923462, -0.7737601399421692, -0.7506389617919922, -0.7275177836418152, -0.7043966054916382, -0.6812754273414612, -0.6581542491912842, -0.635033130645752, -0.6119118928909302, -0.588790774345398, -0.565669596195221, -0.542548418045044, -0.5194272398948669, -0.49630606174468994, -0.47318488359451294, -0.4500637352466583, -0.4269425570964813, -0.40382134914398193, -0.38070017099380493, -0.35757899284362793, -0.3344578146934509, -0.3113366365432739, -0.2882154583930969, -0.2650943100452423, -0.2419731318950653, -0.2188519537448883, -0.1957307755947113, -0.1726095974445343, -0.1494884341955185, -0.1263672560453415, -0.10324607789516449, -0.08012491464614868, -0.05700373649597168, -0.03388255834579468, -0.010761383920907974, 0.01235979050397873, 0.035480961203575134, 0.058602139353752136, 0.08172331750392914, 0.10484448075294495, 0.12796565890312195, 0.15108683705329895, 0.17420801520347595, 0.19732919335365295, 0.22045035660266876, 0.24357153475284576, 0.2666926980018616, 0.2898138761520386, 0.3129350543022156, 0.3360562324523926]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 4.0, 11.0, 14.0, 15.0, 15.0, 15.0, 26.0, 11.0, 22.0, 28.0, 27.0, 31.0, 27.0, 42.0, 36.0, 46.0, 46.0, 42.0, 34.0, 49.0, 36.0, 40.0, 34.0, 33.0, 39.0, 30.0, 36.0, 32.0, 19.0, 16.0, 18.0, 26.0, 17.0, 11.0, 9.0, 12.0, 8.0, 10.0, 6.0, 3.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3224431872367859, -0.3119032084941864, -0.3013632297515869, -0.2908232510089874, -0.28028327226638794, -0.26974329352378845, -0.25920331478118896, -0.24866333603858948, -0.23812335729599, -0.2275833785533905, -0.21704339981079102, -0.20650342106819153, -0.19596344232559204, -0.18542346358299255, -0.17488348484039307, -0.16434350609779358, -0.15380354225635529, -0.1432635635137558, -0.1327235847711563, -0.12218360602855682, -0.11164362728595734, -0.10110364854335785, -0.09056367725133896, -0.08002369850873947, -0.06948371976613998, -0.0589437410235405, -0.04840376228094101, -0.03786378726363182, -0.027323808521032333, -0.016783829778432846, -0.006243854761123657, 0.00429612398147583, 0.014836102724075317, 0.025376081466674805, 0.03591606020927429, 0.04645603522658348, 0.05699601396918297, 0.06753599643707275, 0.07807596772909164, 0.08861594647169113, 0.09915592521429062, 0.1096959039568901, 0.1202358826994896, 0.13077585399150848, 0.14131583273410797, 0.15185581147670746, 0.16239579021930695, 0.17293576896190643, 0.18347574770450592, 0.1940157264471054, 0.2045557051897049, 0.21509568393230438, 0.22563566267490387, 0.23617564141750336, 0.24671560525894165, 0.25725558400154114, 0.2677955627441406, 0.2783355414867401, 0.2888755202293396, 0.2994154989719391, 0.3099554777145386, 0.32049545645713806, 0.33103543519973755, 0.34157541394233704, 0.3521153926849365]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 7.0, 9.0, 15.0, 15.0, 23.0, 29.0, 64.0, 107.0, 173.0, 281.0, 542.0, 1040.0, 2524.0, 6466.0, 19596.0, 77477.0, 510437.0, 2471629.0, 935573.0, 125440.0, 28446.0, 8601.0, 3085.0, 1333.0, 613.0, 318.0, 179.0, 95.0, 57.0, 28.0, 31.0, 17.0, 8.0, 7.0, 6.0, 5.0, 6.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08843994140625, -0.08588695526123047, -0.08333396911621094, -0.0807809829711914, -0.07822799682617188, -0.07567501068115234, -0.07312202453613281, -0.07056903839111328, -0.06801605224609375, -0.06546306610107422, -0.06291007995605469, -0.060357093811035156, -0.057804107666015625, -0.055251121520996094, -0.05269813537597656, -0.05014514923095703, -0.0475921630859375, -0.04503917694091797, -0.04248619079589844, -0.039933204650878906, -0.037380218505859375, -0.034827232360839844, -0.03227424621582031, -0.02972126007080078, -0.02716827392578125, -0.02461528778076172, -0.022062301635742188, -0.019509315490722656, -0.016956329345703125, -0.014403343200683594, -0.011850357055664062, -0.009297370910644531, -0.006744384765625, -0.004191398620605469, -0.0016384124755859375, 0.0009145736694335938, 0.003467559814453125, 0.006020545959472656, 0.008573532104492188, 0.011126518249511719, 0.01367950439453125, 0.01623249053955078, 0.018785476684570312, 0.021338462829589844, 0.023891448974609375, 0.026444435119628906, 0.028997421264648438, 0.03155040740966797, 0.0341033935546875, 0.03665637969970703, 0.03920936584472656, 0.041762351989746094, 0.044315338134765625, 0.046868324279785156, 0.04942131042480469, 0.05197429656982422, 0.05452728271484375, 0.05708026885986328, 0.05963325500488281, 0.062186241149902344, 0.06473922729492188, 0.0672922134399414, 0.06984519958496094, 0.07239818572998047, 0.074951171875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 9.0, 7.0, 14.0, 17.0, 20.0, 23.0, 33.0, 25.0, 37.0, 42.0, 51.0, 68.0, 63.0, 51.0, 62.0, 59.0, 53.0, 50.0, 48.0, 62.0, 43.0, 37.0, 31.0, 22.0, 17.0, 18.0, 12.0, 10.0, 7.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0535888671875, -0.051993370056152344, -0.05039787292480469, -0.04880237579345703, -0.047206878662109375, -0.04561138153076172, -0.04401588439941406, -0.042420387268066406, -0.04082489013671875, -0.039229393005371094, -0.03763389587402344, -0.03603839874267578, -0.034442901611328125, -0.03284740447998047, -0.03125190734863281, -0.029656410217285156, -0.0280609130859375, -0.026465415954589844, -0.024869918823242188, -0.02327442169189453, -0.021678924560546875, -0.02008342742919922, -0.018487930297851562, -0.016892433166503906, -0.01529693603515625, -0.013701438903808594, -0.012105941772460938, -0.010510444641113281, -0.008914947509765625, -0.007319450378417969, -0.0057239532470703125, -0.004128456115722656, -0.002532958984375, -0.0009374618530273438, 0.0006580352783203125, 0.0022535324096679688, 0.003849029541015625, 0.005444526672363281, 0.0070400238037109375, 0.008635520935058594, 0.01023101806640625, 0.011826515197753906, 0.013422012329101562, 0.015017509460449219, 0.016613006591796875, 0.01820850372314453, 0.019804000854492188, 0.021399497985839844, 0.0229949951171875, 0.024590492248535156, 0.026185989379882812, 0.02778148651123047, 0.029376983642578125, 0.03097248077392578, 0.03256797790527344, 0.034163475036621094, 0.03575897216796875, 0.037354469299316406, 0.03894996643066406, 0.04054546356201172, 0.042140960693359375, 0.04373645782470703, 0.04533195495605469, 0.046927452087402344, 0.04852294921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 17.0, 7.0, 23.0, 41.0, 59.0, 120.0, 188.0, 302.0, 599.0, 1293.0, 2805.0, 7604.0, 24441.0, 112993.0, 852593.0, 2582129.0, 505662.0, 75021.0, 17975.0, 5856.0, 2287.0, 1038.0, 521.0, 315.0, 168.0, 85.0, 51.0, 33.0, 19.0, 13.0, 9.0, 9.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1346435546875, -0.13138961791992188, -0.12813568115234375, -0.12488174438476562, -0.1216278076171875, -0.11837387084960938, -0.11511993408203125, -0.11186599731445312, -0.108612060546875, -0.10535812377929688, -0.10210418701171875, -0.09885025024414062, -0.0955963134765625, -0.09234237670898438, -0.08908843994140625, -0.08583450317382812, -0.08258056640625, -0.07932662963867188, -0.07607269287109375, -0.07281875610351562, -0.0695648193359375, -0.06631088256835938, -0.06305694580078125, -0.059803009033203125, -0.056549072265625, -0.053295135498046875, -0.05004119873046875, -0.046787261962890625, -0.0435333251953125, -0.040279388427734375, -0.03702545166015625, -0.033771514892578125, -0.030517578125, -0.027263641357421875, -0.02400970458984375, -0.020755767822265625, -0.0175018310546875, -0.014247894287109375, -0.01099395751953125, -0.007740020751953125, -0.004486083984375, -0.001232147216796875, 0.00202178955078125, 0.005275726318359375, 0.0085296630859375, 0.011783599853515625, 0.01503753662109375, 0.018291473388671875, 0.02154541015625, 0.024799346923828125, 0.02805328369140625, 0.031307220458984375, 0.0345611572265625, 0.037815093994140625, 0.04106903076171875, 0.044322967529296875, 0.047576904296875, 0.050830841064453125, 0.05408477783203125, 0.057338714599609375, 0.0605926513671875, 0.06384658813476562, 0.06710052490234375, 0.07035446166992188, 0.0736083984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 12.0, 5.0, 28.0, 28.0, 50.0, 55.0, 88.0, 161.0, 255.0, 391.0, 633.0, 703.0, 581.0, 387.0, 264.0, 161.0, 76.0, 66.0, 40.0, 24.0, 16.0, 15.0, 10.0, 5.0, 8.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062347412109375, -0.05931520462036133, -0.056282997131347656, -0.053250789642333984, -0.05021858215332031, -0.04718637466430664, -0.04415416717529297, -0.0411219596862793, -0.038089752197265625, -0.03505754470825195, -0.03202533721923828, -0.02899312973022461, -0.025960922241210938, -0.022928714752197266, -0.019896507263183594, -0.016864299774169922, -0.01383209228515625, -0.010799884796142578, -0.007767677307128906, -0.004735469818115234, -0.0017032623291015625, 0.0013289451599121094, 0.004361152648925781, 0.007393360137939453, 0.010425567626953125, 0.013457775115966797, 0.01648998260498047, 0.01952219009399414, 0.022554397583007812, 0.025586605072021484, 0.028618812561035156, 0.03165102005004883, 0.0346832275390625, 0.03771543502807617, 0.040747642517089844, 0.043779850006103516, 0.04681205749511719, 0.04984426498413086, 0.05287647247314453, 0.0559086799621582, 0.058940887451171875, 0.06197309494018555, 0.06500530242919922, 0.06803750991821289, 0.07106971740722656, 0.07410192489624023, 0.0771341323852539, 0.08016633987426758, 0.08319854736328125, 0.08623075485229492, 0.0892629623413086, 0.09229516983032227, 0.09532737731933594, 0.09835958480834961, 0.10139179229736328, 0.10442399978637695, 0.10745620727539062, 0.1104884147644043, 0.11352062225341797, 0.11655282974243164, 0.11958503723144531, 0.12261724472045898, 0.12564945220947266, 0.12868165969848633, 0.1317138671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 12.0, 16.0, 15.0, 26.0, 29.0, 39.0, 39.0, 47.0, 71.0, 64.0, 79.0, 83.0, 82.0, 82.0, 59.0, 50.0, 34.0, 48.0, 32.0, 26.0, 17.0, 14.0, 10.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2281726896762848, -0.2185133844614029, -0.2088540941476822, -0.1991947889328003, -0.1895354986190796, -0.1798761934041977, -0.1702168881893158, -0.1605575978755951, -0.1508982926607132, -0.1412389874458313, -0.1315796971321106, -0.1219203919172287, -0.1122610941529274, -0.1026017963886261, -0.0929424911737442, -0.0832831934094429, -0.0736238956451416, -0.0639645978808403, -0.0543052963912487, -0.044645994901657104, -0.034986697137355804, -0.025327399373054504, -0.015668097883462906, -0.006008796393871307, 0.0036505013704299927, 0.013309800997376442, 0.02296910062432289, 0.03262840211391449, 0.04228769987821579, 0.05194699764251709, 0.06160629913210869, 0.07126560062170029, 0.0809248685836792, 0.0905841663479805, 0.1002434641122818, 0.1099027693271637, 0.119562067091465, 0.1292213648557663, 0.1388806700706482, 0.1485399603843689, 0.1581992655992508, 0.1678585708141327, 0.1775178611278534, 0.1871771663427353, 0.1968364715576172, 0.2064957618713379, 0.2161550670862198, 0.22581437230110168, 0.2354736626148224, 0.24513296782970428, 0.2547922730445862, 0.2644515633583069, 0.2741108536720276, 0.2837701439857483, 0.2934294641017914, 0.3030887544155121, 0.3127480745315552, 0.3224073648452759, 0.33206668496131897, 0.3417259752750397, 0.3513852655887604, 0.36104458570480347, 0.37070387601852417, 0.3803631663322449, 0.3900224566459656]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 10.0, 8.0, 5.0, 20.0, 14.0, 15.0, 25.0, 19.0, 20.0, 21.0, 43.0, 39.0, 34.0, 50.0, 40.0, 45.0, 48.0, 35.0, 56.0, 43.0, 27.0, 52.0, 49.0, 44.0, 37.0, 26.0, 28.0, 29.0, 25.0, 20.0, 12.0, 13.0, 17.0, 10.0, 7.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3033410310745239, -0.2945897579193115, -0.2858384847640991, -0.2770872116088867, -0.2683359384536743, -0.2595846652984619, -0.2508333921432495, -0.24208210408687592, -0.2333308309316635, -0.2245795577764511, -0.2158282846212387, -0.2070770114660263, -0.1983257234096527, -0.1895744502544403, -0.1808231770992279, -0.1720719039440155, -0.1633206307888031, -0.1545693576335907, -0.1458180844783783, -0.1370668113231659, -0.1283155381679535, -0.11956425756216049, -0.11081297695636749, -0.10206170380115509, -0.09331043064594269, -0.08455915749073029, -0.07580788433551788, -0.06705660372972488, -0.05830533057451248, -0.04955405741930008, -0.04080278053879738, -0.03205150365829468, -0.023300230503082275, -0.014548955485224724, -0.005797680467367172, 0.0029535945504903793, 0.011704869568347931, 0.020456142723560333, 0.029207419604063034, 0.037958696484565735, 0.04670996963977814, 0.05546124279499054, 0.06421251595020294, 0.07296379655599594, 0.08171506971120834, 0.09046634286642075, 0.09921762347221375, 0.10796889662742615, 0.11672016978263855, 0.12547144293785095, 0.13422271609306335, 0.14297398924827576, 0.15172526240348816, 0.16047653555870056, 0.16922782361507416, 0.17797909677028656, 0.18673036992549896, 0.19548164308071136, 0.20423291623592377, 0.21298418939113617, 0.22173547744750977, 0.23048675060272217, 0.23923802375793457, 0.24798929691314697, 0.2567405700683594]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 13.0, 9.0, 11.0, 22.0, 27.0, 40.0, 63.0, 69.0, 126.0, 208.0, 291.0, 684.0, 1241.0, 2307.0, 4890.0, 9884.0, 20999.0, 45868.0, 114073.0, 295207.0, 323825.0, 131328.0, 51927.0, 23162.0, 11097.0, 5481.0, 2595.0, 1393.0, 706.0, 408.0, 217.0, 151.0, 78.0, 44.0, 36.0, 22.0, 20.0, 6.0, 6.0, 4.0, 3.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11968994140625, -0.11557292938232422, -0.11145591735839844, -0.10733890533447266, -0.10322189331054688, -0.0991048812866211, -0.09498786926269531, -0.09087085723876953, -0.08675384521484375, -0.08263683319091797, -0.07851982116699219, -0.0744028091430664, -0.07028579711914062, -0.06616878509521484, -0.06205177307128906, -0.05793476104736328, -0.0538177490234375, -0.04970073699951172, -0.04558372497558594, -0.041466712951660156, -0.037349700927734375, -0.033232688903808594, -0.029115676879882812, -0.02499866485595703, -0.02088165283203125, -0.01676464080810547, -0.012647628784179688, -0.008530616760253906, -0.004413604736328125, -0.00029659271240234375, 0.0038204193115234375, 0.007937431335449219, 0.012054443359375, 0.01617145538330078, 0.020288467407226562, 0.024405479431152344, 0.028522491455078125, 0.032639503479003906, 0.03675651550292969, 0.04087352752685547, 0.04499053955078125, 0.04910755157470703, 0.05322456359863281, 0.057341575622558594, 0.061458587646484375, 0.06557559967041016, 0.06969261169433594, 0.07380962371826172, 0.0779266357421875, 0.08204364776611328, 0.08616065979003906, 0.09027767181396484, 0.09439468383789062, 0.0985116958618164, 0.10262870788574219, 0.10674571990966797, 0.11086273193359375, 0.11497974395751953, 0.11909675598144531, 0.1232137680053711, 0.12733078002929688, 0.13144779205322266, 0.13556480407714844, 0.13968181610107422, 0.143798828125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 7.0, 13.0, 20.0, 23.0, 20.0, 26.0, 39.0, 38.0, 39.0, 43.0, 49.0, 70.0, 65.0, 50.0, 55.0, 64.0, 61.0, 44.0, 54.0, 42.0, 35.0, 31.0, 26.0, 15.0, 24.0, 11.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05029296875, -0.048707008361816406, -0.04712104797363281, -0.04553508758544922, -0.043949127197265625, -0.04236316680908203, -0.04077720642089844, -0.039191246032714844, -0.03760528564453125, -0.036019325256347656, -0.03443336486816406, -0.03284740447998047, -0.031261444091796875, -0.02967548370361328, -0.028089523315429688, -0.026503562927246094, -0.0249176025390625, -0.023331642150878906, -0.021745681762695312, -0.02015972137451172, -0.018573760986328125, -0.01698780059814453, -0.015401840209960938, -0.013815879821777344, -0.01222991943359375, -0.010643959045410156, -0.009057998657226562, -0.007472038269042969, -0.005886077880859375, -0.004300117492675781, -0.0027141571044921875, -0.0011281967163085938, 0.000457763671875, 0.0020437240600585938, 0.0036296844482421875, 0.005215644836425781, 0.006801605224609375, 0.008387565612792969, 0.009973526000976562, 0.011559486389160156, 0.01314544677734375, 0.014731407165527344, 0.016317367553710938, 0.01790332794189453, 0.019489288330078125, 0.02107524871826172, 0.022661209106445312, 0.024247169494628906, 0.0258331298828125, 0.027419090270996094, 0.029005050659179688, 0.03059101104736328, 0.032176971435546875, 0.03376293182373047, 0.03534889221191406, 0.036934852600097656, 0.03852081298828125, 0.040106773376464844, 0.04169273376464844, 0.04327869415283203, 0.044864654541015625, 0.04645061492919922, 0.04803657531738281, 0.049622535705566406, 0.05120849609375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 18.0, 10.0, 22.0, 31.0, 37.0, 59.0, 93.0, 157.0, 256.0, 510.0, 1221.0, 3766.0, 12665.0, 45684.0, 184837.0, 519534.0, 208342.0, 50578.0, 13993.0, 4091.0, 1374.0, 550.0, 283.0, 133.0, 97.0, 55.0, 48.0, 34.0, 16.0, 17.0, 16.0, 10.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.17942237854003906, -0.17390823364257812, -0.1683940887451172, -0.16287994384765625, -0.1573657989501953, -0.15185165405273438, -0.14633750915527344, -0.1408233642578125, -0.13530921936035156, -0.12979507446289062, -0.12428092956542969, -0.11876678466796875, -0.11325263977050781, -0.10773849487304688, -0.10222434997558594, -0.096710205078125, -0.09119606018066406, -0.08568191528320312, -0.08016777038574219, -0.07465362548828125, -0.06913948059082031, -0.06362533569335938, -0.05811119079589844, -0.0525970458984375, -0.04708290100097656, -0.041568756103515625, -0.03605461120605469, -0.03054046630859375, -0.025026321411132812, -0.019512176513671875, -0.013998031616210938, -0.00848388671875, -0.0029697418212890625, 0.002544403076171875, 0.008058547973632812, 0.01357269287109375, 0.019086837768554688, 0.024600982666015625, 0.030115127563476562, 0.0356292724609375, 0.04114341735839844, 0.046657562255859375, 0.05217170715332031, 0.05768585205078125, 0.06319999694824219, 0.06871414184570312, 0.07422828674316406, 0.079742431640625, 0.08525657653808594, 0.09077072143554688, 0.09628486633300781, 0.10179901123046875, 0.10731315612792969, 0.11282730102539062, 0.11834144592285156, 0.1238555908203125, 0.12936973571777344, 0.13488388061523438, 0.1403980255126953, 0.14591217041015625, 0.1514263153076172, 0.15694046020507812, 0.16245460510253906, 0.16796875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 4.0, 12.0, 11.0, 12.0, 12.0, 19.0, 30.0, 28.0, 29.0, 33.0, 45.0, 44.0, 48.0, 52.0, 52.0, 60.0, 52.0, 52.0, 57.0, 43.0, 46.0, 44.0, 27.0, 42.0, 33.0, 21.0, 22.0, 15.0, 9.0, 8.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.130615234375, -0.12652969360351562, -0.12244415283203125, -0.11835861206054688, -0.1142730712890625, -0.11018753051757812, -0.10610198974609375, -0.10201644897460938, -0.097930908203125, -0.09384536743164062, -0.08975982666015625, -0.08567428588867188, -0.0815887451171875, -0.07750320434570312, -0.07341766357421875, -0.06933212280273438, -0.06524658203125, -0.061161041259765625, -0.05707550048828125, -0.052989959716796875, -0.0489044189453125, -0.044818878173828125, -0.04073333740234375, -0.036647796630859375, -0.032562255859375, -0.028476715087890625, -0.02439117431640625, -0.020305633544921875, -0.0162200927734375, -0.012134552001953125, -0.00804901123046875, -0.003963470458984375, 0.0001220703125, 0.004207611083984375, 0.00829315185546875, 0.012378692626953125, 0.0164642333984375, 0.020549774169921875, 0.02463531494140625, 0.028720855712890625, 0.032806396484375, 0.036891937255859375, 0.04097747802734375, 0.045063018798828125, 0.0491485595703125, 0.053234100341796875, 0.05731964111328125, 0.061405181884765625, 0.06549072265625, 0.06957626342773438, 0.07366180419921875, 0.07774734497070312, 0.0818328857421875, 0.08591842651367188, 0.09000396728515625, 0.09408950805664062, 0.098175048828125, 0.10226058959960938, 0.10634613037109375, 0.11043167114257812, 0.1145172119140625, 0.11860275268554688, 0.12268829345703125, 0.12677383422851562, 0.130859375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 18.0, 6.0, 15.0, 29.0, 47.0, 83.0, 114.0, 167.0, 211.0, 322.0, 583.0, 926.0, 1486.0, 2343.0, 3844.0, 5849.0, 9797.0, 15463.0, 24937.0, 40096.0, 71270.0, 139067.0, 230764.0, 218134.0, 122582.0, 63701.0, 36597.0, 22319.0, 14241.0, 8830.0, 5508.0, 3393.0, 2215.0, 1326.0, 807.0, 524.0, 334.0, 235.0, 127.0, 81.0, 45.0, 46.0, 29.0, 13.0, 11.0, 7.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04400634765625, -0.04274559020996094, -0.041484832763671875, -0.04022407531738281, -0.03896331787109375, -0.03770256042480469, -0.036441802978515625, -0.03518104553222656, -0.0339202880859375, -0.03265953063964844, -0.031398773193359375, -0.030138015747070312, -0.02887725830078125, -0.027616500854492188, -0.026355743408203125, -0.025094985961914062, -0.023834228515625, -0.022573471069335938, -0.021312713623046875, -0.020051956176757812, -0.01879119873046875, -0.017530441284179688, -0.016269683837890625, -0.015008926391601562, -0.0137481689453125, -0.012487411499023438, -0.011226654052734375, -0.009965896606445312, -0.00870513916015625, -0.0074443817138671875, -0.006183624267578125, -0.0049228668212890625, -0.003662109375, -0.0024013519287109375, -0.001140594482421875, 0.0001201629638671875, 0.00138092041015625, 0.0026416778564453125, 0.003902435302734375, 0.0051631927490234375, 0.0064239501953125, 0.0076847076416015625, 0.008945465087890625, 0.010206222534179688, 0.01146697998046875, 0.012727737426757812, 0.013988494873046875, 0.015249252319335938, 0.016510009765625, 0.017770767211914062, 0.019031524658203125, 0.020292282104492188, 0.02155303955078125, 0.022813796997070312, 0.024074554443359375, 0.025335311889648438, 0.0265960693359375, 0.027856826782226562, 0.029117584228515625, 0.030378341674804688, 0.03163909912109375, 0.03289985656738281, 0.034160614013671875, 0.03542137145996094, 0.03668212890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 8.0, 6.0, 3.0, 8.0, 15.0, 16.0, 19.0, 22.0, 28.0, 34.0, 39.0, 45.0, 56.0, 71.0, 59.0, 65.0, 65.0, 53.0, 58.0, 44.0, 67.0, 48.0, 36.0, 24.0, 13.0, 23.0, 19.0, 8.0, 12.0, 5.0, 3.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0623207092285156e-05, -1.9931234419345856e-05, -1.9239261746406555e-05, -1.8547289073467255e-05, -1.7855316400527954e-05, -1.7163343727588654e-05, -1.6471371054649353e-05, -1.5779398381710052e-05, -1.5087425708770752e-05, -1.4395453035831451e-05, -1.3703480362892151e-05, -1.301150768995285e-05, -1.231953501701355e-05, -1.162756234407425e-05, -1.0935589671134949e-05, -1.0243616998195648e-05, -9.551644325256348e-06, -8.859671652317047e-06, -8.167698979377747e-06, -7.475726306438446e-06, -6.7837536334991455e-06, -6.091780960559845e-06, -5.3998082876205444e-06, -4.707835614681244e-06, -4.015862941741943e-06, -3.323890268802643e-06, -2.6319175958633423e-06, -1.9399449229240417e-06, -1.2479722499847412e-06, -5.559995770454407e-07, 1.3597309589385986e-07, 8.279457688331604e-07, 1.519918441772461e-06, 2.2118911147117615e-06, 2.903863787651062e-06, 3.5958364605903625e-06, 4.287809133529663e-06, 4.979781806468964e-06, 5.671754479408264e-06, 6.363727152347565e-06, 7.055699825286865e-06, 7.747672498226166e-06, 8.439645171165466e-06, 9.131617844104767e-06, 9.823590517044067e-06, 1.0515563189983368e-05, 1.1207535862922668e-05, 1.1899508535861969e-05, 1.259148120880127e-05, 1.328345388174057e-05, 1.397542655467987e-05, 1.4667399227619171e-05, 1.535937190055847e-05, 1.6051344573497772e-05, 1.6743317246437073e-05, 1.7435289919376373e-05, 1.8127262592315674e-05, 1.8819235265254974e-05, 1.9511207938194275e-05, 2.0203180611133575e-05, 2.0895153284072876e-05, 2.1587125957012177e-05, 2.2279098629951477e-05, 2.2971071302890778e-05, 2.3663043975830078e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 9.0, 10.0, 12.0, 8.0, 36.0, 51.0, 64.0, 93.0, 144.0, 250.0, 416.0, 883.0, 1853.0, 4021.0, 9198.0, 20894.0, 47399.0, 120804.0, 359506.0, 309233.0, 100177.0, 40700.0, 18021.0, 7708.0, 3548.0, 1636.0, 823.0, 424.0, 238.0, 138.0, 102.0, 66.0, 26.0, 17.0, 12.0, 10.0, 6.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052215576171875, -0.050275325775146484, -0.04833507537841797, -0.04639482498168945, -0.04445457458496094, -0.04251432418823242, -0.040574073791503906, -0.03863382339477539, -0.036693572998046875, -0.03475332260131836, -0.032813072204589844, -0.030872821807861328, -0.028932571411132812, -0.026992321014404297, -0.02505207061767578, -0.023111820220947266, -0.02117156982421875, -0.019231319427490234, -0.01729106903076172, -0.015350818634033203, -0.013410568237304688, -0.011470317840576172, -0.009530067443847656, -0.007589817047119141, -0.005649566650390625, -0.0037093162536621094, -0.0017690658569335938, 0.00017118453979492188, 0.0021114349365234375, 0.004051685333251953, 0.005991935729980469, 0.007932186126708984, 0.0098724365234375, 0.011812686920166016, 0.013752937316894531, 0.015693187713623047, 0.017633438110351562, 0.019573688507080078, 0.021513938903808594, 0.02345418930053711, 0.025394439697265625, 0.02733469009399414, 0.029274940490722656, 0.031215190887451172, 0.03315544128417969, 0.0350956916809082, 0.03703594207763672, 0.038976192474365234, 0.04091644287109375, 0.042856693267822266, 0.04479694366455078, 0.0467371940612793, 0.04867744445800781, 0.05061769485473633, 0.052557945251464844, 0.05449819564819336, 0.056438446044921875, 0.05837869644165039, 0.060318946838378906, 0.06225919723510742, 0.06419944763183594, 0.06613969802856445, 0.06807994842529297, 0.07002019882202148, 0.07196044921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 5.0, 8.0, 6.0, 5.0, 11.0, 11.0, 11.0, 16.0, 17.0, 25.0, 21.0, 23.0, 35.0, 57.0, 72.0, 82.0, 90.0, 86.0, 73.0, 63.0, 49.0, 44.0, 42.0, 23.0, 26.0, 20.0, 12.0, 10.0, 10.0, 8.0, 7.0, 8.0, 6.0, 6.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.052093505859375, -0.050559043884277344, -0.04902458190917969, -0.04749011993408203, -0.045955657958984375, -0.04442119598388672, -0.04288673400878906, -0.041352272033691406, -0.03981781005859375, -0.038283348083496094, -0.03674888610839844, -0.03521442413330078, -0.033679962158203125, -0.03214550018310547, -0.030611038208007812, -0.029076576232910156, -0.0275421142578125, -0.026007652282714844, -0.024473190307617188, -0.02293872833251953, -0.021404266357421875, -0.01986980438232422, -0.018335342407226562, -0.016800880432128906, -0.01526641845703125, -0.013731956481933594, -0.012197494506835938, -0.010663032531738281, -0.009128570556640625, -0.007594108581542969, -0.0060596466064453125, -0.004525184631347656, -0.00299072265625, -0.0014562606811523438, 7.82012939453125e-05, 0.0016126632690429688, 0.003147125244140625, 0.004681587219238281, 0.0062160491943359375, 0.007750511169433594, 0.00928497314453125, 0.010819435119628906, 0.012353897094726562, 0.013888359069824219, 0.015422821044921875, 0.01695728302001953, 0.018491744995117188, 0.020026206970214844, 0.0215606689453125, 0.023095130920410156, 0.024629592895507812, 0.02616405487060547, 0.027698516845703125, 0.02923297882080078, 0.030767440795898438, 0.032301902770996094, 0.03383636474609375, 0.035370826721191406, 0.03690528869628906, 0.03843975067138672, 0.039974212646484375, 0.04150867462158203, 0.04304313659667969, 0.044577598571777344, 0.046112060546875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 26.0, 121.0, 264.0, 293.0, 180.0, 78.0, 32.0, 13.0, 4.0, 1.0, 1.0], "bins": [-2.8056085109710693, -2.755821943283081, -2.7060351371765137, -2.6562485694885254, -2.606462001800537, -2.556675434112549, -2.5068886280059814, -2.457102060317993, -2.407315492630005, -2.3575289249420166, -2.307742118835449, -2.257955551147461, -2.2081689834594727, -2.1583824157714844, -2.108595609664917, -2.0588090419769287, -2.0090224742889404, -1.9592357873916626, -1.9094492197036743, -1.8596625328063965, -1.8098759651184082, -1.7600892782211304, -1.710302710533142, -1.6605160236358643, -1.6107293367385864, -1.5609426498413086, -1.5111560821533203, -1.4613693952560425, -1.4115828275680542, -1.3617961406707764, -1.312009572982788, -1.2622228860855103, -1.2124361991882324, -1.1626495122909546, -1.1128629446029663, -1.0630762577056885, -1.0132896900177002, -0.9635030627250671, -0.9137164354324341, -0.8639297485351562, -0.814143180847168, -0.7643565535545349, -0.7145699262619019, -0.6647832989692688, -0.6149966716766357, -0.5652100443840027, -0.5154234170913696, -0.4656367599964142, -0.4158501625061035, -0.36606353521347046, -0.3162769079208374, -0.26649028062820435, -0.2167036384344101, -0.16691701114177704, -0.11713036894798279, -0.06734374165534973, -0.017557114362716675, 0.03222951665520668, 0.08201614767313004, 0.1318027824163437, 0.18158940970897675, 0.2313760370016098, 0.28116267919540405, 0.3309493064880371, 0.38073593378067017]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 15.0, 17.0, 11.0, 18.0, 18.0, 18.0, 27.0, 31.0, 29.0, 30.0, 43.0, 43.0, 46.0, 43.0, 47.0, 44.0, 57.0, 46.0, 34.0, 45.0, 40.0, 40.0, 22.0, 34.0, 29.0, 25.0, 32.0, 18.0, 19.0, 13.0, 15.0, 11.0, 6.0, 7.0, 5.0, 6.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3697403073310852, -0.3588676154613495, -0.34799495339393616, -0.33712226152420044, -0.3262495696544647, -0.315376877784729, -0.3045042157173157, -0.29363152384757996, -0.28275883197784424, -0.2718861401081085, -0.2610134780406952, -0.2501407861709595, -0.23926809430122375, -0.22839541733264923, -0.2175227403640747, -0.206650048494339, -0.19577738642692566, -0.18490470945835114, -0.17403201758861542, -0.1631593406200409, -0.15228664875030518, -0.14141397178173065, -0.13054129481315613, -0.11966861039400101, -0.10879592597484589, -0.09792324155569077, -0.08705055713653564, -0.07617788016796112, -0.065305195748806, -0.05443251132965088, -0.043559834361076355, -0.032687149941921234, -0.021814465522766113, -0.010941782966256142, -6.910040974617004e-05, 0.010803580284118652, 0.021676264703273773, 0.032548949122428894, 0.04342162609100342, 0.05429431051015854, 0.06516699492931366, 0.07603967934846878, 0.0869123637676239, 0.09778504073619843, 0.10865772515535355, 0.11953040957450867, 0.1304030865430832, 0.14127576351165771, 0.15214845538139343, 0.16302113234996796, 0.17389382421970367, 0.1847665011882782, 0.19563919305801392, 0.20651187002658844, 0.21738454699516296, 0.22825723886489868, 0.2391299158334732, 0.25000259280204773, 0.26087528467178345, 0.2717479467391968, 0.2826206386089325, 0.2934933304786682, 0.30436599254608154, 0.31523868441581726, 0.326111376285553]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 9.0, 18.0, 24.0, 46.0, 74.0, 87.0, 155.0, 257.0, 458.0, 871.0, 1637.0, 3173.0, 7169.0, 18760.0, 59948.0, 266926.0, 1458100.0, 1864577.0, 390333.0, 81018.0, 24049.0, 8856.0, 3788.0, 1787.0, 933.0, 530.0, 268.0, 171.0, 88.0, 65.0, 43.0, 24.0, 12.0, 10.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.09527587890625, -0.09283971786499023, -0.09040355682373047, -0.0879673957824707, -0.08553123474121094, -0.08309507369995117, -0.0806589126586914, -0.07822275161743164, -0.07578659057617188, -0.07335042953491211, -0.07091426849365234, -0.06847810745239258, -0.06604194641113281, -0.06360578536987305, -0.06116962432861328, -0.058733463287353516, -0.05629730224609375, -0.053861141204833984, -0.05142498016357422, -0.04898881912231445, -0.04655265808105469, -0.04411649703979492, -0.041680335998535156, -0.03924417495727539, -0.036808013916015625, -0.03437185287475586, -0.031935691833496094, -0.029499530792236328, -0.027063369750976562, -0.024627208709716797, -0.02219104766845703, -0.019754886627197266, -0.0173187255859375, -0.014882564544677734, -0.012446403503417969, -0.010010242462158203, -0.0075740814208984375, -0.005137920379638672, -0.0027017593383789062, -0.0002655982971191406, 0.002170562744140625, 0.004606723785400391, 0.007042884826660156, 0.009479045867919922, 0.011915206909179688, 0.014351367950439453, 0.01678752899169922, 0.019223690032958984, 0.02165985107421875, 0.024096012115478516, 0.02653217315673828, 0.028968334197998047, 0.03140449523925781, 0.03384065628051758, 0.036276817321777344, 0.03871297836303711, 0.041149139404296875, 0.04358530044555664, 0.046021461486816406, 0.04845762252807617, 0.05089378356933594, 0.0533299446105957, 0.05576610565185547, 0.058202266693115234, 0.060638427734375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 4.0, 7.0, 13.0, 16.0, 20.0, 23.0, 34.0, 43.0, 32.0, 53.0, 39.0, 47.0, 58.0, 41.0, 51.0, 43.0, 55.0, 54.0, 44.0, 47.0, 45.0, 38.0, 27.0, 37.0, 31.0, 23.0, 10.0, 21.0, 7.0, 18.0, 3.0, 3.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05517578125, -0.05360746383666992, -0.052039146423339844, -0.050470829010009766, -0.04890251159667969, -0.04733419418334961, -0.04576587677001953, -0.04419755935668945, -0.042629241943359375, -0.0410609245300293, -0.03949260711669922, -0.03792428970336914, -0.03635597229003906, -0.034787654876708984, -0.033219337463378906, -0.03165102005004883, -0.03008270263671875, -0.028514385223388672, -0.026946067810058594, -0.025377750396728516, -0.023809432983398438, -0.02224111557006836, -0.02067279815673828, -0.019104480743408203, -0.017536163330078125, -0.015967845916748047, -0.014399528503417969, -0.01283121109008789, -0.011262893676757812, -0.009694576263427734, -0.008126258850097656, -0.006557941436767578, -0.0049896240234375, -0.003421306610107422, -0.0018529891967773438, -0.0002846717834472656, 0.0012836456298828125, 0.0028519630432128906, 0.004420280456542969, 0.005988597869873047, 0.007556915283203125, 0.009125232696533203, 0.010693550109863281, 0.01226186752319336, 0.013830184936523438, 0.015398502349853516, 0.016966819763183594, 0.018535137176513672, 0.02010345458984375, 0.021671772003173828, 0.023240089416503906, 0.024808406829833984, 0.026376724243164062, 0.02794504165649414, 0.02951335906982422, 0.031081676483154297, 0.032649993896484375, 0.03421831130981445, 0.03578662872314453, 0.03735494613647461, 0.03892326354980469, 0.040491580963134766, 0.042059898376464844, 0.04362821578979492, 0.045196533203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 6.0, 11.0, 27.0, 35.0, 53.0, 84.0, 162.0, 237.0, 388.0, 722.0, 1389.0, 2884.0, 6544.0, 18048.0, 63976.0, 346163.0, 2094329.0, 1388322.0, 204601.0, 42848.0, 13369.0, 5213.0, 2318.0, 1127.0, 595.0, 317.0, 197.0, 116.0, 72.0, 46.0, 26.0, 12.0, 19.0, 12.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11126708984375, -0.10741138458251953, -0.10355567932128906, -0.0996999740600586, -0.09584426879882812, -0.09198856353759766, -0.08813285827636719, -0.08427715301513672, -0.08042144775390625, -0.07656574249267578, -0.07271003723144531, -0.06885433197021484, -0.06499862670898438, -0.061142921447753906, -0.05728721618652344, -0.05343151092529297, -0.0495758056640625, -0.04572010040283203, -0.04186439514160156, -0.038008689880371094, -0.034152984619140625, -0.030297279357910156, -0.026441574096679688, -0.02258586883544922, -0.01873016357421875, -0.014874458312988281, -0.011018753051757812, -0.007163047790527344, -0.003307342529296875, 0.0005483627319335938, 0.0044040679931640625, 0.008259773254394531, 0.012115478515625, 0.01597118377685547, 0.019826889038085938, 0.023682594299316406, 0.027538299560546875, 0.031394004821777344, 0.03524971008300781, 0.03910541534423828, 0.04296112060546875, 0.04681682586669922, 0.05067253112792969, 0.054528236389160156, 0.058383941650390625, 0.062239646911621094, 0.06609535217285156, 0.06995105743408203, 0.0738067626953125, 0.07766246795654297, 0.08151817321777344, 0.0853738784790039, 0.08922958374023438, 0.09308528900146484, 0.09694099426269531, 0.10079669952392578, 0.10465240478515625, 0.10850811004638672, 0.11236381530761719, 0.11621952056884766, 0.12007522583007812, 0.1239309310913086, 0.12778663635253906, 0.13164234161376953, 0.135498046875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 9.0, 18.0, 33.0, 33.0, 32.0, 73.0, 147.0, 194.0, 305.0, 504.0, 653.0, 698.0, 498.0, 330.0, 201.0, 108.0, 78.0, 47.0, 36.0, 16.0, 17.0, 13.0, 8.0, 2.0, 7.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.07871246337890625, -0.0747833251953125, -0.07085418701171875, -0.066925048828125, -0.06299591064453125, -0.0590667724609375, -0.05513763427734375, -0.05120849609375, -0.04727935791015625, -0.0433502197265625, -0.03942108154296875, -0.035491943359375, -0.03156280517578125, -0.0276336669921875, -0.02370452880859375, -0.019775390625, -0.01584625244140625, -0.0119171142578125, -0.00798797607421875, -0.004058837890625, -0.00012969970703125, 0.0037994384765625, 0.00772857666015625, 0.01165771484375, 0.01558685302734375, 0.0195159912109375, 0.02344512939453125, 0.027374267578125, 0.03130340576171875, 0.0352325439453125, 0.03916168212890625, 0.0430908203125, 0.04701995849609375, 0.0509490966796875, 0.05487823486328125, 0.058807373046875, 0.06273651123046875, 0.0666656494140625, 0.07059478759765625, 0.07452392578125, 0.07845306396484375, 0.0823822021484375, 0.08631134033203125, 0.090240478515625, 0.09416961669921875, 0.0980987548828125, 0.10202789306640625, 0.10595703125, 0.10988616943359375, 0.1138153076171875, 0.11774444580078125, 0.121673583984375, 0.12560272216796875, 0.1295318603515625, 0.13346099853515625, 0.13739013671875, 0.14131927490234375, 0.1452484130859375, 0.14917755126953125, 0.153106689453125, 0.15703582763671875, 0.1609649658203125, 0.16489410400390625, 0.1688232421875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 8.0, 9.0, 20.0, 52.0, 55.0, 125.0, 134.0, 161.0, 161.0, 115.0, 78.0, 53.0, 18.0, 9.0, 7.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1258838176727295, -1.0969610214233398, -1.0680381059646606, -1.039115309715271, -1.0101925134658813, -0.9812695980072021, -0.9523468017578125, -0.9234239459037781, -0.8945010900497437, -0.8655782341957092, -0.8366554379463196, -0.8077325820922852, -0.7788097262382507, -0.7498868703842163, -0.7209640741348267, -0.6920412182807922, -0.6631183624267578, -0.6341955065727234, -0.6052727103233337, -0.5763498544692993, -0.5474269986152649, -0.5185041427612305, -0.4895813465118408, -0.4606584906578064, -0.43173569440841675, -0.4028128683567047, -0.3738900125026703, -0.34496718645095825, -0.31604433059692383, -0.2871215045452118, -0.25819867849349976, -0.22927582263946533, -0.2003529667854309, -0.17143012583255768, -0.14250728487968445, -0.11358445137739182, -0.08466161042451859, -0.05573877692222595, -0.026815935969352722, 0.002106904983520508, 0.031029745936393738, 0.05995258688926697, 0.0888754278421402, 0.11779826134443283, 0.14672109484672546, 0.1756439357995987, 0.20456677675247192, 0.23348961770534515, 0.2624124586582184, 0.2913352847099304, 0.32025814056396484, 0.3491809666156769, 0.3781038224697113, 0.40702664852142334, 0.43594950437545776, 0.4648723304271698, 0.49379515647888184, 0.5227180123329163, 0.5516408085823059, 0.5805636644363403, 0.6094865202903748, 0.6384093761444092, 0.6673321723937988, 0.6962550282478333, 0.7251778841018677]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 9.0, 10.0, 4.0, 12.0, 9.0, 12.0, 13.0, 11.0, 16.0, 19.0, 23.0, 24.0, 36.0, 39.0, 39.0, 38.0, 38.0, 54.0, 43.0, 56.0, 44.0, 51.0, 31.0, 42.0, 39.0, 47.0, 38.0, 23.0, 37.0, 23.0, 31.0, 17.0, 18.0, 13.0, 13.0, 14.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-0.4480839967727661, -0.43620961904525757, -0.424335241317749, -0.4124608635902405, -0.40058648586273193, -0.3887121081352234, -0.37683773040771484, -0.3649633526802063, -0.35308897495269775, -0.3412145972251892, -0.32934021949768066, -0.3174658417701721, -0.3055914640426636, -0.29371708631515503, -0.2818427085876465, -0.26996833086013794, -0.2580939531326294, -0.24621957540512085, -0.2343451976776123, -0.22247081995010376, -0.21059644222259521, -0.19872206449508667, -0.18684768676757812, -0.17497330904006958, -0.16309893131256104, -0.1512245535850525, -0.13935017585754395, -0.1274757981300354, -0.11560142040252686, -0.10372704267501831, -0.09185266494750977, -0.07997828722000122, -0.06810390949249268, -0.05622953176498413, -0.044355154037475586, -0.03248077630996704, -0.020606398582458496, -0.008732020854949951, 0.0031423568725585938, 0.015016734600067139, 0.026891112327575684, 0.03876549005508423, 0.05063986778259277, 0.06251424551010132, 0.07438862323760986, 0.08626300096511841, 0.09813737869262695, 0.1100117564201355, 0.12188613414764404, 0.1337605118751526, 0.14563488960266113, 0.15750926733016968, 0.16938364505767822, 0.18125802278518677, 0.1931324005126953, 0.20500677824020386, 0.2168811559677124, 0.22875553369522095, 0.2406299114227295, 0.25250428915023804, 0.2643786668777466, 0.2762530446052551, 0.28812742233276367, 0.3000018000602722, 0.31187617778778076]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 5.0, 18.0, 14.0, 17.0, 24.0, 56.0, 60.0, 110.0, 152.0, 314.0, 432.0, 790.0, 1401.0, 2408.0, 4229.0, 7405.0, 13126.0, 22796.0, 40306.0, 71674.0, 131119.0, 224158.0, 226836.0, 133300.0, 72697.0, 40775.0, 23293.0, 13157.0, 7656.0, 4281.0, 2429.0, 1417.0, 810.0, 480.0, 275.0, 192.0, 113.0, 76.0, 47.0, 20.0, 19.0, 14.0, 16.0, 10.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.1134033203125, -0.11006927490234375, -0.1067352294921875, -0.10340118408203125, -0.100067138671875, -0.09673309326171875, -0.0933990478515625, -0.09006500244140625, -0.08673095703125, -0.08339691162109375, -0.0800628662109375, -0.07672882080078125, -0.073394775390625, -0.07006072998046875, -0.0667266845703125, -0.06339263916015625, -0.06005859375, -0.05672454833984375, -0.0533905029296875, -0.05005645751953125, -0.046722412109375, -0.04338836669921875, -0.0400543212890625, -0.03672027587890625, -0.03338623046875, -0.03005218505859375, -0.0267181396484375, -0.02338409423828125, -0.020050048828125, -0.01671600341796875, -0.0133819580078125, -0.01004791259765625, -0.0067138671875, -0.00337982177734375, -4.57763671875e-05, 0.00328826904296875, 0.006622314453125, 0.00995635986328125, 0.0132904052734375, 0.01662445068359375, 0.01995849609375, 0.02329254150390625, 0.0266265869140625, 0.02996063232421875, 0.033294677734375, 0.03662872314453125, 0.0399627685546875, 0.04329681396484375, 0.046630859375, 0.04996490478515625, 0.0532989501953125, 0.05663299560546875, 0.059967041015625, 0.06330108642578125, 0.0666351318359375, 0.06996917724609375, 0.07330322265625, 0.07663726806640625, 0.0799713134765625, 0.08330535888671875, 0.086639404296875, 0.08997344970703125, 0.0933074951171875, 0.09664154052734375, 0.0999755859375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 11.0, 7.0, 15.0, 18.0, 24.0, 26.0, 22.0, 32.0, 31.0, 41.0, 66.0, 48.0, 51.0, 46.0, 62.0, 54.0, 53.0, 64.0, 61.0, 46.0, 31.0, 29.0, 31.0, 22.0, 25.0, 20.0, 16.0, 17.0, 11.0, 5.0, 12.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0623779296875, -0.0605926513671875, -0.058807373046875, -0.0570220947265625, -0.05523681640625, -0.0534515380859375, -0.051666259765625, -0.0498809814453125, -0.048095703125, -0.0463104248046875, -0.044525146484375, -0.0427398681640625, -0.04095458984375, -0.0391693115234375, -0.037384033203125, -0.0355987548828125, -0.0338134765625, -0.0320281982421875, -0.030242919921875, -0.0284576416015625, -0.02667236328125, -0.0248870849609375, -0.023101806640625, -0.0213165283203125, -0.01953125, -0.0177459716796875, -0.015960693359375, -0.0141754150390625, -0.01239013671875, -0.0106048583984375, -0.008819580078125, -0.0070343017578125, -0.0052490234375, -0.0034637451171875, -0.001678466796875, 0.0001068115234375, 0.00189208984375, 0.0036773681640625, 0.005462646484375, 0.0072479248046875, 0.009033203125, 0.0108184814453125, 0.012603759765625, 0.0143890380859375, 0.01617431640625, 0.0179595947265625, 0.019744873046875, 0.0215301513671875, 0.0233154296875, 0.0251007080078125, 0.026885986328125, 0.0286712646484375, 0.03045654296875, 0.0322418212890625, 0.034027099609375, 0.0358123779296875, 0.03759765625, 0.0393829345703125, 0.041168212890625, 0.0429534912109375, 0.04473876953125, 0.0465240478515625, 0.048309326171875, 0.0500946044921875, 0.0518798828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 13.0, 10.0, 12.0, 13.0, 17.0, 30.0, 45.0, 78.0, 78.0, 135.0, 187.0, 311.0, 559.0, 1109.0, 2176.0, 4480.0, 9333.0, 20327.0, 44982.0, 106326.0, 278852.0, 336461.0, 138776.0, 56205.0, 25128.0, 11844.0, 5356.0, 2707.0, 1316.0, 651.0, 358.0, 226.0, 109.0, 94.0, 73.0, 51.0, 46.0, 21.0, 11.0, 5.0, 10.0, 5.0, 9.0, 5.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1510009765625, -0.14581871032714844, -0.14063644409179688, -0.1354541778564453, -0.13027191162109375, -0.1250896453857422, -0.11990737915039062, -0.11472511291503906, -0.1095428466796875, -0.10436058044433594, -0.09917831420898438, -0.09399604797363281, -0.08881378173828125, -0.08363151550292969, -0.07844924926757812, -0.07326698303222656, -0.068084716796875, -0.06290245056152344, -0.057720184326171875, -0.05253791809082031, -0.04735565185546875, -0.04217338562011719, -0.036991119384765625, -0.03180885314941406, -0.0266265869140625, -0.021444320678710938, -0.016262054443359375, -0.011079788208007812, -0.00589752197265625, -0.0007152557373046875, 0.004467010498046875, 0.009649276733398438, 0.01483154296875, 0.020013809204101562, 0.025196075439453125, 0.030378341674804688, 0.03556060791015625, 0.04074287414550781, 0.045925140380859375, 0.05110740661621094, 0.0562896728515625, 0.06147193908691406, 0.06665420532226562, 0.07183647155761719, 0.07701873779296875, 0.08220100402832031, 0.08738327026367188, 0.09256553649902344, 0.097747802734375, 0.10293006896972656, 0.10811233520507812, 0.11329460144042969, 0.11847686767578125, 0.12365913391113281, 0.12884140014648438, 0.13402366638183594, 0.1392059326171875, 0.14438819885253906, 0.14957046508789062, 0.1547527313232422, 0.15993499755859375, 0.1651172637939453, 0.17029953002929688, 0.17548179626464844, 0.1806640625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 8.0, 17.0, 12.0, 20.0, 22.0, 22.0, 23.0, 28.0, 34.0, 33.0, 36.0, 49.0, 36.0, 52.0, 48.0, 62.0, 32.0, 50.0, 59.0, 46.0, 33.0, 52.0, 43.0, 24.0, 26.0, 29.0, 23.0, 16.0, 14.0, 7.0, 8.0, 4.0, 5.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.20556640625, -0.20009231567382812, -0.19461822509765625, -0.18914413452148438, -0.1836700439453125, -0.17819595336914062, -0.17272186279296875, -0.16724777221679688, -0.161773681640625, -0.15629959106445312, -0.15082550048828125, -0.14535140991210938, -0.1398773193359375, -0.13440322875976562, -0.12892913818359375, -0.12345504760742188, -0.11798095703125, -0.11250686645507812, -0.10703277587890625, -0.10155868530273438, -0.0960845947265625, -0.09061050415039062, -0.08513641357421875, -0.07966232299804688, -0.074188232421875, -0.06871414184570312, -0.06324005126953125, -0.057765960693359375, -0.0522918701171875, -0.046817779541015625, -0.04134368896484375, -0.035869598388671875, -0.0303955078125, -0.024921417236328125, -0.01944732666015625, -0.013973236083984375, -0.0084991455078125, -0.003025054931640625, 0.00244903564453125, 0.007923126220703125, 0.013397216796875, 0.018871307373046875, 0.02434539794921875, 0.029819488525390625, 0.0352935791015625, 0.040767669677734375, 0.04624176025390625, 0.051715850830078125, 0.05718994140625, 0.06266403198242188, 0.06813812255859375, 0.07361221313476562, 0.0790863037109375, 0.08456039428710938, 0.09003448486328125, 0.09550857543945312, 0.100982666015625, 0.10645675659179688, 0.11193084716796875, 0.11740493774414062, 0.1228790283203125, 0.12835311889648438, 0.13382720947265625, 0.13930130004882812, 0.144775390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 5.0, 15.0, 12.0, 22.0, 38.0, 73.0, 96.0, 135.0, 244.0, 383.0, 630.0, 1031.0, 1963.0, 3486.0, 6593.0, 12323.0, 23111.0, 43940.0, 84038.0, 160456.0, 258611.0, 211459.0, 113235.0, 59503.0, 31028.0, 16586.0, 8864.0, 4604.0, 2612.0, 1365.0, 873.0, 472.0, 275.0, 169.0, 108.0, 62.0, 42.0, 21.0, 20.0, 15.0, 11.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05731201171875, -0.05544710159301758, -0.053582191467285156, -0.051717281341552734, -0.04985237121582031, -0.04798746109008789, -0.04612255096435547, -0.04425764083862305, -0.042392730712890625, -0.0405278205871582, -0.03866291046142578, -0.03679800033569336, -0.03493309020996094, -0.033068180084228516, -0.031203269958496094, -0.029338359832763672, -0.02747344970703125, -0.025608539581298828, -0.023743629455566406, -0.021878719329833984, -0.020013809204101562, -0.01814889907836914, -0.01628398895263672, -0.014419078826904297, -0.012554168701171875, -0.010689258575439453, -0.008824348449707031, -0.006959438323974609, -0.0050945281982421875, -0.0032296180725097656, -0.0013647079467773438, 0.0005002021789550781, 0.0023651123046875, 0.004230022430419922, 0.006094932556152344, 0.007959842681884766, 0.009824752807617188, 0.01168966293334961, 0.013554573059082031, 0.015419483184814453, 0.017284393310546875, 0.019149303436279297, 0.02101421356201172, 0.02287912368774414, 0.024744033813476562, 0.026608943939208984, 0.028473854064941406, 0.030338764190673828, 0.03220367431640625, 0.03406858444213867, 0.035933494567871094, 0.037798404693603516, 0.03966331481933594, 0.04152822494506836, 0.04339313507080078, 0.0452580451965332, 0.047122955322265625, 0.04898786544799805, 0.05085277557373047, 0.05271768569946289, 0.05458259582519531, 0.056447505950927734, 0.058312416076660156, 0.06017732620239258, 0.062042236328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 5.0, 5.0, 8.0, 7.0, 8.0, 6.0, 15.0, 11.0, 23.0, 14.0, 29.0, 30.0, 46.0, 49.0, 58.0, 58.0, 60.0, 61.0, 72.0, 78.0, 46.0, 52.0, 51.0, 34.0, 22.0, 33.0, 33.0, 18.0, 17.0, 7.0, 5.0, 5.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4080276489257812e-05, -2.3369677364826202e-05, -2.2659078240394592e-05, -2.1948479115962982e-05, -2.1237879991531372e-05, -2.0527280867099762e-05, -1.9816681742668152e-05, -1.9106082618236542e-05, -1.839548349380493e-05, -1.768488436937332e-05, -1.697428524494171e-05, -1.62636861205101e-05, -1.555308699607849e-05, -1.4842487871646881e-05, -1.4131888747215271e-05, -1.3421289622783661e-05, -1.271069049835205e-05, -1.200009137392044e-05, -1.128949224948883e-05, -1.057889312505722e-05, -9.86829400062561e-06, -9.157694876194e-06, -8.44709575176239e-06, -7.73649662733078e-06, -7.02589750289917e-06, -6.31529837846756e-06, -5.60469925403595e-06, -4.89410012960434e-06, -4.1835010051727295e-06, -3.4729018807411194e-06, -2.7623027563095093e-06, -2.051703631877899e-06, -1.341104507446289e-06, -6.30505383014679e-07, 8.009374141693115e-08, 7.906928658485413e-07, 1.5012919902801514e-06, 2.2118911147117615e-06, 2.9224902391433716e-06, 3.6330893635749817e-06, 4.343688488006592e-06, 5.054287612438202e-06, 5.764886736869812e-06, 6.475485861301422e-06, 7.186084985733032e-06, 7.896684110164642e-06, 8.607283234596252e-06, 9.317882359027863e-06, 1.0028481483459473e-05, 1.0739080607891083e-05, 1.1449679732322693e-05, 1.2160278856754303e-05, 1.2870877981185913e-05, 1.3581477105617523e-05, 1.4292076230049133e-05, 1.5002675354480743e-05, 1.5713274478912354e-05, 1.6423873603343964e-05, 1.7134472727775574e-05, 1.7845071852207184e-05, 1.8555670976638794e-05, 1.9266270101070404e-05, 1.9976869225502014e-05, 2.0687468349933624e-05, 2.1398067474365234e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 8.0, 9.0, 11.0, 24.0, 24.0, 30.0, 57.0, 106.0, 154.0, 248.0, 464.0, 950.0, 2109.0, 5032.0, 12388.0, 31797.0, 78623.0, 191012.0, 347893.0, 222585.0, 92592.0, 37144.0, 14579.0, 5923.0, 2477.0, 1084.0, 527.0, 258.0, 177.0, 91.0, 62.0, 33.0, 32.0, 16.0, 7.0, 8.0, 10.0, 11.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07501220703125, -0.07263755798339844, -0.07026290893554688, -0.06788825988769531, -0.06551361083984375, -0.06313896179199219, -0.060764312744140625, -0.05838966369628906, -0.0560150146484375, -0.05364036560058594, -0.051265716552734375, -0.04889106750488281, -0.04651641845703125, -0.04414176940917969, -0.041767120361328125, -0.03939247131347656, -0.037017822265625, -0.03464317321777344, -0.032268524169921875, -0.029893875122070312, -0.02751922607421875, -0.025144577026367188, -0.022769927978515625, -0.020395278930664062, -0.0180206298828125, -0.015645980834960938, -0.013271331787109375, -0.010896682739257812, -0.00852203369140625, -0.0061473846435546875, -0.003772735595703125, -0.0013980865478515625, 0.0009765625, 0.0033512115478515625, 0.005725860595703125, 0.008100509643554688, 0.01047515869140625, 0.012849807739257812, 0.015224456787109375, 0.017599105834960938, 0.0199737548828125, 0.022348403930664062, 0.024723052978515625, 0.027097702026367188, 0.02947235107421875, 0.03184700012207031, 0.034221649169921875, 0.03659629821777344, 0.038970947265625, 0.04134559631347656, 0.043720245361328125, 0.04609489440917969, 0.04846954345703125, 0.05084419250488281, 0.053218841552734375, 0.05559349060058594, 0.0579681396484375, 0.06034278869628906, 0.06271743774414062, 0.06509208679199219, 0.06746673583984375, 0.06984138488769531, 0.07221603393554688, 0.07459068298339844, 0.07696533203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 8.0, 3.0, 8.0, 17.0, 12.0, 30.0, 25.0, 35.0, 31.0, 50.0, 66.0, 68.0, 73.0, 75.0, 100.0, 83.0, 64.0, 54.0, 37.0, 38.0, 30.0, 21.0, 16.0, 12.0, 6.0, 7.0, 6.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049652099609375, -0.047335147857666016, -0.04501819610595703, -0.04270124435424805, -0.04038429260253906, -0.03806734085083008, -0.035750389099121094, -0.03343343734741211, -0.031116485595703125, -0.02879953384399414, -0.026482582092285156, -0.024165630340576172, -0.021848678588867188, -0.019531726837158203, -0.01721477508544922, -0.014897823333740234, -0.01258087158203125, -0.010263919830322266, -0.007946968078613281, -0.005630016326904297, -0.0033130645751953125, -0.0009961128234863281, 0.0013208389282226562, 0.0036377906799316406, 0.005954742431640625, 0.00827169418334961, 0.010588645935058594, 0.012905597686767578, 0.015222549438476562, 0.017539501190185547, 0.01985645294189453, 0.022173404693603516, 0.0244903564453125, 0.026807308197021484, 0.02912425994873047, 0.03144121170043945, 0.03375816345214844, 0.03607511520385742, 0.038392066955566406, 0.04070901870727539, 0.043025970458984375, 0.04534292221069336, 0.047659873962402344, 0.04997682571411133, 0.05229377746582031, 0.0546107292175293, 0.05692768096923828, 0.059244632720947266, 0.06156158447265625, 0.06387853622436523, 0.06619548797607422, 0.0685124397277832, 0.07082939147949219, 0.07314634323120117, 0.07546329498291016, 0.07778024673461914, 0.08009719848632812, 0.08241415023803711, 0.0847311019897461, 0.08704805374145508, 0.08936500549316406, 0.09168195724487305, 0.09399890899658203, 0.09631586074829102, 0.0986328125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 20.0, 52.0, 79.0, 106.0, 163.0, 159.0, 149.0, 110.0, 61.0, 52.0, 26.0, 8.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-1.876379132270813, -1.836872935295105, -1.7973666191101074, -1.7578604221343994, -1.7183542251586914, -1.6788479089736938, -1.6393417119979858, -1.5998353958129883, -1.5603291988372803, -1.5208230018615723, -1.4813166856765747, -1.4418104887008667, -1.4023041725158691, -1.3627979755401611, -1.3232917785644531, -1.2837855815887451, -1.2442792654037476, -1.2047730684280396, -1.165266752243042, -1.125760555267334, -1.086254358291626, -1.0467480421066284, -1.0072418451309204, -0.9677355885505676, -0.9282293319702148, -0.8887230753898621, -0.8492168188095093, -0.8097106218338013, -0.7702043652534485, -0.7306981086730957, -0.6911919116973877, -0.6516856551170349, -0.6121794581413269, -0.5726732015609741, -0.5331670045852661, -0.49366074800491333, -0.45415449142456055, -0.41464823484420776, -0.37514200806617737, -0.335635781288147, -0.2961295247077942, -0.2566232681274414, -0.217117041349411, -0.17761079967021942, -0.13810455799102783, -0.09859831631183624, -0.05909207463264465, -0.019585847854614258, 0.019920408725738525, 0.059426650404930115, 0.0989328920841217, 0.1384391337633133, 0.17794537544250488, 0.21745161712169647, 0.25695785880088806, 0.29646408557891846, 0.33597034215927124, 0.375476598739624, 0.4149828255176544, 0.4544890522956848, 0.4939953088760376, 0.5335015654563904, 0.5730078220367432, 0.6125140190124512, 0.652020275592804]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 10.0, 8.0, 6.0, 13.0, 11.0, 13.0, 13.0, 20.0, 16.0, 24.0, 30.0, 28.0, 31.0, 38.0, 34.0, 33.0, 41.0, 31.0, 38.0, 32.0, 56.0, 39.0, 54.0, 29.0, 30.0, 37.0, 29.0, 31.0, 33.0, 27.0, 27.0, 20.0, 12.0, 17.0, 18.0, 11.0, 7.0, 11.0, 8.0, 7.0, 6.0, 3.0, 3.0, 0.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36016714572906494, -0.34839215874671936, -0.3366171717643738, -0.3248422145843506, -0.313067227602005, -0.3012922406196594, -0.28951725363731384, -0.27774226665496826, -0.26596730947494507, -0.2541923224925995, -0.2424173504114151, -0.23064236342906952, -0.21886739134788513, -0.20709240436553955, -0.19531741738319397, -0.18354244530200958, -0.171767458319664, -0.15999247133731842, -0.14821749925613403, -0.13644251227378845, -0.12466754019260406, -0.11289255321025848, -0.1011175736784935, -0.08934259414672852, -0.07756761461496353, -0.06579263508319855, -0.05401765555143356, -0.04224267229437828, -0.030467692762613297, -0.018692713230848312, -0.00691772997379303, 0.004857249557971954, 0.01663222908973694, 0.028407208621501923, 0.04018218815326691, 0.05195717141032219, 0.06373214721679688, 0.07550713419914246, 0.08728211373090744, 0.09905709326267242, 0.11083207279443741, 0.12260705232620239, 0.13438203930854797, 0.14615701138973236, 0.15793199837207794, 0.16970697045326233, 0.1814819574356079, 0.1932569444179535, 0.20503191649913788, 0.21680690348148346, 0.22858187556266785, 0.24035686254501343, 0.252131849527359, 0.2639068067073822, 0.2756817936897278, 0.28745678067207336, 0.29923176765441895, 0.3110067546367645, 0.3227817416191101, 0.3345566987991333, 0.3463316857814789, 0.35810667276382446, 0.36988165974617004, 0.3816566467285156, 0.3934316039085388]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 3.0, 11.0, 10.0, 13.0, 10.0, 19.0, 14.0, 26.0, 48.0, 75.0, 126.0, 209.0, 478.0, 1007.0, 2323.0, 6017.0, 17763.0, 64381.0, 334061.0, 2176434.0, 1336445.0, 192625.0, 42501.0, 12225.0, 4357.0, 1626.0, 674.0, 348.0, 165.0, 88.0, 44.0, 35.0, 25.0, 24.0, 16.0, 12.0, 15.0, 5.0, 11.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.130615234375, -0.12707042694091797, -0.12352561950683594, -0.1199808120727539, -0.11643600463867188, -0.11289119720458984, -0.10934638977050781, -0.10580158233642578, -0.10225677490234375, -0.09871196746826172, -0.09516716003417969, -0.09162235260009766, -0.08807754516601562, -0.0845327377319336, -0.08098793029785156, -0.07744312286376953, -0.0738983154296875, -0.07035350799560547, -0.06680870056152344, -0.0632638931274414, -0.059719085693359375, -0.056174278259277344, -0.05262947082519531, -0.04908466339111328, -0.04553985595703125, -0.04199504852294922, -0.03845024108886719, -0.034905433654785156, -0.031360626220703125, -0.027815818786621094, -0.024271011352539062, -0.02072620391845703, -0.017181396484375, -0.013636589050292969, -0.010091781616210938, -0.006546974182128906, -0.003002166748046875, 0.0005426406860351562, 0.0040874481201171875, 0.007632255554199219, 0.01117706298828125, 0.014721870422363281, 0.018266677856445312, 0.021811485290527344, 0.025356292724609375, 0.028901100158691406, 0.03244590759277344, 0.03599071502685547, 0.0395355224609375, 0.04308032989501953, 0.04662513732910156, 0.050169944763183594, 0.053714752197265625, 0.057259559631347656, 0.06080436706542969, 0.06434917449951172, 0.06789398193359375, 0.07143878936767578, 0.07498359680175781, 0.07852840423583984, 0.08207321166992188, 0.0856180191040039, 0.08916282653808594, 0.09270763397216797, 0.09625244140625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 4.0, 10.0, 12.0, 11.0, 16.0, 10.0, 27.0, 15.0, 23.0, 26.0, 35.0, 39.0, 38.0, 46.0, 53.0, 38.0, 64.0, 51.0, 50.0, 43.0, 52.0, 33.0, 43.0, 37.0, 53.0, 31.0, 21.0, 29.0, 19.0, 12.0, 15.0, 13.0, 8.0, 10.0, 7.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.06805419921875, -0.0662994384765625, -0.064544677734375, -0.0627899169921875, -0.06103515625, -0.0592803955078125, -0.057525634765625, -0.0557708740234375, -0.05401611328125, -0.0522613525390625, -0.050506591796875, -0.0487518310546875, -0.0469970703125, -0.0452423095703125, -0.043487548828125, -0.0417327880859375, -0.03997802734375, -0.0382232666015625, -0.036468505859375, -0.0347137451171875, -0.032958984375, -0.0312042236328125, -0.029449462890625, -0.0276947021484375, -0.02593994140625, -0.0241851806640625, -0.022430419921875, -0.0206756591796875, -0.0189208984375, -0.0171661376953125, -0.015411376953125, -0.0136566162109375, -0.01190185546875, -0.0101470947265625, -0.008392333984375, -0.0066375732421875, -0.0048828125, -0.0031280517578125, -0.001373291015625, 0.0003814697265625, 0.00213623046875, 0.0038909912109375, 0.005645751953125, 0.0074005126953125, 0.0091552734375, 0.0109100341796875, 0.012664794921875, 0.0144195556640625, 0.01617431640625, 0.0179290771484375, 0.019683837890625, 0.0214385986328125, 0.023193359375, 0.0249481201171875, 0.026702880859375, 0.0284576416015625, 0.03021240234375, 0.0319671630859375, 0.033721923828125, 0.0354766845703125, 0.0372314453125, 0.0389862060546875, 0.040740966796875, 0.0424957275390625, 0.04425048828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 8.0, 8.0, 9.0, 17.0, 24.0, 44.0, 60.0, 89.0, 114.0, 162.0, 252.0, 398.0, 623.0, 998.0, 1782.0, 2986.0, 5552.0, 10992.0, 24198.0, 58323.0, 163626.0, 534667.0, 1626158.0, 1211139.0, 356928.0, 114281.0, 42825.0, 18369.0, 8641.0, 4608.0, 2505.0, 1483.0, 887.0, 503.0, 345.0, 212.0, 151.0, 105.0, 52.0, 41.0, 39.0, 28.0, 13.0, 13.0, 7.0, 4.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10205078125, -0.0985116958618164, -0.09497261047363281, -0.09143352508544922, -0.08789443969726562, -0.08435535430908203, -0.08081626892089844, -0.07727718353271484, -0.07373809814453125, -0.07019901275634766, -0.06665992736816406, -0.06312084197998047, -0.059581756591796875, -0.05604267120361328, -0.05250358581542969, -0.048964500427246094, -0.0454254150390625, -0.041886329650878906, -0.03834724426269531, -0.03480815887451172, -0.031269073486328125, -0.02772998809814453, -0.024190902709960938, -0.020651817321777344, -0.01711273193359375, -0.013573646545410156, -0.010034561157226562, -0.006495475769042969, -0.002956390380859375, 0.0005826950073242188, 0.0041217803955078125, 0.007660865783691406, 0.011199951171875, 0.014739036560058594, 0.018278121948242188, 0.02181720733642578, 0.025356292724609375, 0.02889537811279297, 0.03243446350097656, 0.035973548889160156, 0.03951263427734375, 0.043051719665527344, 0.04659080505371094, 0.05012989044189453, 0.053668975830078125, 0.05720806121826172, 0.06074714660644531, 0.0642862319946289, 0.0678253173828125, 0.0713644027709961, 0.07490348815917969, 0.07844257354736328, 0.08198165893554688, 0.08552074432373047, 0.08905982971191406, 0.09259891510009766, 0.09613800048828125, 0.09967708587646484, 0.10321617126464844, 0.10675525665283203, 0.11029434204101562, 0.11383342742919922, 0.11737251281738281, 0.1209115982055664, 0.12445068359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 3.0, 8.0, 10.0, 20.0, 22.0, 36.0, 61.0, 60.0, 112.0, 143.0, 206.0, 335.0, 477.0, 646.0, 598.0, 424.0, 285.0, 188.0, 137.0, 102.0, 69.0, 39.0, 25.0, 14.0, 10.0, 14.0, 7.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1026611328125, -0.09851646423339844, -0.09437179565429688, -0.09022712707519531, -0.08608245849609375, -0.08193778991699219, -0.07779312133789062, -0.07364845275878906, -0.0695037841796875, -0.06535911560058594, -0.061214447021484375, -0.05706977844238281, -0.05292510986328125, -0.04878044128417969, -0.044635772705078125, -0.04049110412597656, -0.036346435546875, -0.03220176696777344, -0.028057098388671875, -0.023912429809570312, -0.01976776123046875, -0.015623092651367188, -0.011478424072265625, -0.0073337554931640625, -0.0031890869140625, 0.0009555816650390625, 0.005100250244140625, 0.009244918823242188, 0.01338958740234375, 0.017534255981445312, 0.021678924560546875, 0.025823593139648438, 0.02996826171875, 0.03411293029785156, 0.038257598876953125, 0.04240226745605469, 0.04654693603515625, 0.05069160461425781, 0.054836273193359375, 0.05898094177246094, 0.0631256103515625, 0.06727027893066406, 0.07141494750976562, 0.07555961608886719, 0.07970428466796875, 0.08384895324707031, 0.08799362182617188, 0.09213829040527344, 0.096282958984375, 0.10042762756347656, 0.10457229614257812, 0.10871696472167969, 0.11286163330078125, 0.11700630187988281, 0.12115097045898438, 0.12529563903808594, 0.1294403076171875, 0.13358497619628906, 0.13772964477539062, 0.1418743133544922, 0.14601898193359375, 0.1501636505126953, 0.15430831909179688, 0.15845298767089844, 0.16259765625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 8.0, 19.0, 18.0, 29.0, 49.0, 51.0, 60.0, 69.0, 73.0, 90.0, 83.0, 96.0, 81.0, 73.0, 56.0, 41.0, 34.0, 25.0, 14.0, 9.0, 8.0, 8.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.8232011795043945, -0.8040823340415955, -0.7849634289741516, -0.7658445835113525, -0.7467256784439087, -0.7276068329811096, -0.7084879875183105, -0.6893690824508667, -0.6702502369880676, -0.6511313915252686, -0.6320124864578247, -0.6128936409950256, -0.5937747359275818, -0.5746558904647827, -0.5555369853973389, -0.5364181399345398, -0.5172992944717407, -0.49818041920661926, -0.4790615439414978, -0.45994269847869873, -0.44082382321357727, -0.4217049479484558, -0.40258607268333435, -0.3834671974182129, -0.36434829235076904, -0.3452294170856476, -0.3261105418205261, -0.30699169635772705, -0.2878728210926056, -0.26875394582748413, -0.24963507056236267, -0.2305162101984024, -0.21139734983444214, -0.19227847456932068, -0.1731596142053604, -0.15404073894023895, -0.1349218785762787, -0.11580300331115723, -0.09668412804603577, -0.0775652676820755, -0.05844639241695404, -0.03932752460241318, -0.020208653062582016, -0.0010897815227508545, 0.01802908629179001, 0.03714795410633087, 0.05626682937145233, 0.0753856897354126, 0.09450456500053406, 0.11362343281507492, 0.13274230062961578, 0.15186117589473724, 0.1709800362586975, 0.19009891152381897, 0.20921778678894043, 0.2283366471529007, 0.24745552241802216, 0.2665743827819824, 0.2856932580471039, 0.30481213331222534, 0.3239310085773468, 0.34304988384246826, 0.36216872930526733, 0.3812876045703888, 0.40040647983551025]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 3.0, 7.0, 10.0, 7.0, 13.0, 14.0, 11.0, 19.0, 13.0, 18.0, 30.0, 28.0, 33.0, 38.0, 29.0, 42.0, 34.0, 41.0, 43.0, 39.0, 57.0, 45.0, 39.0, 37.0, 43.0, 42.0, 39.0, 34.0, 24.0, 27.0, 23.0, 19.0, 17.0, 13.0, 11.0, 17.0, 7.0, 13.0, 5.0, 3.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.3826666474342346, -0.3711805045604706, -0.35969439148902893, -0.3482082486152649, -0.33672213554382324, -0.3252359926700592, -0.31374984979629517, -0.3022637367248535, -0.29077762365341187, -0.2792914807796478, -0.2678053677082062, -0.25631922483444214, -0.2448331117630005, -0.23334696888923645, -0.2218608409166336, -0.21037471294403076, -0.19888857007026672, -0.18740244209766388, -0.17591631412506104, -0.164430171251297, -0.15294405817985535, -0.1414579153060913, -0.12997178733348846, -0.11848565936088562, -0.10699953138828278, -0.09551340341567993, -0.08402727544307709, -0.07254114001989365, -0.0610550120472908, -0.04956888407468796, -0.03808274865150452, -0.026596620678901672, -0.015110492706298828, -0.0036243628710508347, 0.007861766964197159, 0.0193478986620903, 0.030834026634693146, 0.04232015460729599, 0.05380629003047943, 0.06529241800308228, 0.07677854597568512, 0.08826467394828796, 0.09975080192089081, 0.11123693734407425, 0.1227230653166771, 0.13420918583869934, 0.14569532871246338, 0.15718145668506622, 0.16866758465766907, 0.1801537126302719, 0.19163984060287476, 0.2031259834766388, 0.21461209654808044, 0.22609823942184448, 0.23758436739444733, 0.24907049536705017, 0.2605566382408142, 0.27204278111457825, 0.2835288941860199, 0.29501503705978394, 0.3065011501312256, 0.3179872930049896, 0.32947343587875366, 0.3409595489501953, 0.35244566202163696]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 9.0, 10.0, 20.0, 42.0, 42.0, 53.0, 85.0, 137.0, 181.0, 282.0, 472.0, 707.0, 1053.0, 1579.0, 2543.0, 4000.0, 6296.0, 9928.0, 16204.0, 26603.0, 44987.0, 82914.0, 161702.0, 246216.0, 198117.0, 105128.0, 55431.0, 31856.0, 19438.0, 11940.0, 7411.0, 4654.0, 2951.0, 1936.0, 1221.0, 830.0, 520.0, 345.0, 232.0, 171.0, 97.0, 76.0, 46.0, 27.0, 16.0, 12.0, 14.0, 7.0, 6.0, 1.0, 4.0, 1.0], "bins": [-0.09912109375, -0.0963430404663086, -0.09356498718261719, -0.09078693389892578, -0.08800888061523438, -0.08523082733154297, -0.08245277404785156, -0.07967472076416016, -0.07689666748046875, -0.07411861419677734, -0.07134056091308594, -0.06856250762939453, -0.06578445434570312, -0.06300640106201172, -0.06022834777832031, -0.057450294494628906, -0.0546722412109375, -0.051894187927246094, -0.04911613464355469, -0.04633808135986328, -0.043560028076171875, -0.04078197479248047, -0.03800392150878906, -0.035225868225097656, -0.03244781494140625, -0.029669761657714844, -0.026891708374023438, -0.02411365509033203, -0.021335601806640625, -0.01855754852294922, -0.015779495239257812, -0.013001441955566406, -0.010223388671875, -0.007445335388183594, -0.0046672821044921875, -0.0018892288208007812, 0.000888824462890625, 0.0036668777465820312, 0.0064449310302734375, 0.009222984313964844, 0.01200103759765625, 0.014779090881347656, 0.017557144165039062, 0.02033519744873047, 0.023113250732421875, 0.02589130401611328, 0.028669357299804688, 0.031447410583496094, 0.0342254638671875, 0.037003517150878906, 0.03978157043457031, 0.04255962371826172, 0.045337677001953125, 0.04811573028564453, 0.05089378356933594, 0.053671836853027344, 0.05644989013671875, 0.059227943420410156, 0.06200599670410156, 0.06478404998779297, 0.06756210327148438, 0.07034015655517578, 0.07311820983886719, 0.0758962631225586, 0.07867431640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 8.0, 8.0, 5.0, 13.0, 16.0, 19.0, 18.0, 27.0, 27.0, 25.0, 33.0, 40.0, 39.0, 32.0, 53.0, 51.0, 44.0, 57.0, 50.0, 52.0, 38.0, 45.0, 40.0, 34.0, 43.0, 27.0, 31.0, 22.0, 17.0, 19.0, 13.0, 9.0, 13.0, 13.0, 6.0, 5.0, 2.0, 0.0, 6.0, 1.0, 0.0, 0.0, 3.0, 3.0], "bins": [-0.07257080078125, -0.07063865661621094, -0.06870651245117188, -0.06677436828613281, -0.06484222412109375, -0.06291007995605469, -0.060977935791015625, -0.05904579162597656, -0.0571136474609375, -0.05518150329589844, -0.053249359130859375, -0.05131721496582031, -0.04938507080078125, -0.04745292663574219, -0.045520782470703125, -0.04358863830566406, -0.041656494140625, -0.03972434997558594, -0.037792205810546875, -0.03586006164550781, -0.03392791748046875, -0.03199577331542969, -0.030063629150390625, -0.028131484985351562, -0.0261993408203125, -0.024267196655273438, -0.022335052490234375, -0.020402908325195312, -0.01847076416015625, -0.016538619995117188, -0.014606475830078125, -0.012674331665039062, -0.0107421875, -0.008810043334960938, -0.006877899169921875, -0.0049457550048828125, -0.00301361083984375, -0.0010814666748046875, 0.000850677490234375, 0.0027828216552734375, 0.0047149658203125, 0.0066471099853515625, 0.008579254150390625, 0.010511398315429688, 0.01244354248046875, 0.014375686645507812, 0.016307830810546875, 0.018239974975585938, 0.020172119140625, 0.022104263305664062, 0.024036407470703125, 0.025968551635742188, 0.02790069580078125, 0.029832839965820312, 0.031764984130859375, 0.03369712829589844, 0.0356292724609375, 0.03756141662597656, 0.039493560791015625, 0.04142570495605469, 0.04335784912109375, 0.04528999328613281, 0.047222137451171875, 0.04915428161621094, 0.05108642578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 9.0, 9.0, 14.0, 11.0, 14.0, 14.0, 32.0, 41.0, 57.0, 92.0, 149.0, 347.0, 693.0, 1447.0, 3552.0, 8818.0, 22861.0, 64423.0, 260619.0, 496327.0, 125211.0, 39030.0, 14531.0, 5806.0, 2362.0, 973.0, 470.0, 228.0, 142.0, 71.0, 55.0, 37.0, 26.0, 14.0, 20.0, 9.0, 6.0, 10.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.22900390625, -0.222320556640625, -0.21563720703125, -0.208953857421875, -0.2022705078125, -0.195587158203125, -0.18890380859375, -0.182220458984375, -0.175537109375, -0.168853759765625, -0.16217041015625, -0.155487060546875, -0.1488037109375, -0.142120361328125, -0.13543701171875, -0.128753662109375, -0.1220703125, -0.115386962890625, -0.10870361328125, -0.102020263671875, -0.0953369140625, -0.088653564453125, -0.08197021484375, -0.075286865234375, -0.068603515625, -0.061920166015625, -0.05523681640625, -0.048553466796875, -0.0418701171875, -0.035186767578125, -0.02850341796875, -0.021820068359375, -0.01513671875, -0.008453369140625, -0.00177001953125, 0.004913330078125, 0.0115966796875, 0.018280029296875, 0.02496337890625, 0.031646728515625, 0.038330078125, 0.045013427734375, 0.05169677734375, 0.058380126953125, 0.0650634765625, 0.071746826171875, 0.07843017578125, 0.085113525390625, 0.091796875, 0.098480224609375, 0.10516357421875, 0.111846923828125, 0.1185302734375, 0.125213623046875, 0.13189697265625, 0.138580322265625, 0.145263671875, 0.151947021484375, 0.15863037109375, 0.165313720703125, 0.1719970703125, 0.178680419921875, 0.18536376953125, 0.192047119140625, 0.19873046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 4.0, 6.0, 10.0, 11.0, 5.0, 8.0, 10.0, 26.0, 29.0, 45.0, 30.0, 45.0, 48.0, 54.0, 43.0, 43.0, 64.0, 61.0, 60.0, 65.0, 67.0, 43.0, 43.0, 24.0, 25.0, 32.0, 15.0, 16.0, 12.0, 15.0, 7.0, 4.0, 7.0, 6.0, 5.0, 4.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2078857421875, -0.20049095153808594, -0.19309616088867188, -0.1857013702392578, -0.17830657958984375, -0.1709117889404297, -0.16351699829101562, -0.15612220764160156, -0.1487274169921875, -0.14133262634277344, -0.13393783569335938, -0.1265430450439453, -0.11914825439453125, -0.11175346374511719, -0.10435867309570312, -0.09696388244628906, -0.089569091796875, -0.08217430114746094, -0.07477951049804688, -0.06738471984863281, -0.05998992919921875, -0.05259513854980469, -0.045200347900390625, -0.03780555725097656, -0.0304107666015625, -0.023015975952148438, -0.015621185302734375, -0.008226394653320312, -0.00083160400390625, 0.0065631866455078125, 0.013957977294921875, 0.021352767944335938, 0.02874755859375, 0.03614234924316406, 0.043537139892578125, 0.05093193054199219, 0.05832672119140625, 0.06572151184082031, 0.07311630249023438, 0.08051109313964844, 0.0879058837890625, 0.09530067443847656, 0.10269546508789062, 0.11009025573730469, 0.11748504638671875, 0.12487983703613281, 0.13227462768554688, 0.13966941833496094, 0.147064208984375, 0.15445899963378906, 0.16185379028320312, 0.1692485809326172, 0.17664337158203125, 0.1840381622314453, 0.19143295288085938, 0.19882774353027344, 0.2062225341796875, 0.21361732482910156, 0.22101211547851562, 0.2284069061279297, 0.23580169677734375, 0.2431964874267578, 0.2505912780761719, 0.25798606872558594, 0.265380859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 8.0, 13.0, 21.0, 30.0, 32.0, 43.0, 70.0, 105.0, 153.0, 224.0, 354.0, 532.0, 871.0, 1310.0, 2021.0, 3167.0, 4944.0, 8166.0, 13470.0, 22677.0, 39856.0, 75505.0, 167063.0, 306790.0, 201776.0, 88587.0, 45367.0, 25479.0, 15181.0, 9123.0, 5709.0, 3553.0, 2165.0, 1477.0, 944.0, 620.0, 391.0, 239.0, 173.0, 100.0, 78.0, 53.0, 37.0, 27.0, 12.0, 13.0, 11.0, 10.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.07012939453125, -0.0681600570678711, -0.06619071960449219, -0.06422138214111328, -0.062252044677734375, -0.06028270721435547, -0.05831336975097656, -0.056344032287597656, -0.05437469482421875, -0.052405357360839844, -0.05043601989746094, -0.04846668243408203, -0.046497344970703125, -0.04452800750732422, -0.04255867004394531, -0.040589332580566406, -0.0386199951171875, -0.036650657653808594, -0.03468132019042969, -0.03271198272705078, -0.030742645263671875, -0.02877330780029297, -0.026803970336914062, -0.024834632873535156, -0.02286529541015625, -0.020895957946777344, -0.018926620483398438, -0.01695728302001953, -0.014987945556640625, -0.013018608093261719, -0.011049270629882812, -0.009079933166503906, -0.007110595703125, -0.005141258239746094, -0.0031719207763671875, -0.0012025833129882812, 0.000766754150390625, 0.0027360916137695312, 0.0047054290771484375, 0.006674766540527344, 0.00864410400390625, 0.010613441467285156, 0.012582778930664062, 0.014552116394042969, 0.016521453857421875, 0.01849079132080078, 0.020460128784179688, 0.022429466247558594, 0.0243988037109375, 0.026368141174316406, 0.028337478637695312, 0.03030681610107422, 0.032276153564453125, 0.03424549102783203, 0.03621482849121094, 0.038184165954589844, 0.04015350341796875, 0.042122840881347656, 0.04409217834472656, 0.04606151580810547, 0.048030853271484375, 0.05000019073486328, 0.05196952819824219, 0.053938865661621094, 0.055908203125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 14.0, 8.0, 19.0, 24.0, 32.0, 32.0, 48.0, 51.0, 53.0, 85.0, 78.0, 88.0, 88.0, 57.0, 52.0, 56.0, 41.0, 29.0, 20.0, 22.0, 12.0, 12.0, 6.0, 7.0, 8.0, 1.0, 3.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.4437904357910156e-05, -2.37245112657547e-05, -2.3011118173599243e-05, -2.2297725081443787e-05, -2.158433198928833e-05, -2.0870938897132874e-05, -2.0157545804977417e-05, -1.944415271282196e-05, -1.8730759620666504e-05, -1.8017366528511047e-05, -1.730397343635559e-05, -1.6590580344200134e-05, -1.5877187252044678e-05, -1.5163794159889221e-05, -1.4450401067733765e-05, -1.3737007975578308e-05, -1.3023614883422852e-05, -1.2310221791267395e-05, -1.1596828699111938e-05, -1.0883435606956482e-05, -1.0170042514801025e-05, -9.456649422645569e-06, -8.743256330490112e-06, -8.029863238334656e-06, -7.316470146179199e-06, -6.603077054023743e-06, -5.889683961868286e-06, -5.17629086971283e-06, -4.462897777557373e-06, -3.7495046854019165e-06, -3.03611159324646e-06, -2.3227185010910034e-06, -1.6093254089355469e-06, -8.959323167800903e-07, -1.825392246246338e-07, 5.308538675308228e-07, 1.2442469596862793e-06, 1.957640051841736e-06, 2.6710331439971924e-06, 3.384426236152649e-06, 4.0978193283081055e-06, 4.811212420463562e-06, 5.5246055126190186e-06, 6.237998604774475e-06, 6.951391696929932e-06, 7.664784789085388e-06, 8.378177881240845e-06, 9.091570973396301e-06, 9.804964065551758e-06, 1.0518357157707214e-05, 1.1231750249862671e-05, 1.1945143342018127e-05, 1.2658536434173584e-05, 1.337192952632904e-05, 1.4085322618484497e-05, 1.4798715710639954e-05, 1.551210880279541e-05, 1.6225501894950867e-05, 1.6938894987106323e-05, 1.765228807926178e-05, 1.8365681171417236e-05, 1.9079074263572693e-05, 1.979246735572815e-05, 2.0505860447883606e-05, 2.1219253540039062e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 5.0, 6.0, 10.0, 15.0, 24.0, 25.0, 29.0, 75.0, 116.0, 193.0, 347.0, 633.0, 1274.0, 2703.0, 5910.0, 13300.0, 30946.0, 76158.0, 223986.0, 425502.0, 163162.0, 59762.0, 24659.0, 10529.0, 4700.0, 2199.0, 1052.0, 561.0, 251.0, 159.0, 87.0, 53.0, 43.0, 22.0, 11.0, 9.0, 8.0, 8.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08685302734375, -0.08399295806884766, -0.08113288879394531, -0.07827281951904297, -0.07541275024414062, -0.07255268096923828, -0.06969261169433594, -0.0668325424194336, -0.06397247314453125, -0.061112403869628906, -0.05825233459472656, -0.05539226531982422, -0.052532196044921875, -0.04967212677001953, -0.04681205749511719, -0.043951988220214844, -0.0410919189453125, -0.038231849670410156, -0.03537178039550781, -0.03251171112060547, -0.029651641845703125, -0.02679157257080078, -0.023931503295898438, -0.021071434020996094, -0.01821136474609375, -0.015351295471191406, -0.012491226196289062, -0.009631156921386719, -0.006771087646484375, -0.003911018371582031, -0.0010509490966796875, 0.0018091201782226562, 0.004669189453125, 0.007529258728027344, 0.010389328002929688, 0.013249397277832031, 0.016109466552734375, 0.01896953582763672, 0.021829605102539062, 0.024689674377441406, 0.02754974365234375, 0.030409812927246094, 0.03326988220214844, 0.03612995147705078, 0.038990020751953125, 0.04185009002685547, 0.04471015930175781, 0.047570228576660156, 0.0504302978515625, 0.053290367126464844, 0.05615043640136719, 0.05901050567626953, 0.061870574951171875, 0.06473064422607422, 0.06759071350097656, 0.0704507827758789, 0.07331085205078125, 0.0761709213256836, 0.07903099060058594, 0.08189105987548828, 0.08475112915039062, 0.08761119842529297, 0.09047126770019531, 0.09333133697509766, 0.09619140625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 8.0, 4.0, 7.0, 6.0, 11.0, 15.0, 13.0, 19.0, 19.0, 29.0, 36.0, 49.0, 83.0, 99.0, 120.0, 109.0, 85.0, 67.0, 38.0, 40.0, 25.0, 20.0, 14.0, 17.0, 9.0, 13.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.060333251953125, -0.057569026947021484, -0.05480480194091797, -0.05204057693481445, -0.04927635192871094, -0.04651212692260742, -0.043747901916503906, -0.04098367691040039, -0.038219451904296875, -0.03545522689819336, -0.032691001892089844, -0.029926776885986328, -0.027162551879882812, -0.024398326873779297, -0.02163410186767578, -0.018869876861572266, -0.01610565185546875, -0.013341426849365234, -0.010577201843261719, -0.007812976837158203, -0.0050487518310546875, -0.002284526824951172, 0.00047969818115234375, 0.0032439231872558594, 0.006008148193359375, 0.00877237319946289, 0.011536598205566406, 0.014300823211669922, 0.017065048217773438, 0.019829273223876953, 0.02259349822998047, 0.025357723236083984, 0.0281219482421875, 0.030886173248291016, 0.03365039825439453, 0.03641462326049805, 0.03917884826660156, 0.04194307327270508, 0.044707298278808594, 0.04747152328491211, 0.050235748291015625, 0.05299997329711914, 0.055764198303222656, 0.05852842330932617, 0.06129264831542969, 0.0640568733215332, 0.06682109832763672, 0.06958532333374023, 0.07234954833984375, 0.07511377334594727, 0.07787799835205078, 0.0806422233581543, 0.08340644836425781, 0.08617067337036133, 0.08893489837646484, 0.09169912338256836, 0.09446334838867188, 0.09722757339477539, 0.0999917984008789, 0.10275602340698242, 0.10552024841308594, 0.10828447341918945, 0.11104869842529297, 0.11381292343139648, 0.1165771484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 11.0, 48.0, 203.0, 387.0, 256.0, 89.0, 19.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7232165336608887, -1.6262346506118774, -1.5292527675628662, -1.432270884513855, -1.3352890014648438, -1.2383071184158325, -1.1413252353668213, -1.0443432331085205, -0.947361409664154, -0.8503795266151428, -0.7533976435661316, -0.6564157009124756, -0.5594338178634644, -0.4624519646167755, -0.3654700517654419, -0.26848816871643066, -0.17150628566741943, -0.0745243951678276, 0.02245749533176422, 0.11943939328193665, 0.21642127633094788, 0.3134031593799591, 0.4103850722312927, 0.507366955280304, 0.6043488383293152, 0.7013307213783264, 0.7983126044273376, 0.8952945470809937, 0.9922764301300049, 1.0892583131790161, 1.1862401962280273, 1.2832220792770386, 1.3802039623260498, 1.477185845375061, 1.5741677284240723, 1.6711496114730835, 1.7681314945220947, 1.865113377571106, 1.9620952606201172, 2.059077262878418, 2.1560590267181396, 2.2530410289764404, 2.350022792816162, 2.447004795074463, 2.5439865589141846, 2.6409685611724854, 2.737950325012207, 2.834932327270508, 2.9319143295288086, 3.0288963317871094, 3.125878095626831, 3.222860097885132, 3.3198418617248535, 3.4168238639831543, 3.513805627822876, 3.6107876300811768, 3.7077693939208984, 3.804751396179199, 3.901733160018921, 3.9987151622772217, 4.095696926116943, 4.192678928375244, 4.289660930633545, 4.3866424560546875, 4.483624458312988]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 5.0, 3.0, 5.0, 15.0, 17.0, 4.0, 13.0, 16.0, 15.0, 13.0, 17.0, 20.0, 28.0, 20.0, 36.0, 28.0, 39.0, 31.0, 40.0, 32.0, 43.0, 25.0, 44.0, 30.0, 39.0, 38.0, 27.0, 38.0, 50.0, 26.0, 25.0, 21.0, 34.0, 29.0, 19.0, 19.0, 22.0, 10.0, 11.0, 13.0, 5.0, 9.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.5647876262664795, -0.5483518242835999, -0.5319159626960754, -0.5154801607131958, -0.4990442991256714, -0.48260849714279175, -0.4661726653575897, -0.4497368335723877, -0.43330100178718567, -0.41686517000198364, -0.4004293382167816, -0.3839935064315796, -0.36755770444869995, -0.35112184286117554, -0.3346860408782959, -0.31825020909309387, -0.30181437730789185, -0.2853785455226898, -0.2689427137374878, -0.25250688195228577, -0.23607106506824493, -0.2196352332830429, -0.20319941639900208, -0.18676358461380005, -0.17032775282859802, -0.153891921043396, -0.13745608925819397, -0.12102027237415314, -0.10458444058895111, -0.08814860880374908, -0.07171278446912766, -0.055276960134506226, -0.038841068744659424, -0.022405240684747696, -0.005969412624835968, 0.01046641543507576, 0.026902243494987488, 0.043338075280189514, 0.059773899614810944, 0.07620972394943237, 0.0926455557346344, 0.10908138751983643, 0.12551721930503845, 0.14195303618907928, 0.1583888679742813, 0.17482469975948334, 0.19126051664352417, 0.2076963484287262, 0.22413218021392822, 0.24056801199913025, 0.2570038437843323, 0.2734396755695343, 0.28987550735473633, 0.30631130933761597, 0.322747141122818, 0.33918297290802, 0.35561880469322205, 0.3720546364784241, 0.3884904682636261, 0.4049263000488281, 0.42136210203170776, 0.4377979636192322, 0.4542337656021118, 0.47066959738731384, 0.48710542917251587]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 2.0, 10.0, 11.0, 11.0, 17.0, 28.0, 31.0, 48.0, 68.0, 88.0, 137.0, 240.0, 344.0, 552.0, 981.0, 1705.0, 3319.0, 6527.0, 14564.0, 36182.0, 108271.0, 429539.0, 2203014.0, 1061639.0, 219963.0, 63884.0, 23217.0, 9868.0, 4614.0, 2241.0, 1220.0, 708.0, 442.0, 254.0, 172.0, 116.0, 74.0, 57.0, 23.0, 34.0, 20.0, 14.0, 7.0, 10.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.11846923828125, -0.1151571273803711, -0.11184501647949219, -0.10853290557861328, -0.10522079467773438, -0.10190868377685547, -0.09859657287597656, -0.09528446197509766, -0.09197235107421875, -0.08866024017333984, -0.08534812927246094, -0.08203601837158203, -0.07872390747070312, -0.07541179656982422, -0.07209968566894531, -0.0687875747680664, -0.0654754638671875, -0.062163352966308594, -0.05885124206542969, -0.05553913116455078, -0.052227020263671875, -0.04891490936279297, -0.04560279846191406, -0.042290687561035156, -0.03897857666015625, -0.035666465759277344, -0.03235435485839844, -0.02904224395751953, -0.025730133056640625, -0.02241802215576172, -0.019105911254882812, -0.015793800354003906, -0.012481689453125, -0.009169578552246094, -0.0058574676513671875, -0.0025453567504882812, 0.000766754150390625, 0.004078865051269531, 0.0073909759521484375, 0.010703086853027344, 0.01401519775390625, 0.017327308654785156, 0.020639419555664062, 0.02395153045654297, 0.027263641357421875, 0.03057575225830078, 0.03388786315917969, 0.037199974060058594, 0.0405120849609375, 0.043824195861816406, 0.04713630676269531, 0.05044841766357422, 0.053760528564453125, 0.05707263946533203, 0.06038475036621094, 0.06369686126708984, 0.06700897216796875, 0.07032108306884766, 0.07363319396972656, 0.07694530487060547, 0.08025741577148438, 0.08356952667236328, 0.08688163757324219, 0.0901937484741211, 0.093505859375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 8.0, 3.0, 11.0, 6.0, 12.0, 7.0, 10.0, 14.0, 22.0, 16.0, 19.0, 28.0, 26.0, 46.0, 34.0, 46.0, 37.0, 50.0, 44.0, 51.0, 60.0, 37.0, 48.0, 40.0, 40.0, 43.0, 33.0, 27.0, 31.0, 26.0, 20.0, 23.0, 21.0, 19.0, 10.0, 12.0, 5.0, 3.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.0762939453125, -0.07423210144042969, -0.07217025756835938, -0.07010841369628906, -0.06804656982421875, -0.06598472595214844, -0.06392288208007812, -0.06186103820800781, -0.0597991943359375, -0.05773735046386719, -0.055675506591796875, -0.05361366271972656, -0.05155181884765625, -0.04948997497558594, -0.047428131103515625, -0.04536628723144531, -0.043304443359375, -0.04124259948730469, -0.039180755615234375, -0.03711891174316406, -0.03505706787109375, -0.03299522399902344, -0.030933380126953125, -0.028871536254882812, -0.0268096923828125, -0.024747848510742188, -0.022686004638671875, -0.020624160766601562, -0.01856231689453125, -0.016500473022460938, -0.014438629150390625, -0.012376785278320312, -0.01031494140625, -0.008253097534179688, -0.006191253662109375, -0.0041294097900390625, -0.00206756591796875, -5.7220458984375e-06, 0.002056121826171875, 0.0041179656982421875, 0.0061798095703125, 0.008241653442382812, 0.010303497314453125, 0.012365341186523438, 0.01442718505859375, 0.016489028930664062, 0.018550872802734375, 0.020612716674804688, 0.022674560546875, 0.024736404418945312, 0.026798248291015625, 0.028860092163085938, 0.03092193603515625, 0.03298377990722656, 0.035045623779296875, 0.03710746765136719, 0.0391693115234375, 0.04123115539550781, 0.043292999267578125, 0.04535484313964844, 0.04741668701171875, 0.04947853088378906, 0.051540374755859375, 0.05360221862792969, 0.0556640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 5.0, 8.0, 5.0, 13.0, 21.0, 23.0, 35.0, 66.0, 82.0, 118.0, 173.0, 325.0, 575.0, 1046.0, 2078.0, 4545.0, 11217.0, 33856.0, 128198.0, 722717.0, 2600350.0, 538612.0, 103484.0, 28825.0, 9686.0, 3985.0, 1882.0, 964.0, 515.0, 309.0, 193.0, 110.0, 65.0, 47.0, 41.0, 37.0, 17.0, 12.0, 9.0, 5.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2301025390625, -0.2227802276611328, -0.21545791625976562, -0.20813560485839844, -0.20081329345703125, -0.19349098205566406, -0.18616867065429688, -0.1788463592529297, -0.1715240478515625, -0.1642017364501953, -0.15687942504882812, -0.14955711364746094, -0.14223480224609375, -0.13491249084472656, -0.12759017944335938, -0.12026786804199219, -0.112945556640625, -0.10562324523925781, -0.09830093383789062, -0.09097862243652344, -0.08365631103515625, -0.07633399963378906, -0.06901168823242188, -0.06168937683105469, -0.0543670654296875, -0.04704475402832031, -0.039722442626953125, -0.03240013122558594, -0.02507781982421875, -0.017755508422851562, -0.010433197021484375, -0.0031108856201171875, 0.00421142578125, 0.011533737182617188, 0.018856048583984375, 0.026178359985351562, 0.03350067138671875, 0.04082298278808594, 0.048145294189453125, 0.05546760559082031, 0.0627899169921875, 0.07011222839355469, 0.07743453979492188, 0.08475685119628906, 0.09207916259765625, 0.09940147399902344, 0.10672378540039062, 0.11404609680175781, 0.121368408203125, 0.1286907196044922, 0.13601303100585938, 0.14333534240722656, 0.15065765380859375, 0.15797996520996094, 0.16530227661132812, 0.1726245880126953, 0.1799468994140625, 0.1872692108154297, 0.19459152221679688, 0.20191383361816406, 0.20923614501953125, 0.21655845642089844, 0.22388076782226562, 0.2312030792236328, 0.238525390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 12.0, 9.0, 21.0, 20.0, 45.0, 63.0, 79.0, 145.0, 269.0, 490.0, 792.0, 884.0, 510.0, 275.0, 152.0, 105.0, 71.0, 38.0, 31.0, 16.0, 16.0, 7.0, 5.0, 2.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.125, -0.11875152587890625, -0.1125030517578125, -0.10625457763671875, -0.100006103515625, -0.09375762939453125, -0.0875091552734375, -0.08126068115234375, -0.07501220703125, -0.06876373291015625, -0.0625152587890625, -0.05626678466796875, -0.050018310546875, -0.04376983642578125, -0.0375213623046875, -0.03127288818359375, -0.0250244140625, -0.01877593994140625, -0.0125274658203125, -0.00627899169921875, -3.0517578125e-05, 0.00621795654296875, 0.0124664306640625, 0.01871490478515625, 0.02496337890625, 0.03121185302734375, 0.0374603271484375, 0.04370880126953125, 0.049957275390625, 0.05620574951171875, 0.0624542236328125, 0.06870269775390625, 0.074951171875, 0.08119964599609375, 0.0874481201171875, 0.09369659423828125, 0.099945068359375, 0.10619354248046875, 0.1124420166015625, 0.11869049072265625, 0.12493896484375, 0.13118743896484375, 0.1374359130859375, 0.14368438720703125, 0.149932861328125, 0.15618133544921875, 0.1624298095703125, 0.16867828369140625, 0.1749267578125, 0.18117523193359375, 0.1874237060546875, 0.19367218017578125, 0.199920654296875, 0.20616912841796875, 0.2124176025390625, 0.21866607666015625, 0.22491455078125, 0.23116302490234375, 0.2374114990234375, 0.24365997314453125, 0.249908447265625, 0.25615692138671875, 0.2624053955078125, 0.26865386962890625, 0.27490234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 8.0, 7.0, 17.0, 37.0, 52.0, 86.0, 113.0, 119.0, 135.0, 130.0, 95.0, 89.0, 41.0, 33.0, 18.0, 15.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7478920221328735, -0.7160083651542664, -0.6841246485710144, -0.6522409915924072, -0.6203572750091553, -0.5884736180305481, -0.5565899610519409, -0.524706244468689, -0.4928225576877594, -0.46093887090682983, -0.42905518412590027, -0.3971714973449707, -0.3652878403663635, -0.3334041237831116, -0.3015204668045044, -0.26963678002357483, -0.23775309324264526, -0.2058694064617157, -0.17398571968078613, -0.14210204780101776, -0.1102183610200882, -0.07833467423915863, -0.04645100235939026, -0.014567315578460693, 0.017316371202468872, 0.04920005425810814, 0.0810837373137474, 0.11296741664409637, 0.14485110342502594, 0.1767347902059555, 0.20861846208572388, 0.24050214886665344, 0.272385835647583, 0.3042695224285126, 0.33615320920944214, 0.3680368661880493, 0.39992058277130127, 0.43180423974990845, 0.463687926530838, 0.4955716133117676, 0.5274553298950195, 0.5593389868736267, 0.5912227034568787, 0.6231063604354858, 0.6549900770187378, 0.686873733997345, 0.7187573909759521, 0.7506411075592041, 0.7825247645378113, 0.8144084215164185, 0.8462921380996704, 0.8781757950782776, 0.9100595116615295, 0.9419431686401367, 0.9738268852233887, 1.0057106018066406, 1.037594199180603, 1.069477915763855, 1.1013615131378174, 1.1332452297210693, 1.1651289463043213, 1.1970126628875732, 1.2288962602615356, 1.2607799768447876, 1.2926636934280396]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 6.0, 0.0, 5.0, 6.0, 9.0, 11.0, 11.0, 10.0, 19.0, 18.0, 18.0, 32.0, 17.0, 17.0, 36.0, 22.0, 41.0, 36.0, 32.0, 40.0, 33.0, 36.0, 30.0, 46.0, 34.0, 41.0, 33.0, 42.0, 34.0, 36.0, 28.0, 22.0, 41.0, 15.0, 28.0, 24.0, 14.0, 13.0, 7.0, 16.0, 10.0, 8.0, 6.0, 10.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.38295233249664307, -0.37084120512008667, -0.3587300479412079, -0.3466189205646515, -0.3345077931880951, -0.3223966658115387, -0.3102855086326599, -0.2981743812561035, -0.2860632538795471, -0.2739521265029907, -0.26184096932411194, -0.24972984194755554, -0.23761871457099915, -0.22550757229328156, -0.21339643001556396, -0.20128530263900757, -0.18917416036128998, -0.1770630180835724, -0.164951890707016, -0.1528407484292984, -0.140729621052742, -0.12861847877502441, -0.11650734394788742, -0.10439620912075043, -0.09228507429361343, -0.08017393946647644, -0.06806280463933945, -0.055951666086912155, -0.04384053125977516, -0.03172939643263817, -0.019618257880210876, -0.007507123053073883, 0.00460401177406311, 0.016715146601200104, 0.028826283290982246, 0.04093741998076439, 0.05304855480790138, 0.06515969336032867, 0.07727082818746567, 0.08938196301460266, 0.10149309784173965, 0.11360423266887665, 0.12571537494659424, 0.13782650232315063, 0.14993764460086823, 0.16204877197742462, 0.1741599142551422, 0.1862710416316986, 0.1983821839094162, 0.2104933261871338, 0.22260445356369019, 0.23471559584140778, 0.24682672321796417, 0.25893786549568176, 0.27104899287223816, 0.28316015005111694, 0.29527127742767334, 0.30738240480422974, 0.3194935619831085, 0.3316046893596649, 0.3437158167362213, 0.3558269441127777, 0.3679381012916565, 0.3800492286682129, 0.3921603560447693]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 21.0, 20.0, 26.0, 51.0, 76.0, 111.0, 161.0, 232.0, 358.0, 576.0, 826.0, 1185.0, 1934.0, 2961.0, 4413.0, 6689.0, 10454.0, 16067.0, 25925.0, 44720.0, 87275.0, 189924.0, 282622.0, 178359.0, 81994.0, 42251.0, 24828.0, 15469.0, 10092.0, 6472.0, 4187.0, 2834.0, 1900.0, 1151.0, 817.0, 511.0, 326.0, 246.0, 158.0, 114.0, 76.0, 37.0, 42.0, 25.0, 8.0, 10.0, 12.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.098876953125, -0.09592151641845703, -0.09296607971191406, -0.0900106430053711, -0.08705520629882812, -0.08409976959228516, -0.08114433288574219, -0.07818889617919922, -0.07523345947265625, -0.07227802276611328, -0.06932258605957031, -0.06636714935302734, -0.06341171264648438, -0.060456275939941406, -0.05750083923339844, -0.05454540252685547, -0.0515899658203125, -0.04863452911376953, -0.04567909240722656, -0.042723655700683594, -0.039768218994140625, -0.036812782287597656, -0.03385734558105469, -0.03090190887451172, -0.02794647216796875, -0.02499103546142578, -0.022035598754882812, -0.019080162048339844, -0.016124725341796875, -0.013169288635253906, -0.010213851928710938, -0.007258415222167969, -0.004302978515625, -0.0013475418090820312, 0.0016078948974609375, 0.004563331604003906, 0.007518768310546875, 0.010474205017089844, 0.013429641723632812, 0.01638507843017578, 0.01934051513671875, 0.02229595184326172, 0.025251388549804688, 0.028206825256347656, 0.031162261962890625, 0.034117698669433594, 0.03707313537597656, 0.04002857208251953, 0.0429840087890625, 0.04593944549560547, 0.04889488220214844, 0.051850318908691406, 0.054805755615234375, 0.057761192321777344, 0.06071662902832031, 0.06367206573486328, 0.06662750244140625, 0.06958293914794922, 0.07253837585449219, 0.07549381256103516, 0.07844924926757812, 0.0814046859741211, 0.08436012268066406, 0.08731555938720703, 0.09027099609375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 8.0, 4.0, 7.0, 10.0, 10.0, 7.0, 13.0, 17.0, 26.0, 25.0, 23.0, 18.0, 32.0, 31.0, 29.0, 33.0, 33.0, 37.0, 45.0, 50.0, 38.0, 34.0, 53.0, 49.0, 37.0, 36.0, 26.0, 38.0, 29.0, 25.0, 23.0, 26.0, 34.0, 13.0, 12.0, 17.0, 13.0, 9.0, 7.0, 8.0, 5.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.07305908203125, -0.07106924057006836, -0.06907939910888672, -0.06708955764770508, -0.06509971618652344, -0.0631098747253418, -0.061120033264160156, -0.059130191802978516, -0.057140350341796875, -0.055150508880615234, -0.053160667419433594, -0.05117082595825195, -0.04918098449707031, -0.04719114303588867, -0.04520130157470703, -0.04321146011352539, -0.04122161865234375, -0.03923177719116211, -0.03724193572998047, -0.03525209426879883, -0.03326225280761719, -0.03127241134643555, -0.029282569885253906, -0.027292728424072266, -0.025302886962890625, -0.023313045501708984, -0.021323204040527344, -0.019333362579345703, -0.017343521118164062, -0.015353679656982422, -0.013363838195800781, -0.01137399673461914, -0.0093841552734375, -0.007394313812255859, -0.005404472351074219, -0.003414630889892578, -0.0014247894287109375, 0.0005650520324707031, 0.0025548934936523438, 0.004544734954833984, 0.006534576416015625, 0.008524417877197266, 0.010514259338378906, 0.012504100799560547, 0.014493942260742188, 0.016483783721923828, 0.01847362518310547, 0.02046346664428711, 0.02245330810546875, 0.02444314956665039, 0.02643299102783203, 0.028422832489013672, 0.030412673950195312, 0.03240251541137695, 0.034392356872558594, 0.036382198333740234, 0.038372039794921875, 0.040361881256103516, 0.042351722717285156, 0.0443415641784668, 0.04633140563964844, 0.04832124710083008, 0.05031108856201172, 0.05230093002319336, 0.054290771484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 10.0, 8.0, 3.0, 7.0, 6.0, 13.0, 17.0, 28.0, 45.0, 45.0, 63.0, 99.0, 183.0, 289.0, 592.0, 1203.0, 2802.0, 6994.0, 18253.0, 52629.0, 259388.0, 556116.0, 101375.0, 29639.0, 10971.0, 4238.0, 1739.0, 785.0, 376.0, 223.0, 130.0, 84.0, 53.0, 36.0, 28.0, 26.0, 12.0, 13.0, 7.0, 7.0, 7.0, 6.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.281982421875, -0.2742023468017578, -0.2664222717285156, -0.25864219665527344, -0.25086212158203125, -0.24308204650878906, -0.23530197143554688, -0.2275218963623047, -0.2197418212890625, -0.2119617462158203, -0.20418167114257812, -0.19640159606933594, -0.18862152099609375, -0.18084144592285156, -0.17306137084960938, -0.1652812957763672, -0.157501220703125, -0.1497211456298828, -0.14194107055664062, -0.13416099548339844, -0.12638092041015625, -0.11860084533691406, -0.11082077026367188, -0.10304069519042969, -0.0952606201171875, -0.08748054504394531, -0.07970046997070312, -0.07192039489746094, -0.06414031982421875, -0.05636024475097656, -0.048580169677734375, -0.04080009460449219, -0.03302001953125, -0.025239944458007812, -0.017459869384765625, -0.009679794311523438, -0.00189971923828125, 0.0058803558349609375, 0.013660430908203125, 0.021440505981445312, 0.0292205810546875, 0.03700065612792969, 0.044780731201171875, 0.05256080627441406, 0.06034088134765625, 0.06812095642089844, 0.07590103149414062, 0.08368110656738281, 0.091461181640625, 0.09924125671386719, 0.10702133178710938, 0.11480140686035156, 0.12258148193359375, 0.13036155700683594, 0.13814163208007812, 0.1459217071533203, 0.1537017822265625, 0.1614818572998047, 0.16926193237304688, 0.17704200744628906, 0.18482208251953125, 0.19260215759277344, 0.20038223266601562, 0.2081623077392578, 0.2159423828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 10.0, 9.0, 20.0, 21.0, 24.0, 28.0, 33.0, 36.0, 45.0, 53.0, 66.0, 58.0, 59.0, 65.0, 53.0, 64.0, 44.0, 48.0, 50.0, 41.0, 40.0, 30.0, 26.0, 18.0, 11.0, 11.0, 4.0, 8.0, 3.0, 6.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2685546875, -0.25923919677734375, -0.2499237060546875, -0.24060821533203125, -0.231292724609375, -0.22197723388671875, -0.2126617431640625, -0.20334625244140625, -0.19403076171875, -0.18471527099609375, -0.1753997802734375, -0.16608428955078125, -0.156768798828125, -0.14745330810546875, -0.1381378173828125, -0.12882232666015625, -0.1195068359375, -0.11019134521484375, -0.1008758544921875, -0.09156036376953125, -0.082244873046875, -0.07292938232421875, -0.0636138916015625, -0.05429840087890625, -0.04498291015625, -0.03566741943359375, -0.0263519287109375, -0.01703643798828125, -0.007720947265625, 0.00159454345703125, 0.0109100341796875, 0.02022552490234375, 0.029541015625, 0.03885650634765625, 0.0481719970703125, 0.05748748779296875, 0.066802978515625, 0.07611846923828125, 0.0854339599609375, 0.09474945068359375, 0.10406494140625, 0.11338043212890625, 0.1226959228515625, 0.13201141357421875, 0.141326904296875, 0.15064239501953125, 0.1599578857421875, 0.16927337646484375, 0.1785888671875, 0.18790435791015625, 0.1972198486328125, 0.20653533935546875, 0.215850830078125, 0.22516632080078125, 0.2344818115234375, 0.24379730224609375, 0.25311279296875, 0.26242828369140625, 0.2717437744140625, 0.28105926513671875, 0.290374755859375, 0.29969024658203125, 0.3090057373046875, 0.31832122802734375, 0.32763671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 1.0, 9.0, 3.0, 14.0, 23.0, 19.0, 30.0, 31.0, 53.0, 76.0, 97.0, 137.0, 178.0, 300.0, 337.0, 541.0, 804.0, 1159.0, 2007.0, 3658.0, 7836.0, 18212.0, 48207.0, 245363.0, 569405.0, 96074.0, 29087.0, 12062.0, 5483.0, 2670.0, 1549.0, 888.0, 609.0, 448.0, 352.0, 237.0, 150.0, 126.0, 87.0, 72.0, 44.0, 37.0, 22.0, 16.0, 14.0, 14.0, 3.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.130126953125, -0.12609291076660156, -0.12205886840820312, -0.11802482604980469, -0.11399078369140625, -0.10995674133300781, -0.10592269897460938, -0.10188865661621094, -0.0978546142578125, -0.09382057189941406, -0.08978652954101562, -0.08575248718261719, -0.08171844482421875, -0.07768440246582031, -0.07365036010742188, -0.06961631774902344, -0.065582275390625, -0.06154823303222656, -0.057514190673828125, -0.05348014831542969, -0.04944610595703125, -0.04541206359863281, -0.041378021240234375, -0.03734397888183594, -0.0333099365234375, -0.029275894165039062, -0.025241851806640625, -0.021207809448242188, -0.01717376708984375, -0.013139724731445312, -0.009105682373046875, -0.0050716400146484375, -0.00103759765625, 0.0029964447021484375, 0.007030487060546875, 0.011064529418945312, 0.01509857177734375, 0.019132614135742188, 0.023166656494140625, 0.027200698852539062, 0.0312347412109375, 0.03526878356933594, 0.039302825927734375, 0.04333686828613281, 0.04737091064453125, 0.05140495300292969, 0.055438995361328125, 0.05947303771972656, 0.063507080078125, 0.06754112243652344, 0.07157516479492188, 0.07560920715332031, 0.07964324951171875, 0.08367729187011719, 0.08771133422851562, 0.09174537658691406, 0.0957794189453125, 0.09981346130371094, 0.10384750366210938, 0.10788154602050781, 0.11191558837890625, 0.11594963073730469, 0.11998367309570312, 0.12401771545410156, 0.1280517578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 6.0, 2.0, 3.0, 12.0, 13.0, 15.0, 31.0, 31.0, 33.0, 43.0, 67.0, 79.0, 83.0, 98.0, 91.0, 71.0, 80.0, 62.0, 41.0, 24.0, 14.0, 17.0, 7.0, 14.0, 10.0, 5.0, 4.0, 3.0, 1.0, 5.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5570392608642578e-05, -2.4809502065181732e-05, -2.4048611521720886e-05, -2.328772097826004e-05, -2.2526830434799194e-05, -2.176593989133835e-05, -2.1005049347877502e-05, -2.0244158804416656e-05, -1.948326826095581e-05, -1.8722377717494965e-05, -1.796148717403412e-05, -1.7200596630573273e-05, -1.6439706087112427e-05, -1.567881554365158e-05, -1.4917925000190735e-05, -1.4157034456729889e-05, -1.3396143913269043e-05, -1.2635253369808197e-05, -1.1874362826347351e-05, -1.1113472282886505e-05, -1.035258173942566e-05, -9.591691195964813e-06, -8.830800652503967e-06, -8.069910109043121e-06, -7.309019565582275e-06, -6.5481290221214294e-06, -5.7872384786605835e-06, -5.0263479351997375e-06, -4.265457391738892e-06, -3.5045668482780457e-06, -2.7436763048171997e-06, -1.9827857613563538e-06, -1.2218952178955078e-06, -4.6100467443466187e-07, 2.998858690261841e-07, 1.06077641248703e-06, 1.821666955947876e-06, 2.582557499408722e-06, 3.343448042869568e-06, 4.104338586330414e-06, 4.86522912979126e-06, 5.626119673252106e-06, 6.387010216712952e-06, 7.147900760173798e-06, 7.908791303634644e-06, 8.66968184709549e-06, 9.430572390556335e-06, 1.0191462934017181e-05, 1.0952353477478027e-05, 1.1713244020938873e-05, 1.247413456439972e-05, 1.3235025107860565e-05, 1.3995915651321411e-05, 1.4756806194782257e-05, 1.5517696738243103e-05, 1.627858728170395e-05, 1.7039477825164795e-05, 1.780036836862564e-05, 1.8561258912086487e-05, 1.9322149455547333e-05, 2.008303999900818e-05, 2.0843930542469025e-05, 2.160482108592987e-05, 2.2365711629390717e-05, 2.3126602172851562e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 3.0, 9.0, 8.0, 7.0, 8.0, 12.0, 13.0, 26.0, 35.0, 46.0, 81.0, 203.0, 379.0, 836.0, 2051.0, 4915.0, 13506.0, 39555.0, 189694.0, 639068.0, 111589.0, 29452.0, 10104.0, 3917.0, 1556.0, 677.0, 349.0, 191.0, 95.0, 37.0, 26.0, 27.0, 17.0, 13.0, 15.0, 9.0, 5.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1514892578125, -0.1470813751220703, -0.14267349243164062, -0.13826560974121094, -0.13385772705078125, -0.12944984436035156, -0.12504196166992188, -0.12063407897949219, -0.1162261962890625, -0.11181831359863281, -0.10741043090820312, -0.10300254821777344, -0.09859466552734375, -0.09418678283691406, -0.08977890014648438, -0.08537101745605469, -0.080963134765625, -0.07655525207519531, -0.07214736938476562, -0.06773948669433594, -0.06333160400390625, -0.05892372131347656, -0.054515838623046875, -0.05010795593261719, -0.0457000732421875, -0.04129219055175781, -0.036884307861328125, -0.03247642517089844, -0.02806854248046875, -0.023660659790039062, -0.019252777099609375, -0.014844894409179688, -0.01043701171875, -0.0060291290283203125, -0.001621246337890625, 0.0027866363525390625, 0.00719451904296875, 0.011602401733398438, 0.016010284423828125, 0.020418167114257812, 0.0248260498046875, 0.029233932495117188, 0.033641815185546875, 0.03804969787597656, 0.04245758056640625, 0.04686546325683594, 0.051273345947265625, 0.05568122863769531, 0.060089111328125, 0.06449699401855469, 0.06890487670898438, 0.07331275939941406, 0.07772064208984375, 0.08212852478027344, 0.08653640747070312, 0.09094429016113281, 0.0953521728515625, 0.09976005554199219, 0.10416793823242188, 0.10857582092285156, 0.11298370361328125, 0.11739158630371094, 0.12179946899414062, 0.1262073516845703, 0.130615234375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 7.0, 7.0, 17.0, 19.0, 29.0, 66.0, 149.0, 241.0, 208.0, 101.0, 42.0, 24.0, 16.0, 20.0, 7.0, 4.0, 4.0, 7.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1865234375, -0.18144798278808594, -0.17637252807617188, -0.1712970733642578, -0.16622161865234375, -0.1611461639404297, -0.15607070922851562, -0.15099525451660156, -0.1459197998046875, -0.14084434509277344, -0.13576889038085938, -0.1306934356689453, -0.12561798095703125, -0.12054252624511719, -0.11546707153320312, -0.11039161682128906, -0.105316162109375, -0.10024070739746094, -0.09516525268554688, -0.09008979797363281, -0.08501434326171875, -0.07993888854980469, -0.07486343383789062, -0.06978797912597656, -0.0647125244140625, -0.05963706970214844, -0.054561614990234375, -0.04948616027832031, -0.04441070556640625, -0.03933525085449219, -0.034259796142578125, -0.029184341430664062, -0.02410888671875, -0.019033432006835938, -0.013957977294921875, -0.008882522583007812, -0.00380706787109375, 0.0012683868408203125, 0.006343841552734375, 0.011419296264648438, 0.0164947509765625, 0.021570205688476562, 0.026645660400390625, 0.03172111511230469, 0.03679656982421875, 0.04187202453613281, 0.046947479248046875, 0.05202293395996094, 0.057098388671875, 0.06217384338378906, 0.06724929809570312, 0.07232475280761719, 0.07740020751953125, 0.08247566223144531, 0.08755111694335938, 0.09262657165527344, 0.0977020263671875, 0.10277748107910156, 0.10785293579101562, 0.11292839050292969, 0.11800384521484375, 0.12307929992675781, 0.12815475463867188, 0.13323020935058594, 0.1383056640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 9.0, 9.0, 34.0, 110.0, 210.0, 279.0, 166.0, 120.0, 44.0, 24.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7653948664665222, -0.6990396976470947, -0.6326845288276672, -0.5663293600082397, -0.49997416138648987, -0.4336189925670624, -0.3672637939453125, -0.300908625125885, -0.23455345630645752, -0.16819828748703003, -0.10184310376644135, -0.03548792004585266, 0.03086724877357483, 0.09722241759300232, 0.1635776162147522, 0.2299327850341797, 0.2962879538536072, 0.36264312267303467, 0.42899829149246216, 0.49535349011421204, 0.5617086887359619, 0.6280637979507446, 0.6944190263748169, 0.7607741951942444, 0.8271293640136719, 0.8934845328330994, 0.9598397016525269, 1.0261949300765991, 1.0925500392913818, 1.158905267715454, 1.2252604961395264, 1.291615605354309, 1.3579707145690918, 1.424325942993164, 1.4906810522079468, 1.557036280632019, 1.6233913898468018, 1.689746618270874, 1.7561018466949463, 1.822456955909729, 1.8888120651245117, 1.955167293548584, 2.0215225219726562, 2.0878775119781494, 2.1542327404022217, 2.220587968826294, 2.286943197250366, 2.3532981872558594, 2.4196534156799316, 2.486008644104004, 2.552363872528076, 2.6187188625335693, 2.6850740909576416, 2.751429319381714, 2.817784547805786, 2.8841395378112793, 2.9504950046539307, 3.016850233078003, 3.083205461502075, 3.1495604515075684, 3.2159156799316406, 3.282270908355713, 3.348626136779785, 3.4149813652038574, 3.4813363552093506]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 9.0, 7.0, 19.0, 16.0, 20.0, 34.0, 17.0, 26.0, 43.0, 29.0, 29.0, 43.0, 38.0, 52.0, 43.0, 42.0, 52.0, 47.0, 33.0, 40.0, 41.0, 57.0, 30.0, 40.0, 23.0, 24.0, 21.0, 20.0, 20.0, 11.0, 9.0, 14.0, 9.0, 0.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.651595950126648, -0.6304101943969727, -0.6092244386672974, -0.5880386829376221, -0.5668529272079468, -0.5456671714782715, -0.5244814157485962, -0.5032956600189209, -0.4821099042892456, -0.4609241485595703, -0.439738392829895, -0.4185526371002197, -0.39736688137054443, -0.37618112564086914, -0.35499536991119385, -0.33380961418151855, -0.31262385845184326, -0.29143810272216797, -0.2702523469924927, -0.24906659126281738, -0.2278808355331421, -0.2066950798034668, -0.1855093240737915, -0.1643235683441162, -0.14313781261444092, -0.12195205688476562, -0.10076630115509033, -0.07958054542541504, -0.058394789695739746, -0.03720903396606445, -0.01602327823638916, 0.005162477493286133, 0.0263482928276062, 0.047534048557281494, 0.06871980428695679, 0.08990556001663208, 0.11109131574630737, 0.13227707147598267, 0.15346282720565796, 0.17464858293533325, 0.19583433866500854, 0.21702009439468384, 0.23820585012435913, 0.2593916058540344, 0.2805773615837097, 0.301763117313385, 0.3229488730430603, 0.3441346287727356, 0.3653203845024109, 0.3865061402320862, 0.4076918959617615, 0.42887765169143677, 0.45006340742111206, 0.47124916315078735, 0.49243491888046265, 0.5136206746101379, 0.5348064303398132, 0.5559921860694885, 0.5771779417991638, 0.5983636975288391, 0.6195494532585144, 0.6407352089881897, 0.661920964717865, 0.6831067204475403, 0.7042924761772156]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 18.0, 23.0, 19.0, 26.0, 33.0, 51.0, 110.0, 102.0, 213.0, 325.0, 563.0, 1023.0, 1834.0, 3624.0, 7094.0, 15904.0, 39515.0, 119465.0, 489449.0, 2546712.0, 723668.0, 158927.0, 50165.0, 18970.0, 8148.0, 3959.0, 1943.0, 1013.0, 546.0, 318.0, 193.0, 91.0, 74.0, 49.0, 24.0, 28.0, 11.0, 14.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.14697265625, -0.14272594451904297, -0.13847923278808594, -0.1342325210571289, -0.12998580932617188, -0.12573909759521484, -0.12149238586425781, -0.11724567413330078, -0.11299896240234375, -0.10875225067138672, -0.10450553894042969, -0.10025882720947266, -0.09601211547851562, -0.0917654037475586, -0.08751869201660156, -0.08327198028564453, -0.0790252685546875, -0.07477855682373047, -0.07053184509277344, -0.0662851333618164, -0.062038421630859375, -0.057791709899902344, -0.05354499816894531, -0.04929828643798828, -0.04505157470703125, -0.04080486297607422, -0.03655815124511719, -0.032311439514160156, -0.028064727783203125, -0.023818016052246094, -0.019571304321289062, -0.015324592590332031, -0.011077880859375, -0.006831169128417969, -0.0025844573974609375, 0.0016622543334960938, 0.005908966064453125, 0.010155677795410156, 0.014402389526367188, 0.01864910125732422, 0.02289581298828125, 0.02714252471923828, 0.03138923645019531, 0.035635948181152344, 0.039882659912109375, 0.044129371643066406, 0.04837608337402344, 0.05262279510498047, 0.0568695068359375, 0.06111621856689453, 0.06536293029785156, 0.0696096420288086, 0.07385635375976562, 0.07810306549072266, 0.08234977722167969, 0.08659648895263672, 0.09084320068359375, 0.09508991241455078, 0.09933662414550781, 0.10358333587646484, 0.10783004760742188, 0.1120767593383789, 0.11632347106933594, 0.12057018280029297, 0.12481689453125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 7.0, 9.0, 7.0, 11.0, 10.0, 13.0, 15.0, 13.0, 18.0, 24.0, 29.0, 28.0, 33.0, 30.0, 29.0, 31.0, 37.0, 42.0, 30.0, 44.0, 39.0, 45.0, 41.0, 29.0, 46.0, 46.0, 40.0, 34.0, 31.0, 26.0, 21.0, 15.0, 21.0, 14.0, 20.0, 10.0, 15.0, 6.0, 5.0, 6.0, 5.0, 3.0, 4.0, 7.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.07684326171875, -0.0746612548828125, -0.072479248046875, -0.0702972412109375, -0.068115234375, -0.0659332275390625, -0.063751220703125, -0.0615692138671875, -0.05938720703125, -0.0572052001953125, -0.055023193359375, -0.0528411865234375, -0.0506591796875, -0.0484771728515625, -0.046295166015625, -0.0441131591796875, -0.04193115234375, -0.0397491455078125, -0.037567138671875, -0.0353851318359375, -0.033203125, -0.0310211181640625, -0.028839111328125, -0.0266571044921875, -0.02447509765625, -0.0222930908203125, -0.020111083984375, -0.0179290771484375, -0.0157470703125, -0.0135650634765625, -0.011383056640625, -0.0092010498046875, -0.00701904296875, -0.0048370361328125, -0.002655029296875, -0.0004730224609375, 0.001708984375, 0.0038909912109375, 0.006072998046875, 0.0082550048828125, 0.01043701171875, 0.0126190185546875, 0.014801025390625, 0.0169830322265625, 0.0191650390625, 0.0213470458984375, 0.023529052734375, 0.0257110595703125, 0.02789306640625, 0.0300750732421875, 0.032257080078125, 0.0344390869140625, 0.03662109375, 0.0388031005859375, 0.040985107421875, 0.0431671142578125, 0.04534912109375, 0.0475311279296875, 0.049713134765625, 0.0518951416015625, 0.0540771484375, 0.0562591552734375, 0.058441162109375, 0.0606231689453125, 0.06280517578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 1.0, 4.0, 3.0, 9.0, 7.0, 13.0, 14.0, 22.0, 29.0, 41.0, 69.0, 84.0, 103.0, 128.0, 237.0, 302.0, 494.0, 856.0, 1665.0, 3319.0, 8112.0, 21181.0, 68673.0, 299678.0, 2198609.0, 1310268.0, 201395.0, 50005.0, 16259.0, 6216.0, 2842.0, 1408.0, 796.0, 446.0, 272.0, 213.0, 119.0, 97.0, 84.0, 66.0, 35.0, 32.0, 21.0, 13.0, 11.0, 10.0, 6.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.2900390625, -0.2817230224609375, -0.273406982421875, -0.2650909423828125, -0.25677490234375, -0.2484588623046875, -0.240142822265625, -0.2318267822265625, -0.2235107421875, -0.2151947021484375, -0.206878662109375, -0.1985626220703125, -0.19024658203125, -0.1819305419921875, -0.173614501953125, -0.1652984619140625, -0.156982421875, -0.1486663818359375, -0.140350341796875, -0.1320343017578125, -0.12371826171875, -0.1154022216796875, -0.107086181640625, -0.0987701416015625, -0.0904541015625, -0.0821380615234375, -0.073822021484375, -0.0655059814453125, -0.05718994140625, -0.0488739013671875, -0.040557861328125, -0.0322418212890625, -0.02392578125, -0.0156097412109375, -0.007293701171875, 0.0010223388671875, 0.00933837890625, 0.0176544189453125, 0.025970458984375, 0.0342864990234375, 0.0426025390625, 0.0509185791015625, 0.059234619140625, 0.0675506591796875, 0.07586669921875, 0.0841827392578125, 0.092498779296875, 0.1008148193359375, 0.109130859375, 0.1174468994140625, 0.125762939453125, 0.1340789794921875, 0.14239501953125, 0.1507110595703125, 0.159027099609375, 0.1673431396484375, 0.1756591796875, 0.1839752197265625, 0.192291259765625, 0.2006072998046875, 0.20892333984375, 0.2172393798828125, 0.225555419921875, 0.2338714599609375, 0.2421875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 9.0, 12.0, 14.0, 29.0, 66.0, 86.0, 176.0, 339.0, 704.0, 1248.0, 685.0, 327.0, 156.0, 94.0, 50.0, 30.0, 13.0, 12.0, 10.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2081298828125, -0.19922828674316406, -0.19032669067382812, -0.1814250946044922, -0.17252349853515625, -0.1636219024658203, -0.15472030639648438, -0.14581871032714844, -0.1369171142578125, -0.12801551818847656, -0.11911392211914062, -0.11021232604980469, -0.10131072998046875, -0.09240913391113281, -0.08350753784179688, -0.07460594177246094, -0.065704345703125, -0.05680274963378906, -0.047901153564453125, -0.03899955749511719, -0.03009796142578125, -0.021196365356445312, -0.012294769287109375, -0.0033931732177734375, 0.0055084228515625, 0.014410018920898438, 0.023311614990234375, 0.03221321105957031, 0.04111480712890625, 0.05001640319824219, 0.058917999267578125, 0.06781959533691406, 0.07672119140625, 0.08562278747558594, 0.09452438354492188, 0.10342597961425781, 0.11232757568359375, 0.12122917175292969, 0.13013076782226562, 0.13903236389160156, 0.1479339599609375, 0.15683555603027344, 0.16573715209960938, 0.1746387481689453, 0.18354034423828125, 0.1924419403076172, 0.20134353637695312, 0.21024513244628906, 0.219146728515625, 0.22804832458496094, 0.23694992065429688, 0.2458515167236328, 0.25475311279296875, 0.2636547088623047, 0.2725563049316406, 0.28145790100097656, 0.2903594970703125, 0.29926109313964844, 0.3081626892089844, 0.3170642852783203, 0.32596588134765625, 0.3348674774169922, 0.3437690734863281, 0.35267066955566406, 0.361572265625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 3.0, 20.0, 16.0, 29.0, 32.0, 47.0, 66.0, 62.0, 82.0, 105.0, 107.0, 86.0, 88.0, 74.0, 52.0, 37.0, 38.0, 16.0, 17.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9097804427146912, -0.8842428922653198, -0.8587054014205933, -0.8331679105758667, -0.8076303601264954, -0.782092809677124, -0.7565553188323975, -0.7310178279876709, -0.7054802775382996, -0.6799427270889282, -0.6544052362442017, -0.6288677453994751, -0.6033301949501038, -0.5777926445007324, -0.5522551536560059, -0.5267176628112793, -0.501180112361908, -0.475642591714859, -0.45010507106781006, -0.4245675504207611, -0.39903002977371216, -0.3734925091266632, -0.34795498847961426, -0.3224174678325653, -0.29687994718551636, -0.2713424265384674, -0.24580490589141846, -0.2202673852443695, -0.19472986459732056, -0.1691923439502716, -0.14365482330322266, -0.1181173026561737, -0.09257972240447998, -0.06704220175743103, -0.04150468111038208, -0.01596716046333313, 0.00957036018371582, 0.03510788083076477, 0.06064540147781372, 0.08618292212486267, 0.11172044277191162, 0.13725796341896057, 0.16279548406600952, 0.18833300471305847, 0.21387052536010742, 0.23940804600715637, 0.2649455666542053, 0.2904830873012543, 0.3160206079483032, 0.3415581285953522, 0.3670956492424011, 0.3926331698894501, 0.418170690536499, 0.443708211183548, 0.4692457318305969, 0.4947832524776459, 0.5203207731246948, 0.5458582639694214, 0.5713958144187927, 0.5969333648681641, 0.6224708557128906, 0.6480083465576172, 0.6735458970069885, 0.6990834474563599, 0.7246209383010864]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 10.0, 9.0, 5.0, 9.0, 11.0, 11.0, 12.0, 21.0, 17.0, 31.0, 24.0, 32.0, 25.0, 36.0, 49.0, 43.0, 36.0, 34.0, 39.0, 55.0, 41.0, 52.0, 39.0, 30.0, 47.0, 43.0, 34.0, 25.0, 22.0, 31.0, 19.0, 20.0, 15.0, 15.0, 18.0, 10.0, 7.0, 6.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5010194182395935, -0.48457351326942444, -0.46812760829925537, -0.4516817033290863, -0.43523579835891724, -0.41878989338874817, -0.4023439884185791, -0.3858981132507324, -0.36945217847824097, -0.3530062735080719, -0.33656036853790283, -0.32011446356773376, -0.3036685585975647, -0.28722265362739563, -0.27077674865722656, -0.2543308734893799, -0.23788496851921082, -0.22143906354904175, -0.20499315857887268, -0.1885472536087036, -0.17210134863853455, -0.15565544366836548, -0.1392095535993576, -0.12276364862918854, -0.10631774365901947, -0.0898718386888504, -0.07342593371868134, -0.056980036199092865, -0.0405341312289238, -0.02408822625875473, -0.00764232873916626, 0.008803576231002808, 0.025249481201171875, 0.04169538617134094, 0.05814128741621971, 0.07458718866109848, 0.09103309363126755, 0.10747899860143661, 0.12392489612102509, 0.14037080109119415, 0.15681670606136322, 0.1732626110315323, 0.18970851600170135, 0.20615440607070923, 0.2226003110408783, 0.23904621601104736, 0.25549212098121643, 0.2719380259513855, 0.28838393092155457, 0.30482983589172363, 0.3212757408618927, 0.33772164583206177, 0.35416755080223083, 0.3706134557723999, 0.3870593309402466, 0.40350526571273804, 0.4199511408805847, 0.4363970458507538, 0.45284295082092285, 0.4692888557910919, 0.485734760761261, 0.5021806359291077, 0.5186265707015991, 0.5350724458694458, 0.5515183806419373]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 19.0, 28.0, 32.0, 66.0, 95.0, 163.0, 227.0, 377.0, 628.0, 967.0, 1521.0, 2501.0, 3980.0, 6238.0, 10748.0, 17928.0, 30591.0, 53213.0, 95177.0, 186100.0, 269349.0, 164743.0, 85864.0, 48248.0, 27996.0, 16326.0, 9818.0, 5924.0, 3693.0, 2240.0, 1335.0, 906.0, 552.0, 343.0, 230.0, 130.0, 78.0, 71.0, 32.0, 20.0, 18.0, 10.0, 9.0, 7.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.10833740234375, -0.10518932342529297, -0.10204124450683594, -0.0988931655883789, -0.09574508666992188, -0.09259700775146484, -0.08944892883300781, -0.08630084991455078, -0.08315277099609375, -0.08000469207763672, -0.07685661315917969, -0.07370853424072266, -0.07056045532226562, -0.0674123764038086, -0.06426429748535156, -0.06111621856689453, -0.0579681396484375, -0.05482006072998047, -0.05167198181152344, -0.048523902893066406, -0.045375823974609375, -0.042227745056152344, -0.03907966613769531, -0.03593158721923828, -0.03278350830078125, -0.02963542938232422, -0.026487350463867188, -0.023339271545410156, -0.020191192626953125, -0.017043113708496094, -0.013895034790039062, -0.010746955871582031, -0.007598876953125, -0.004450798034667969, -0.0013027191162109375, 0.0018453598022460938, 0.004993438720703125, 0.008141517639160156, 0.011289596557617188, 0.014437675476074219, 0.01758575439453125, 0.02073383331298828, 0.023881912231445312, 0.027029991149902344, 0.030178070068359375, 0.033326148986816406, 0.03647422790527344, 0.03962230682373047, 0.0427703857421875, 0.04591846466064453, 0.04906654357910156, 0.052214622497558594, 0.055362701416015625, 0.058510780334472656, 0.06165885925292969, 0.06480693817138672, 0.06795501708984375, 0.07110309600830078, 0.07425117492675781, 0.07739925384521484, 0.08054733276367188, 0.0836954116821289, 0.08684349060058594, 0.08999156951904297, 0.0931396484375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 5.0, 3.0, 3.0, 8.0, 9.0, 8.0, 10.0, 17.0, 27.0, 17.0, 22.0, 30.0, 26.0, 37.0, 26.0, 39.0, 45.0, 43.0, 42.0, 60.0, 45.0, 50.0, 42.0, 36.0, 42.0, 35.0, 34.0, 39.0, 31.0, 17.0, 24.0, 24.0, 19.0, 14.0, 14.0, 9.0, 9.0, 9.0, 9.0, 5.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0858154296875, -0.0832672119140625, -0.080718994140625, -0.0781707763671875, -0.07562255859375, -0.0730743408203125, -0.070526123046875, -0.0679779052734375, -0.0654296875, -0.0628814697265625, -0.060333251953125, -0.0577850341796875, -0.05523681640625, -0.0526885986328125, -0.050140380859375, -0.0475921630859375, -0.0450439453125, -0.0424957275390625, -0.039947509765625, -0.0373992919921875, -0.03485107421875, -0.0323028564453125, -0.029754638671875, -0.0272064208984375, -0.024658203125, -0.0221099853515625, -0.019561767578125, -0.0170135498046875, -0.01446533203125, -0.0119171142578125, -0.009368896484375, -0.0068206787109375, -0.0042724609375, -0.0017242431640625, 0.000823974609375, 0.0033721923828125, 0.00592041015625, 0.0084686279296875, 0.011016845703125, 0.0135650634765625, 0.01611328125, 0.0186614990234375, 0.021209716796875, 0.0237579345703125, 0.02630615234375, 0.0288543701171875, 0.031402587890625, 0.0339508056640625, 0.0364990234375, 0.0390472412109375, 0.041595458984375, 0.0441436767578125, 0.04669189453125, 0.0492401123046875, 0.051788330078125, 0.0543365478515625, 0.056884765625, 0.0594329833984375, 0.061981201171875, 0.0645294189453125, 0.06707763671875, 0.0696258544921875, 0.072174072265625, 0.0747222900390625, 0.0772705078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 11.0, 9.0, 14.0, 17.0, 21.0, 26.0, 48.0, 72.0, 144.0, 373.0, 1423.0, 6707.0, 40979.0, 512635.0, 441867.0, 36132.0, 6072.0, 1299.0, 336.0, 124.0, 80.0, 54.0, 20.0, 25.0, 19.0, 11.0, 9.0, 6.0, 6.0, 4.0, 1.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31103515625, -0.29749298095703125, -0.2839508056640625, -0.27040863037109375, -0.256866455078125, -0.24332427978515625, -0.2297821044921875, -0.21623992919921875, -0.20269775390625, -0.18915557861328125, -0.1756134033203125, -0.16207122802734375, -0.148529052734375, -0.13498687744140625, -0.1214447021484375, -0.10790252685546875, -0.0943603515625, -0.08081817626953125, -0.0672760009765625, -0.05373382568359375, -0.040191650390625, -0.02664947509765625, -0.0131072998046875, 0.00043487548828125, 0.01397705078125, 0.02751922607421875, 0.0410614013671875, 0.05460357666015625, 0.068145751953125, 0.08168792724609375, 0.0952301025390625, 0.10877227783203125, 0.122314453125, 0.13585662841796875, 0.1493988037109375, 0.16294097900390625, 0.176483154296875, 0.19002532958984375, 0.2035675048828125, 0.21710968017578125, 0.23065185546875, 0.24419403076171875, 0.2577362060546875, 0.27127838134765625, 0.284820556640625, 0.29836273193359375, 0.3119049072265625, 0.32544708251953125, 0.3389892578125, 0.35253143310546875, 0.3660736083984375, 0.37961578369140625, 0.393157958984375, 0.40670013427734375, 0.4202423095703125, 0.43378448486328125, 0.44732666015625, 0.46086883544921875, 0.4744110107421875, 0.48795318603515625, 0.501495361328125, 0.5150375366210938, 0.5285797119140625, 0.5421218872070312, 0.5556640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 6.0, 3.0, 6.0, 10.0, 13.0, 10.0, 16.0, 21.0, 16.0, 26.0, 31.0, 35.0, 43.0, 53.0, 46.0, 47.0, 48.0, 59.0, 62.0, 63.0, 57.0, 48.0, 58.0, 40.0, 39.0, 30.0, 18.0, 17.0, 23.0, 16.0, 6.0, 12.0, 8.0, 9.0, 1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38818359375, -0.37804412841796875, -0.3679046630859375, -0.35776519775390625, -0.347625732421875, -0.33748626708984375, -0.3273468017578125, -0.31720733642578125, -0.30706787109375, -0.29692840576171875, -0.2867889404296875, -0.27664947509765625, -0.266510009765625, -0.25637054443359375, -0.2462310791015625, -0.23609161376953125, -0.2259521484375, -0.21581268310546875, -0.2056732177734375, -0.19553375244140625, -0.185394287109375, -0.17525482177734375, -0.1651153564453125, -0.15497589111328125, -0.14483642578125, -0.13469696044921875, -0.1245574951171875, -0.11441802978515625, -0.104278564453125, -0.09413909912109375, -0.0839996337890625, -0.07386016845703125, -0.063720703125, -0.05358123779296875, -0.0434417724609375, -0.03330230712890625, -0.023162841796875, -0.01302337646484375, -0.0028839111328125, 0.00725555419921875, 0.01739501953125, 0.02753448486328125, 0.0376739501953125, 0.04781341552734375, 0.057952880859375, 0.06809234619140625, 0.0782318115234375, 0.08837127685546875, 0.0985107421875, 0.10865020751953125, 0.1187896728515625, 0.12892913818359375, 0.139068603515625, 0.14920806884765625, 0.1593475341796875, 0.16948699951171875, 0.17962646484375, 0.18976593017578125, 0.1999053955078125, 0.21004486083984375, 0.220184326171875, 0.23032379150390625, 0.2404632568359375, 0.25060272216796875, 0.2607421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 9.0, 20.0, 26.0, 38.0, 58.0, 78.0, 150.0, 247.0, 329.0, 521.0, 818.0, 1411.0, 2263.0, 3786.0, 6605.0, 10928.0, 18431.0, 30251.0, 50395.0, 90707.0, 214321.0, 309923.0, 139188.0, 68053.0, 39716.0, 24255.0, 14456.0, 8544.0, 5197.0, 3037.0, 1809.0, 1078.0, 699.0, 449.0, 279.0, 161.0, 111.0, 61.0, 47.0, 26.0, 15.0, 9.0, 19.0, 10.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.06005859375, -0.05813789367675781, -0.056217193603515625, -0.05429649353027344, -0.05237579345703125, -0.05045509338378906, -0.048534393310546875, -0.04661369323730469, -0.0446929931640625, -0.04277229309082031, -0.040851593017578125, -0.03893089294433594, -0.03701019287109375, -0.03508949279785156, -0.033168792724609375, -0.031248092651367188, -0.029327392578125, -0.027406692504882812, -0.025485992431640625, -0.023565292358398438, -0.02164459228515625, -0.019723892211914062, -0.017803192138671875, -0.015882492065429688, -0.0139617919921875, -0.012041091918945312, -0.010120391845703125, -0.008199691772460938, -0.00627899169921875, -0.0043582916259765625, -0.002437591552734375, -0.0005168914794921875, 0.00140380859375, 0.0033245086669921875, 0.005245208740234375, 0.0071659088134765625, 0.00908660888671875, 0.011007308959960938, 0.012928009033203125, 0.014848709106445312, 0.0167694091796875, 0.018690109252929688, 0.020610809326171875, 0.022531509399414062, 0.02445220947265625, 0.026372909545898438, 0.028293609619140625, 0.030214309692382812, 0.032135009765625, 0.03405570983886719, 0.035976409912109375, 0.03789710998535156, 0.03981781005859375, 0.04173851013183594, 0.043659210205078125, 0.04557991027832031, 0.0475006103515625, 0.04942131042480469, 0.051342010498046875, 0.05326271057128906, 0.05518341064453125, 0.05710411071777344, 0.059024810791015625, 0.06094551086425781, 0.0628662109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 10.0, 9.0, 13.0, 10.0, 7.0, 19.0, 22.0, 19.0, 22.0, 33.0, 51.0, 62.0, 60.0, 57.0, 80.0, 75.0, 73.0, 69.0, 59.0, 58.0, 33.0, 33.0, 24.0, 18.0, 12.0, 14.0, 9.0, 8.0, 6.0, 4.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.9490718841552734e-05, -1.887138932943344e-05, -1.8252059817314148e-05, -1.7632730305194855e-05, -1.701340079307556e-05, -1.639407128095627e-05, -1.5774741768836975e-05, -1.5155412256717682e-05, -1.4536082744598389e-05, -1.3916753232479095e-05, -1.3297423720359802e-05, -1.2678094208240509e-05, -1.2058764696121216e-05, -1.1439435184001923e-05, -1.082010567188263e-05, -1.0200776159763336e-05, -9.581446647644043e-06, -8.96211713552475e-06, -8.342787623405457e-06, -7.723458111286163e-06, -7.10412859916687e-06, -6.484799087047577e-06, -5.865469574928284e-06, -5.2461400628089905e-06, -4.626810550689697e-06, -4.007481038570404e-06, -3.388151526451111e-06, -2.7688220143318176e-06, -2.1494925022125244e-06, -1.5301629900932312e-06, -9.10833477973938e-07, -2.915039658546448e-07, 3.2782554626464844e-07, 9.471550583839417e-07, 1.5664845705032349e-06, 2.185814082622528e-06, 2.8051435947418213e-06, 3.4244731068611145e-06, 4.043802618980408e-06, 4.663132131099701e-06, 5.282461643218994e-06, 5.901791155338287e-06, 6.5211206674575806e-06, 7.140450179576874e-06, 7.759779691696167e-06, 8.37910920381546e-06, 8.998438715934753e-06, 9.617768228054047e-06, 1.023709774017334e-05, 1.0856427252292633e-05, 1.1475756764411926e-05, 1.209508627653122e-05, 1.2714415788650513e-05, 1.3333745300769806e-05, 1.3953074812889099e-05, 1.4572404325008392e-05, 1.5191733837127686e-05, 1.581106334924698e-05, 1.6430392861366272e-05, 1.7049722373485565e-05, 1.766905188560486e-05, 1.828838139772415e-05, 1.8907710909843445e-05, 1.9527040421962738e-05, 2.014636993408203e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 14.0, 18.0, 16.0, 45.0, 54.0, 76.0, 149.0, 212.0, 470.0, 1131.0, 3442.0, 12577.0, 49333.0, 200210.0, 593471.0, 138040.0, 35612.0, 9197.0, 2668.0, 879.0, 413.0, 213.0, 125.0, 64.0, 42.0, 23.0, 21.0, 11.0, 8.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13232421875, -0.12730789184570312, -0.12229156494140625, -0.11727523803710938, -0.1122589111328125, -0.10724258422851562, -0.10222625732421875, -0.09720993041992188, -0.092193603515625, -0.08717727661132812, -0.08216094970703125, -0.07714462280273438, -0.0721282958984375, -0.06711196899414062, -0.06209564208984375, -0.057079315185546875, -0.05206298828125, -0.047046661376953125, -0.04203033447265625, -0.037014007568359375, -0.0319976806640625, -0.026981353759765625, -0.02196502685546875, -0.016948699951171875, -0.011932373046875, -0.006916046142578125, -0.00189971923828125, 0.003116607666015625, 0.0081329345703125, 0.013149261474609375, 0.01816558837890625, 0.023181915283203125, 0.0281982421875, 0.033214569091796875, 0.03823089599609375, 0.043247222900390625, 0.0482635498046875, 0.053279876708984375, 0.05829620361328125, 0.06331253051757812, 0.068328857421875, 0.07334518432617188, 0.07836151123046875, 0.08337783813476562, 0.0883941650390625, 0.09341049194335938, 0.09842681884765625, 0.10344314575195312, 0.10845947265625, 0.11347579956054688, 0.11849212646484375, 0.12350845336914062, 0.1285247802734375, 0.13354110717773438, 0.13855743408203125, 0.14357376098632812, 0.148590087890625, 0.15360641479492188, 0.15862274169921875, 0.16363906860351562, 0.1686553955078125, 0.17367172241210938, 0.17868804931640625, 0.18370437622070312, 0.188720703125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 2.0, 7.0, 10.0, 11.0, 13.0, 19.0, 15.0, 26.0, 38.0, 49.0, 55.0, 76.0, 98.0, 129.0, 111.0, 75.0, 46.0, 54.0, 28.0, 28.0, 19.0, 19.0, 14.0, 13.0, 15.0, 3.0, 2.0, 6.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08697509765625, -0.08394336700439453, -0.08091163635253906, -0.0778799057006836, -0.07484817504882812, -0.07181644439697266, -0.06878471374511719, -0.06575298309326172, -0.06272125244140625, -0.05968952178955078, -0.05665779113769531, -0.053626060485839844, -0.050594329833984375, -0.047562599182128906, -0.04453086853027344, -0.04149913787841797, -0.0384674072265625, -0.03543567657470703, -0.03240394592285156, -0.029372215270996094, -0.026340484619140625, -0.023308753967285156, -0.020277023315429688, -0.01724529266357422, -0.01421356201171875, -0.011181831359863281, -0.008150100708007812, -0.005118370056152344, -0.002086639404296875, 0.0009450912475585938, 0.0039768218994140625, 0.007008552551269531, 0.010040283203125, 0.013072013854980469, 0.016103744506835938, 0.019135475158691406, 0.022167205810546875, 0.025198936462402344, 0.028230667114257812, 0.03126239776611328, 0.03429412841796875, 0.03732585906982422, 0.04035758972167969, 0.043389320373535156, 0.046421051025390625, 0.049452781677246094, 0.05248451232910156, 0.05551624298095703, 0.0585479736328125, 0.06157970428466797, 0.06461143493652344, 0.0676431655883789, 0.07067489624023438, 0.07370662689208984, 0.07673835754394531, 0.07977008819580078, 0.08280181884765625, 0.08583354949951172, 0.08886528015136719, 0.09189701080322266, 0.09492874145507812, 0.0979604721069336, 0.10099220275878906, 0.10402393341064453, 0.1070556640625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 7.0, 17.0, 26.0, 61.0, 113.0, 169.0, 217.0, 182.0, 124.0, 63.0, 24.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6537616848945618, -0.5969516634941101, -0.5401415824890137, -0.483331561088562, -0.42652150988578796, -0.3697114586830139, -0.31290143728256226, -0.2560913860797882, -0.19928133487701416, -0.1424712836742401, -0.08566124737262726, -0.028851211071014404, 0.027958840131759644, 0.08476889133453369, 0.14157891273498535, 0.1983889639377594, 0.25519901514053345, 0.3120090663433075, 0.36881911754608154, 0.4256291389465332, 0.48243919014930725, 0.5392492413520813, 0.596059262752533, 0.6528693437576294, 0.709679365158081, 0.7664893865585327, 0.8232994675636292, 0.8801094889640808, 0.9369195699691772, 0.9937295913696289, 1.0505396127700806, 1.1073496341705322, 1.1641597747802734, 1.220969796180725, 1.2777798175811768, 1.334589958190918, 1.3913999795913696, 1.4482100009918213, 1.505020022392273, 1.5618300437927246, 1.6186401844024658, 1.6754502058029175, 1.7322602272033691, 1.7890703678131104, 1.845880389213562, 1.9026904106140137, 1.9595004320144653, 2.016310453414917, 2.073120594024658, 2.1299307346343994, 2.1867406368255615, 2.2435507774353027, 2.300360679626465, 2.357170820236206, 2.4139809608459473, 2.4707908630371094, 2.5276007652282715, 2.5844109058380127, 2.641220808029175, 2.698030948638916, 2.754840850830078, 2.8116509914398193, 2.8684611320495605, 2.9252710342407227, 2.982081174850464]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 9.0, 4.0, 5.0, 9.0, 12.0, 15.0, 14.0, 14.0, 22.0, 28.0, 18.0, 30.0, 33.0, 32.0, 22.0, 31.0, 32.0, 36.0, 42.0, 50.0, 40.0, 34.0, 34.0, 34.0, 33.0, 38.0, 37.0, 38.0, 25.0, 31.0, 32.0, 19.0, 16.0, 18.0, 10.0, 20.0, 15.0, 12.0, 7.0, 8.0, 10.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5651933550834656, -0.5453123450279236, -0.5254312753677368, -0.5055502653121948, -0.48566919565200806, -0.46578818559646606, -0.4459071457386017, -0.4260261058807373, -0.4061450660228729, -0.38626402616500854, -0.36638298630714417, -0.3465019464492798, -0.3266209363937378, -0.306739866733551, -0.28685885667800903, -0.26697781682014465, -0.24709677696228027, -0.2272157371044159, -0.2073346972465515, -0.18745367228984833, -0.16757263243198395, -0.14769159257411957, -0.12781056761741638, -0.107929527759552, -0.08804848790168762, -0.06816744804382324, -0.04828641563653946, -0.028405379503965378, -0.008524343371391296, 0.011356696486473083, 0.031237728893756866, 0.05111876130104065, 0.07099980115890503, 0.09088084101676941, 0.11076187342405319, 0.13064290583133698, 0.15052394568920135, 0.17040498554706573, 0.19028601050376892, 0.2101670503616333, 0.23004809021949768, 0.24992913007736206, 0.26981016993522644, 0.2896912097930908, 0.3095722198486328, 0.3294532895088196, 0.3493342995643616, 0.36921533942222595, 0.38909637928009033, 0.4089774191379547, 0.4288584589958191, 0.44873949885368347, 0.46862053871154785, 0.48850154876708984, 0.5083826184272766, 0.5282636284828186, 0.5481446981430054, 0.5680257081985474, 0.5879067778587341, 0.6077877879142761, 0.6276688575744629, 0.6475498676300049, 0.6674309372901917, 0.6873119473457336, 0.7071929574012756]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 18.0, 18.0, 29.0, 39.0, 35.0, 78.0, 88.0, 108.0, 202.0, 306.0, 473.0, 728.0, 1211.0, 2159.0, 3658.0, 6483.0, 12374.0, 25758.0, 57899.0, 150253.0, 495527.0, 2043889.0, 979325.0, 249045.0, 89441.0, 37592.0, 17332.0, 8777.0, 4716.0, 2696.0, 1543.0, 829.0, 578.0, 365.0, 206.0, 160.0, 91.0, 70.0, 42.0, 31.0, 28.0, 17.0, 19.0, 9.0, 6.0, 9.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.1179208755493164, -0.11395454406738281, -0.10998821258544922, -0.10602188110351562, -0.10205554962158203, -0.09808921813964844, -0.09412288665771484, -0.09015655517578125, -0.08619022369384766, -0.08222389221191406, -0.07825756072998047, -0.07429122924804688, -0.07032489776611328, -0.06635856628417969, -0.062392234802246094, -0.0584259033203125, -0.054459571838378906, -0.05049324035644531, -0.04652690887451172, -0.042560577392578125, -0.03859424591064453, -0.03462791442871094, -0.030661582946777344, -0.02669525146484375, -0.022728919982910156, -0.018762588500976562, -0.014796257019042969, -0.010829925537109375, -0.006863594055175781, -0.0028972625732421875, 0.0010690689086914062, 0.005035400390625, 0.009001731872558594, 0.012968063354492188, 0.01693439483642578, 0.020900726318359375, 0.02486705780029297, 0.028833389282226562, 0.032799720764160156, 0.03676605224609375, 0.040732383728027344, 0.04469871520996094, 0.04866504669189453, 0.052631378173828125, 0.05659770965576172, 0.06056404113769531, 0.0645303726196289, 0.0684967041015625, 0.0724630355834961, 0.07642936706542969, 0.08039569854736328, 0.08436203002929688, 0.08832836151123047, 0.09229469299316406, 0.09626102447509766, 0.10022735595703125, 0.10419368743896484, 0.10816001892089844, 0.11212635040283203, 0.11609268188476562, 0.12005901336669922, 0.12402534484863281, 0.1279916763305664, 0.1319580078125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 4.0, 2.0, 7.0, 10.0, 9.0, 9.0, 14.0, 17.0, 20.0, 10.0, 29.0, 31.0, 34.0, 30.0, 20.0, 36.0, 41.0, 33.0, 48.0, 50.0, 34.0, 49.0, 47.0, 42.0, 35.0, 46.0, 28.0, 26.0, 32.0, 28.0, 19.0, 21.0, 25.0, 18.0, 11.0, 13.0, 14.0, 7.0, 6.0, 7.0, 9.0, 3.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.08343505859375, -0.08101940155029297, -0.07860374450683594, -0.0761880874633789, -0.07377243041992188, -0.07135677337646484, -0.06894111633300781, -0.06652545928955078, -0.06410980224609375, -0.06169414520263672, -0.05927848815917969, -0.056862831115722656, -0.054447174072265625, -0.052031517028808594, -0.04961585998535156, -0.04720020294189453, -0.0447845458984375, -0.04236888885498047, -0.03995323181152344, -0.037537574768066406, -0.035121917724609375, -0.032706260681152344, -0.030290603637695312, -0.02787494659423828, -0.02545928955078125, -0.02304363250732422, -0.020627975463867188, -0.018212318420410156, -0.015796661376953125, -0.013381004333496094, -0.010965347290039062, -0.008549690246582031, -0.006134033203125, -0.0037183761596679688, -0.0013027191162109375, 0.0011129379272460938, 0.003528594970703125, 0.005944252014160156, 0.008359909057617188, 0.010775566101074219, 0.01319122314453125, 0.015606880187988281, 0.018022537231445312, 0.020438194274902344, 0.022853851318359375, 0.025269508361816406, 0.027685165405273438, 0.03010082244873047, 0.0325164794921875, 0.03493213653564453, 0.03734779357910156, 0.039763450622558594, 0.042179107666015625, 0.044594764709472656, 0.04701042175292969, 0.04942607879638672, 0.05184173583984375, 0.05425739288330078, 0.05667304992675781, 0.059088706970214844, 0.061504364013671875, 0.0639200210571289, 0.06633567810058594, 0.06875133514404297, 0.0711669921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 3.0, 5.0, 7.0, 13.0, 22.0, 35.0, 42.0, 70.0, 93.0, 125.0, 243.0, 397.0, 661.0, 1244.0, 2470.0, 5229.0, 12201.0, 31351.0, 96724.0, 364841.0, 2061741.0, 1262474.0, 243681.0, 69194.0, 23538.0, 9379.0, 3969.0, 1971.0, 1057.0, 544.0, 330.0, 212.0, 125.0, 90.0, 55.0, 37.0, 29.0, 24.0, 11.0, 14.0, 11.0, 8.0, 4.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.25830078125, -0.25089073181152344, -0.24348068237304688, -0.2360706329345703, -0.22866058349609375, -0.2212505340576172, -0.21384048461914062, -0.20643043518066406, -0.1990203857421875, -0.19161033630371094, -0.18420028686523438, -0.1767902374267578, -0.16938018798828125, -0.1619701385498047, -0.15456008911132812, -0.14715003967285156, -0.139739990234375, -0.13232994079589844, -0.12491989135742188, -0.11750984191894531, -0.11009979248046875, -0.10268974304199219, -0.09527969360351562, -0.08786964416503906, -0.0804595947265625, -0.07304954528808594, -0.06563949584960938, -0.05822944641113281, -0.05081939697265625, -0.04340934753417969, -0.035999298095703125, -0.028589248657226562, -0.02117919921875, -0.013769149780273438, -0.006359100341796875, 0.0010509490966796875, 0.00846099853515625, 0.015871047973632812, 0.023281097412109375, 0.030691146850585938, 0.0381011962890625, 0.04551124572753906, 0.052921295166015625, 0.06033134460449219, 0.06774139404296875, 0.07515144348144531, 0.08256149291992188, 0.08997154235839844, 0.097381591796875, 0.10479164123535156, 0.11220169067382812, 0.11961174011230469, 0.12702178955078125, 0.1344318389892578, 0.14184188842773438, 0.14925193786621094, 0.1566619873046875, 0.16407203674316406, 0.17148208618164062, 0.1788921356201172, 0.18630218505859375, 0.1937122344970703, 0.20112228393554688, 0.20853233337402344, 0.2159423828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 7.0, 14.0, 19.0, 21.0, 35.0, 46.0, 76.0, 116.0, 153.0, 285.0, 449.0, 808.0, 783.0, 398.0, 258.0, 184.0, 118.0, 100.0, 55.0, 33.0, 25.0, 20.0, 16.0, 14.0, 8.0, 8.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2064208984375, -0.1990489959716797, -0.19167709350585938, -0.18430519104003906, -0.17693328857421875, -0.16956138610839844, -0.16218948364257812, -0.1548175811767578, -0.1474456787109375, -0.1400737762451172, -0.13270187377929688, -0.12532997131347656, -0.11795806884765625, -0.11058616638183594, -0.10321426391601562, -0.09584236145019531, -0.088470458984375, -0.08109855651855469, -0.07372665405273438, -0.06635475158691406, -0.05898284912109375, -0.05161094665527344, -0.044239044189453125, -0.03686714172363281, -0.0294952392578125, -0.022123336791992188, -0.014751434326171875, -0.0073795318603515625, -7.62939453125e-06, 0.0073642730712890625, 0.014736175537109375, 0.022108078002929688, 0.02947998046875, 0.03685188293457031, 0.044223785400390625, 0.05159568786621094, 0.05896759033203125, 0.06633949279785156, 0.07371139526367188, 0.08108329772949219, 0.0884552001953125, 0.09582710266113281, 0.10319900512695312, 0.11057090759277344, 0.11794281005859375, 0.12531471252441406, 0.13268661499023438, 0.1400585174560547, 0.147430419921875, 0.1548023223876953, 0.16217422485351562, 0.16954612731933594, 0.17691802978515625, 0.18428993225097656, 0.19166183471679688, 0.1990337371826172, 0.2064056396484375, 0.2137775421142578, 0.22114944458007812, 0.22852134704589844, 0.23589324951171875, 0.24326515197753906, 0.2506370544433594, 0.2580089569091797, 0.265380859375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 4.0, 13.0, 20.0, 33.0, 45.0, 58.0, 75.0, 89.0, 103.0, 123.0, 95.0, 96.0, 87.0, 43.0, 47.0, 26.0, 19.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9431825876235962, -0.9066481590270996, -0.870113730430603, -0.8335792422294617, -0.7970448136329651, -0.7605103850364685, -0.7239758968353271, -0.6874414682388306, -0.650907039642334, -0.6143726110458374, -0.5778381824493408, -0.5413036942481995, -0.5047692656517029, -0.4682348370552063, -0.43170037865638733, -0.39516592025756836, -0.3586314916610718, -0.3220970630645752, -0.2855626046657562, -0.24902816116809845, -0.21249371767044067, -0.1759592741727829, -0.13942483067512512, -0.10289037227630615, -0.06635594367980957, -0.029821500182151794, 0.0067129433155059814, 0.04324738681316376, 0.07978183031082153, 0.11631627380847931, 0.15285071730613708, 0.18938517570495605, 0.22591948509216309, 0.26245391368865967, 0.29898837208747864, 0.3355228304862976, 0.3720572590827942, 0.40859168767929077, 0.44512614607810974, 0.4816606044769287, 0.5181950330734253, 0.5547294616699219, 0.5912638902664185, 0.6277983784675598, 0.6643328070640564, 0.700867235660553, 0.7374017238616943, 0.7739361524581909, 0.8104705810546875, 0.8470050096511841, 0.8835394382476807, 0.920073926448822, 0.9566083550453186, 0.9931427836418152, 1.0296772718429565, 1.0662117004394531, 1.1027461290359497, 1.1392805576324463, 1.1758149862289429, 1.2123494148254395, 1.2488839626312256, 1.2854183912277222, 1.3219528198242188, 1.3584872484207153, 1.395021677017212]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 8.0, 8.0, 14.0, 19.0, 18.0, 18.0, 20.0, 23.0, 31.0, 35.0, 30.0, 47.0, 41.0, 41.0, 47.0, 46.0, 37.0, 42.0, 45.0, 39.0, 45.0, 49.0, 40.0, 29.0, 30.0, 16.0, 26.0, 16.0, 19.0, 21.0, 19.0, 20.0, 9.0, 7.0, 8.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6378845572471619, -0.618523895740509, -0.5991631746292114, -0.5798025131225586, -0.560441792011261, -0.5410811305046082, -0.5217204093933105, -0.5023597478866577, -0.4829990565776825, -0.4636383652687073, -0.44427767395973206, -0.42491698265075684, -0.405556321144104, -0.3861956000328064, -0.36683493852615356, -0.34747424721717834, -0.3281135559082031, -0.3087528645992279, -0.2893921732902527, -0.27003148198127747, -0.25067079067230225, -0.23131011426448822, -0.2119494378566742, -0.19258874654769897, -0.17322805523872375, -0.15386736392974854, -0.13450667262077332, -0.11514599621295929, -0.09578530490398407, -0.07642461359500885, -0.05706392973661423, -0.037703245878219604, -0.01834261417388916, 0.001018073409795761, 0.020378760993480682, 0.039739448577165604, 0.059100136160850525, 0.07846082746982574, 0.09782151132822037, 0.11718219518661499, 0.1365428864955902, 0.15590357780456543, 0.17526426911354065, 0.19462494552135468, 0.2139856368303299, 0.23334632813930511, 0.25270700454711914, 0.27206769585609436, 0.2914283871650696, 0.3107890784740448, 0.33014976978302, 0.34951046109199524, 0.36887115240097046, 0.3882318139076233, 0.4075925052165985, 0.42695319652557373, 0.44631388783454895, 0.46567457914352417, 0.4850352704524994, 0.5043959617614746, 0.5237566232681274, 0.543117344379425, 0.5624780058860779, 0.5818387269973755, 0.6011993885040283]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 7.0, 8.0, 9.0, 21.0, 23.0, 39.0, 58.0, 106.0, 147.0, 168.0, 277.0, 470.0, 662.0, 998.0, 1579.0, 2520.0, 3773.0, 6056.0, 9515.0, 15038.0, 24688.0, 40292.0, 69438.0, 129520.0, 251934.0, 223280.0, 111440.0, 61096.0, 35969.0, 22040.0, 13527.0, 8613.0, 5521.0, 3354.0, 2184.0, 1468.0, 920.0, 619.0, 408.0, 246.0, 167.0, 116.0, 91.0, 48.0, 37.0, 17.0, 19.0, 15.0, 5.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1314697265625, -0.12691879272460938, -0.12236785888671875, -0.11781692504882812, -0.1132659912109375, -0.10871505737304688, -0.10416412353515625, -0.09961318969726562, -0.095062255859375, -0.09051132202148438, -0.08596038818359375, -0.08140945434570312, -0.0768585205078125, -0.07230758666992188, -0.06775665283203125, -0.06320571899414062, -0.05865478515625, -0.054103851318359375, -0.04955291748046875, -0.045001983642578125, -0.0404510498046875, -0.035900115966796875, -0.03134918212890625, -0.026798248291015625, -0.022247314453125, -0.017696380615234375, -0.01314544677734375, -0.008594512939453125, -0.0040435791015625, 0.000507354736328125, 0.00505828857421875, 0.009609222412109375, 0.01416015625, 0.018711090087890625, 0.02326202392578125, 0.027812957763671875, 0.0323638916015625, 0.036914825439453125, 0.04146575927734375, 0.046016693115234375, 0.050567626953125, 0.055118560791015625, 0.05966949462890625, 0.06422042846679688, 0.0687713623046875, 0.07332229614257812, 0.07787322998046875, 0.08242416381835938, 0.08697509765625, 0.09152603149414062, 0.09607696533203125, 0.10062789916992188, 0.1051788330078125, 0.10972976684570312, 0.11428070068359375, 0.11883163452148438, 0.123382568359375, 0.12793350219726562, 0.13248443603515625, 0.13703536987304688, 0.1415863037109375, 0.14613723754882812, 0.15068817138671875, 0.15523910522460938, 0.1597900390625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 6.0, 7.0, 8.0, 5.0, 4.0, 5.0, 11.0, 10.0, 13.0, 14.0, 17.0, 17.0, 29.0, 27.0, 39.0, 37.0, 35.0, 49.0, 36.0, 37.0, 51.0, 38.0, 43.0, 35.0, 46.0, 47.0, 37.0, 50.0, 28.0, 44.0, 35.0, 18.0, 23.0, 17.0, 10.0, 15.0, 11.0, 10.0, 8.0, 9.0, 4.0, 6.0, 3.0, 6.0, 2.0, 5.0, 1.0, 0.0, 4.0, 1.0], "bins": [-0.097900390625, -0.09518623352050781, -0.09247207641601562, -0.08975791931152344, -0.08704376220703125, -0.08432960510253906, -0.08161544799804688, -0.07890129089355469, -0.0761871337890625, -0.07347297668457031, -0.07075881958007812, -0.06804466247558594, -0.06533050537109375, -0.06261634826660156, -0.059902191162109375, -0.05718803405761719, -0.054473876953125, -0.05175971984863281, -0.049045562744140625, -0.04633140563964844, -0.04361724853515625, -0.04090309143066406, -0.038188934326171875, -0.03547477722167969, -0.0327606201171875, -0.030046463012695312, -0.027332305908203125, -0.024618148803710938, -0.02190399169921875, -0.019189834594726562, -0.016475677490234375, -0.013761520385742188, -0.01104736328125, -0.008333206176757812, -0.005619049072265625, -0.0029048919677734375, -0.00019073486328125, 0.0025234222412109375, 0.005237579345703125, 0.007951736450195312, 0.0106658935546875, 0.013380050659179688, 0.016094207763671875, 0.018808364868164062, 0.02152252197265625, 0.024236679077148438, 0.026950836181640625, 0.029664993286132812, 0.032379150390625, 0.03509330749511719, 0.037807464599609375, 0.04052162170410156, 0.04323577880859375, 0.04594993591308594, 0.048664093017578125, 0.05137825012207031, 0.0540924072265625, 0.05680656433105469, 0.059520721435546875, 0.06223487854003906, 0.06494903564453125, 0.06766319274902344, 0.07037734985351562, 0.07309150695800781, 0.0758056640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 10.0, 9.0, 7.0, 12.0, 15.0, 26.0, 27.0, 39.0, 39.0, 69.0, 84.0, 104.0, 157.0, 269.0, 517.0, 986.0, 2189.0, 5309.0, 13107.0, 33432.0, 89344.0, 284334.0, 407582.0, 132306.0, 46977.0, 18416.0, 7298.0, 2965.0, 1236.0, 634.0, 347.0, 169.0, 131.0, 97.0, 75.0, 62.0, 36.0, 29.0, 28.0, 13.0, 15.0, 11.0, 10.0, 6.0, 7.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0], "bins": [-0.29638671875, -0.2879619598388672, -0.2795372009277344, -0.27111244201660156, -0.26268768310546875, -0.25426292419433594, -0.24583816528320312, -0.2374134063720703, -0.2289886474609375, -0.2205638885498047, -0.21213912963867188, -0.20371437072753906, -0.19528961181640625, -0.18686485290527344, -0.17844009399414062, -0.1700153350830078, -0.161590576171875, -0.1531658172607422, -0.14474105834960938, -0.13631629943847656, -0.12789154052734375, -0.11946678161621094, -0.11104202270507812, -0.10261726379394531, -0.0941925048828125, -0.08576774597167969, -0.07734298706054688, -0.06891822814941406, -0.06049346923828125, -0.05206871032714844, -0.043643951416015625, -0.03521919250488281, -0.02679443359375, -0.018369674682617188, -0.009944915771484375, -0.0015201568603515625, 0.00690460205078125, 0.015329360961914062, 0.023754119873046875, 0.03217887878417969, 0.0406036376953125, 0.04902839660644531, 0.057453155517578125, 0.06587791442871094, 0.07430267333984375, 0.08272743225097656, 0.09115219116210938, 0.09957695007324219, 0.108001708984375, 0.11642646789550781, 0.12485122680664062, 0.13327598571777344, 0.14170074462890625, 0.15012550354003906, 0.15855026245117188, 0.1669750213623047, 0.1753997802734375, 0.1838245391845703, 0.19224929809570312, 0.20067405700683594, 0.20909881591796875, 0.21752357482910156, 0.22594833374023438, 0.2343730926513672, 0.2427978515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 3.0, 7.0, 6.0, 13.0, 7.0, 16.0, 16.0, 15.0, 20.0, 16.0, 24.0, 25.0, 23.0, 33.0, 32.0, 38.0, 52.0, 46.0, 35.0, 42.0, 34.0, 54.0, 38.0, 45.0, 26.0, 35.0, 34.0, 32.0, 29.0, 25.0, 29.0, 24.0, 21.0, 18.0, 10.0, 12.0, 9.0, 14.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.276611328125, -0.2676277160644531, -0.25864410400390625, -0.24966049194335938, -0.2406768798828125, -0.23169326782226562, -0.22270965576171875, -0.21372604370117188, -0.204742431640625, -0.19575881958007812, -0.18677520751953125, -0.17779159545898438, -0.1688079833984375, -0.15982437133789062, -0.15084075927734375, -0.14185714721679688, -0.13287353515625, -0.12388992309570312, -0.11490631103515625, -0.10592269897460938, -0.0969390869140625, -0.08795547485351562, -0.07897186279296875, -0.06998825073242188, -0.061004638671875, -0.052021026611328125, -0.04303741455078125, -0.034053802490234375, -0.0250701904296875, -0.016086578369140625, -0.00710296630859375, 0.001880645751953125, 0.0108642578125, 0.019847869873046875, 0.02883148193359375, 0.037815093994140625, 0.0467987060546875, 0.055782318115234375, 0.06476593017578125, 0.07374954223632812, 0.082733154296875, 0.09171676635742188, 0.10070037841796875, 0.10968399047851562, 0.1186676025390625, 0.12765121459960938, 0.13663482666015625, 0.14561843872070312, 0.15460205078125, 0.16358566284179688, 0.17256927490234375, 0.18155288696289062, 0.1905364990234375, 0.19952011108398438, 0.20850372314453125, 0.21748733520507812, 0.226470947265625, 0.23545455932617188, 0.24443817138671875, 0.2534217834472656, 0.2624053955078125, 0.2713890075683594, 0.28037261962890625, 0.2893562316894531, 0.29833984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 15.0, 14.0, 29.0, 41.0, 27.0, 72.0, 86.0, 150.0, 251.0, 468.0, 988.0, 2102.0, 5815.0, 17178.0, 57656.0, 238253.0, 539285.0, 132201.0, 35414.0, 11223.0, 4003.0, 1632.0, 704.0, 369.0, 175.0, 119.0, 76.0, 53.0, 41.0, 25.0, 18.0, 21.0, 14.0, 9.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.231689453125, -0.22564125061035156, -0.21959304809570312, -0.2135448455810547, -0.20749664306640625, -0.2014484405517578, -0.19540023803710938, -0.18935203552246094, -0.1833038330078125, -0.17725563049316406, -0.17120742797851562, -0.1651592254638672, -0.15911102294921875, -0.1530628204345703, -0.14701461791992188, -0.14096641540527344, -0.134918212890625, -0.12887001037597656, -0.12282180786132812, -0.11677360534667969, -0.11072540283203125, -0.10467720031738281, -0.09862899780273438, -0.09258079528808594, -0.0865325927734375, -0.08048439025878906, -0.07443618774414062, -0.06838798522949219, -0.06233978271484375, -0.05629158020019531, -0.050243377685546875, -0.04419517517089844, -0.03814697265625, -0.03209877014160156, -0.026050567626953125, -0.020002365112304688, -0.01395416259765625, -0.007905960083007812, -0.001857757568359375, 0.0041904449462890625, 0.0102386474609375, 0.016286849975585938, 0.022335052490234375, 0.028383255004882812, 0.03443145751953125, 0.04047966003417969, 0.046527862548828125, 0.05257606506347656, 0.058624267578125, 0.06467247009277344, 0.07072067260742188, 0.07676887512207031, 0.08281707763671875, 0.08886528015136719, 0.09491348266601562, 0.10096168518066406, 0.1070098876953125, 0.11305809020996094, 0.11910629272460938, 0.1251544952392578, 0.13120269775390625, 0.1372509002685547, 0.14329910278320312, 0.14934730529785156, 0.1553955078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 4.0, 6.0, 6.0, 8.0, 10.0, 16.0, 16.0, 17.0, 31.0, 38.0, 50.0, 65.0, 109.0, 116.0, 98.0, 87.0, 64.0, 48.0, 49.0, 21.0, 22.0, 25.0, 10.0, 18.0, 11.0, 9.0, 6.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.2961368560791016e-05, -3.192666918039322e-05, -3.089196979999542e-05, -2.9857270419597626e-05, -2.882257103919983e-05, -2.7787871658802032e-05, -2.6753172278404236e-05, -2.571847289800644e-05, -2.4683773517608643e-05, -2.3649074137210846e-05, -2.261437475681305e-05, -2.1579675376415253e-05, -2.0544975996017456e-05, -1.951027661561966e-05, -1.8475577235221863e-05, -1.7440877854824066e-05, -1.640617847442627e-05, -1.5371479094028473e-05, -1.4336779713630676e-05, -1.330208033323288e-05, -1.2267380952835083e-05, -1.1232681572437286e-05, -1.019798219203949e-05, -9.163282811641693e-06, -8.128583431243896e-06, -7.0938840508461e-06, -6.059184670448303e-06, -5.024485290050507e-06, -3.98978590965271e-06, -2.9550865292549133e-06, -1.9203871488571167e-06, -8.856877684593201e-07, 1.4901161193847656e-07, 1.1837109923362732e-06, 2.21841037273407e-06, 3.2531097531318665e-06, 4.287809133529663e-06, 5.32250851392746e-06, 6.357207894325256e-06, 7.391907274723053e-06, 8.42660665512085e-06, 9.461306035518646e-06, 1.0496005415916443e-05, 1.153070479631424e-05, 1.2565404176712036e-05, 1.3600103557109833e-05, 1.463480293750763e-05, 1.5669502317905426e-05, 1.6704201698303223e-05, 1.773890107870102e-05, 1.8773600459098816e-05, 1.9808299839496613e-05, 2.084299921989441e-05, 2.1877698600292206e-05, 2.2912397980690002e-05, 2.39470973610878e-05, 2.4981796741485596e-05, 2.6016496121883392e-05, 2.705119550228119e-05, 2.8085894882678986e-05, 2.9120594263076782e-05, 3.015529364347458e-05, 3.1189993023872375e-05, 3.222469240427017e-05, 3.325939178466797e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 18.0, 14.0, 24.0, 25.0, 47.0, 81.0, 149.0, 302.0, 759.0, 1772.0, 4772.0, 18098.0, 99817.0, 588102.0, 276911.0, 43277.0, 9391.0, 2882.0, 1108.0, 481.0, 212.0, 118.0, 68.0, 35.0, 15.0, 14.0, 11.0, 12.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.226806640625, -0.2194347381591797, -0.21206283569335938, -0.20469093322753906, -0.19731903076171875, -0.18994712829589844, -0.18257522583007812, -0.1752033233642578, -0.1678314208984375, -0.1604595184326172, -0.15308761596679688, -0.14571571350097656, -0.13834381103515625, -0.13097190856933594, -0.12360000610351562, -0.11622810363769531, -0.108856201171875, -0.10148429870605469, -0.09411239624023438, -0.08674049377441406, -0.07936859130859375, -0.07199668884277344, -0.06462478637695312, -0.05725288391113281, -0.0498809814453125, -0.04250907897949219, -0.035137176513671875, -0.027765274047851562, -0.02039337158203125, -0.013021469116210938, -0.005649566650390625, 0.0017223358154296875, 0.00909423828125, 0.016466140747070312, 0.023838043212890625, 0.031209945678710938, 0.03858184814453125, 0.04595375061035156, 0.053325653076171875, 0.06069755554199219, 0.0680694580078125, 0.07544136047363281, 0.08281326293945312, 0.09018516540527344, 0.09755706787109375, 0.10492897033691406, 0.11230087280273438, 0.11967277526855469, 0.127044677734375, 0.1344165802001953, 0.14178848266601562, 0.14916038513183594, 0.15653228759765625, 0.16390419006347656, 0.17127609252929688, 0.1786479949951172, 0.1860198974609375, 0.1933917999267578, 0.20076370239257812, 0.20813560485839844, 0.21550750732421875, 0.22287940979003906, 0.23025131225585938, 0.2376232147216797, 0.2449951171875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 9.0, 7.0, 4.0, 8.0, 13.0, 15.0, 24.0, 38.0, 56.0, 59.0, 94.0, 139.0, 110.0, 122.0, 84.0, 50.0, 38.0, 30.0, 27.0, 13.0, 17.0, 6.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165283203125, -0.1596393585205078, -0.15399551391601562, -0.14835166931152344, -0.14270782470703125, -0.13706398010253906, -0.13142013549804688, -0.1257762908935547, -0.1201324462890625, -0.11448860168457031, -0.10884475708007812, -0.10320091247558594, -0.09755706787109375, -0.09191322326660156, -0.08626937866210938, -0.08062553405761719, -0.074981689453125, -0.06933784484863281, -0.06369400024414062, -0.05805015563964844, -0.05240631103515625, -0.04676246643066406, -0.041118621826171875, -0.03547477722167969, -0.0298309326171875, -0.024187088012695312, -0.018543243408203125, -0.012899398803710938, -0.00725555419921875, -0.0016117095947265625, 0.004032135009765625, 0.009675979614257812, 0.01531982421875, 0.020963668823242188, 0.026607513427734375, 0.03225135803222656, 0.03789520263671875, 0.04353904724121094, 0.049182891845703125, 0.05482673645019531, 0.0604705810546875, 0.06611442565917969, 0.07175827026367188, 0.07740211486816406, 0.08304595947265625, 0.08868980407714844, 0.09433364868164062, 0.09997749328613281, 0.105621337890625, 0.11126518249511719, 0.11690902709960938, 0.12255287170410156, 0.12819671630859375, 0.13384056091308594, 0.13948440551757812, 0.1451282501220703, 0.1507720947265625, 0.1564159393310547, 0.16205978393554688, 0.16770362854003906, 0.17334747314453125, 0.17899131774902344, 0.18463516235351562, 0.1902790069580078, 0.1959228515625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 8.0, 16.0, 19.0, 48.0, 86.0, 139.0, 181.0, 176.0, 156.0, 77.0, 55.0, 19.0, 14.0, 9.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4526896476745605, -2.3807754516601562, -2.308861255645752, -2.2369470596313477, -2.1650328636169434, -2.09311842918396, -2.0212042331695557, -1.9492900371551514, -1.877375841140747, -1.8054616451263428, -1.7335474491119385, -1.6616331338882446, -1.5897189378738403, -1.517804741859436, -1.4458904266357422, -1.373976230621338, -1.3020620346069336, -1.2301478385925293, -1.158233642578125, -1.0863193273544312, -1.0144051313400269, -0.9424909353256226, -0.8705766797065735, -0.7986624240875244, -0.7267482280731201, -0.6548340320587158, -0.5829197764396667, -0.5110055208206177, -0.4390913248062134, -0.3671770989894867, -0.29526287317276, -0.22334861755371094, -0.15143442153930664, -0.07952019572257996, -0.0076059699058532715, 0.06430825591087341, 0.1362224817276001, 0.20813670754432678, 0.28005093336105347, 0.35196518898010254, 0.42387938499450684, 0.4957936108112335, 0.5677078366279602, 0.6396220922470093, 0.7115362882614136, 0.7834504842758179, 0.8553647398948669, 0.927278995513916, 0.9991931915283203, 1.0711073875427246, 1.143021583557129, 1.2149358987808228, 1.286850094795227, 1.3587642908096313, 1.4306786060333252, 1.5025928020477295, 1.5745069980621338, 1.646421194076538, 1.7183353900909424, 1.7902497053146362, 1.8621639013290405, 1.9340780973434448, 2.0059924125671387, 2.077906608581543, 2.1498208045959473]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 2.0, 0.0, 4.0, 6.0, 6.0, 5.0, 5.0, 12.0, 6.0, 11.0, 20.0, 21.0, 22.0, 18.0, 20.0, 26.0, 34.0, 25.0, 33.0, 35.0, 35.0, 45.0, 46.0, 33.0, 39.0, 28.0, 40.0, 46.0, 34.0, 31.0, 34.0, 35.0, 31.0, 23.0, 30.0, 27.0, 20.0, 25.0, 10.0, 13.0, 9.0, 15.0, 4.0, 5.0, 5.0, 7.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.7390925884246826, -0.7134337425231934, -0.6877748966217041, -0.6621159911155701, -0.6364571452140808, -0.6107982993125916, -0.5851394534111023, -0.5594805479049683, -0.533821702003479, -0.5081628561019897, -0.4825039803981781, -0.45684513449668884, -0.4311862587928772, -0.40552741289138794, -0.3798685669898987, -0.35420969128608704, -0.3285508453845978, -0.3028919994831085, -0.2772331237792969, -0.2515742778778076, -0.22591540217399597, -0.2002565562725067, -0.17459769546985626, -0.1489388346672058, -0.12327997386455536, -0.09762111306190491, -0.07196225225925446, -0.0463033989071846, -0.02064453810453415, 0.005014315247535706, 0.030673176050186157, 0.05633203685283661, 0.08199089765548706, 0.10764975845813751, 0.13330861926078796, 0.15896746516227722, 0.18462634086608887, 0.21028518676757812, 0.23594404757022858, 0.26160290837287903, 0.2872617840766907, 0.31292062997817993, 0.3385795056819916, 0.36423835158348083, 0.3898972272872925, 0.41555607318878174, 0.441214919090271, 0.46687379479408264, 0.4925326406955719, 0.5181915163993835, 0.5438503623008728, 0.5695092082023621, 0.5951680541038513, 0.6208269596099854, 0.6464858055114746, 0.6721446514129639, 0.6978034973144531, 0.7234623432159424, 0.7491211891174316, 0.7747800946235657, 0.8004389405250549, 0.8260977864265442, 0.8517566323280334, 0.8774155378341675, 0.9030743837356567]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 5.0, 0.0, 9.0, 10.0, 15.0, 17.0, 14.0, 31.0, 40.0, 69.0, 108.0, 184.0, 321.0, 544.0, 913.0, 1890.0, 3890.0, 8443.0, 20483.0, 52011.0, 148432.0, 523441.0, 2222548.0, 875821.0, 216489.0, 71538.0, 26643.0, 10702.0, 4767.0, 2260.0, 1167.0, 628.0, 326.0, 181.0, 111.0, 80.0, 40.0, 38.0, 26.0, 21.0, 7.0, 5.0, 6.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1546630859375, -0.14944839477539062, -0.14423370361328125, -0.13901901245117188, -0.1338043212890625, -0.12858963012695312, -0.12337493896484375, -0.11816024780273438, -0.112945556640625, -0.10773086547851562, -0.10251617431640625, -0.09730148315429688, -0.0920867919921875, -0.08687210083007812, -0.08165740966796875, -0.07644271850585938, -0.07122802734375, -0.06601333618164062, -0.06079864501953125, -0.055583953857421875, -0.0503692626953125, -0.045154571533203125, -0.03993988037109375, -0.034725189208984375, -0.029510498046875, -0.024295806884765625, -0.01908111572265625, -0.013866424560546875, -0.0086517333984375, -0.003437042236328125, 0.00177764892578125, 0.006992340087890625, 0.01220703125, 0.017421722412109375, 0.02263641357421875, 0.027851104736328125, 0.0330657958984375, 0.038280487060546875, 0.04349517822265625, 0.048709869384765625, 0.053924560546875, 0.059139251708984375, 0.06435394287109375, 0.06956863403320312, 0.0747833251953125, 0.07999801635742188, 0.08521270751953125, 0.09042739868164062, 0.09564208984375, 0.10085678100585938, 0.10607147216796875, 0.11128616333007812, 0.1165008544921875, 0.12171554565429688, 0.12693023681640625, 0.13214492797851562, 0.137359619140625, 0.14257431030273438, 0.14778900146484375, 0.15300369262695312, 0.1582183837890625, 0.16343307495117188, 0.16864776611328125, 0.17386245727539062, 0.1790771484375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 7.0, 8.0, 10.0, 5.0, 13.0, 15.0, 15.0, 18.0, 21.0, 23.0, 23.0, 26.0, 23.0, 43.0, 45.0, 32.0, 50.0, 39.0, 45.0, 48.0, 47.0, 52.0, 37.0, 42.0, 46.0, 39.0, 20.0, 35.0, 32.0, 18.0, 15.0, 27.0, 15.0, 8.0, 8.0, 11.0, 8.0, 7.0, 7.0, 5.0, 1.0, 1.0, 5.0, 4.0, 0.0, 1.0], "bins": [-0.10601806640625, -0.10318565368652344, -0.10035324096679688, -0.09752082824707031, -0.09468841552734375, -0.09185600280761719, -0.08902359008789062, -0.08619117736816406, -0.0833587646484375, -0.08052635192871094, -0.07769393920898438, -0.07486152648925781, -0.07202911376953125, -0.06919670104980469, -0.06636428833007812, -0.06353187561035156, -0.060699462890625, -0.05786705017089844, -0.055034637451171875, -0.05220222473144531, -0.04936981201171875, -0.04653739929199219, -0.043704986572265625, -0.04087257385253906, -0.0380401611328125, -0.03520774841308594, -0.032375335693359375, -0.029542922973632812, -0.02671051025390625, -0.023878097534179688, -0.021045684814453125, -0.018213272094726562, -0.015380859375, -0.012548446655273438, -0.009716033935546875, -0.0068836212158203125, -0.00405120849609375, -0.0012187957763671875, 0.001613616943359375, 0.0044460296630859375, 0.0072784423828125, 0.010110855102539062, 0.012943267822265625, 0.015775680541992188, 0.01860809326171875, 0.021440505981445312, 0.024272918701171875, 0.027105331420898438, 0.029937744140625, 0.03277015686035156, 0.035602569580078125, 0.03843498229980469, 0.04126739501953125, 0.04409980773925781, 0.046932220458984375, 0.04976463317871094, 0.0525970458984375, 0.05542945861816406, 0.058261871337890625, 0.06109428405761719, 0.06392669677734375, 0.06675910949707031, 0.06959152221679688, 0.07242393493652344, 0.07525634765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 8.0, 8.0, 8.0, 12.0, 10.0, 10.0, 32.0, 26.0, 51.0, 61.0, 70.0, 133.0, 183.0, 237.0, 377.0, 727.0, 1177.0, 2107.0, 4070.0, 8614.0, 18765.0, 44389.0, 109530.0, 295747.0, 979709.0, 1850652.0, 557396.0, 190476.0, 73274.0, 29933.0, 13147.0, 6214.0, 3055.0, 1667.0, 885.0, 526.0, 327.0, 201.0, 121.0, 114.0, 75.0, 55.0, 31.0, 17.0, 18.0, 15.0, 8.0, 7.0, 7.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.194580078125, -0.1885528564453125, -0.182525634765625, -0.1764984130859375, -0.17047119140625, -0.1644439697265625, -0.158416748046875, -0.1523895263671875, -0.1463623046875, -0.1403350830078125, -0.134307861328125, -0.1282806396484375, -0.12225341796875, -0.1162261962890625, -0.110198974609375, -0.1041717529296875, -0.09814453125, -0.0921173095703125, -0.086090087890625, -0.0800628662109375, -0.07403564453125, -0.0680084228515625, -0.061981201171875, -0.0559539794921875, -0.0499267578125, -0.0438995361328125, -0.037872314453125, -0.0318450927734375, -0.02581787109375, -0.0197906494140625, -0.013763427734375, -0.0077362060546875, -0.001708984375, 0.0043182373046875, 0.010345458984375, 0.0163726806640625, 0.02239990234375, 0.0284271240234375, 0.034454345703125, 0.0404815673828125, 0.0465087890625, 0.0525360107421875, 0.058563232421875, 0.0645904541015625, 0.07061767578125, 0.0766448974609375, 0.082672119140625, 0.0886993408203125, 0.0947265625, 0.1007537841796875, 0.106781005859375, 0.1128082275390625, 0.11883544921875, 0.1248626708984375, 0.130889892578125, 0.1369171142578125, 0.1429443359375, 0.1489715576171875, 0.154998779296875, 0.1610260009765625, 0.16705322265625, 0.1730804443359375, 0.179107666015625, 0.1851348876953125, 0.191162109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 7.0, 8.0, 17.0, 11.0, 25.0, 42.0, 44.0, 70.0, 95.0, 124.0, 153.0, 259.0, 388.0, 559.0, 749.0, 460.0, 310.0, 228.0, 149.0, 104.0, 78.0, 62.0, 33.0, 34.0, 17.0, 15.0, 8.0, 9.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24853515625, -0.24126052856445312, -0.23398590087890625, -0.22671127319335938, -0.2194366455078125, -0.21216201782226562, -0.20488739013671875, -0.19761276245117188, -0.190338134765625, -0.18306350708007812, -0.17578887939453125, -0.16851425170898438, -0.1612396240234375, -0.15396499633789062, -0.14669036865234375, -0.13941574096679688, -0.13214111328125, -0.12486648559570312, -0.11759185791015625, -0.11031723022460938, -0.1030426025390625, -0.09576797485351562, -0.08849334716796875, -0.08121871948242188, -0.073944091796875, -0.06666946411132812, -0.05939483642578125, -0.052120208740234375, -0.0448455810546875, -0.037570953369140625, -0.03029632568359375, -0.023021697998046875, -0.0157470703125, -0.008472442626953125, -0.00119781494140625, 0.006076812744140625, 0.0133514404296875, 0.020626068115234375, 0.02790069580078125, 0.035175323486328125, 0.042449951171875, 0.049724578857421875, 0.05699920654296875, 0.06427383422851562, 0.0715484619140625, 0.07882308959960938, 0.08609771728515625, 0.09337234497070312, 0.10064697265625, 0.10792160034179688, 0.11519622802734375, 0.12247085571289062, 0.1297454833984375, 0.13702011108398438, 0.14429473876953125, 0.15156936645507812, 0.158843994140625, 0.16611862182617188, 0.17339324951171875, 0.18066787719726562, 0.1879425048828125, 0.19521713256835938, 0.20249176025390625, 0.20976638793945312, 0.217041015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 9.0, 16.0, 22.0, 27.0, 49.0, 77.0, 110.0, 114.0, 93.0, 107.0, 121.0, 71.0, 60.0, 36.0, 31.0, 25.0, 10.0, 5.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9338374137878418, -0.892816960811615, -0.8517965078353882, -0.8107760548591614, -0.7697556018829346, -0.7287351489067078, -0.687714695930481, -0.6466941833496094, -0.6056737899780273, -0.5646533370018005, -0.5236328840255737, -0.4826124310493469, -0.4415919780731201, -0.4005715250968933, -0.3595510423183441, -0.3185305893421173, -0.2775101065635681, -0.2364896535873413, -0.1954692006111145, -0.1544487327337265, -0.1134282797574997, -0.07240782678127289, -0.03138735890388489, 0.009633094072341919, 0.050653547048568726, 0.09167400002479553, 0.13269445300102234, 0.17371492087841034, 0.21473537385463715, 0.25575584173202515, 0.29677629470825195, 0.33779674768447876, 0.37881720066070557, 0.4198376536369324, 0.4608581066131592, 0.501878559589386, 0.5428990125656128, 0.5839194655418396, 0.6249399185180664, 0.665960431098938, 0.70698082447052, 0.7480012774467468, 0.7890217304229736, 0.8300421833992004, 0.8710626363754272, 0.912083089351654, 0.9531035423278809, 0.9941240549087524, 1.035144567489624, 1.0761650800704956, 1.1171854734420776, 1.1582059860229492, 1.1992263793945312, 1.2402468919754028, 1.2812672853469849, 1.3222877979278564, 1.3633081912994385, 1.40432870388031, 1.445349097251892, 1.4863696098327637, 1.5273900032043457, 1.5684105157852173, 1.6094309091567993, 1.650451421737671, 1.691471815109253]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 4.0, 6.0, 5.0, 7.0, 11.0, 9.0, 18.0, 21.0, 22.0, 35.0, 38.0, 28.0, 34.0, 43.0, 37.0, 39.0, 47.0, 37.0, 46.0, 46.0, 33.0, 35.0, 33.0, 34.0, 38.0, 41.0, 36.0, 26.0, 30.0, 27.0, 23.0, 16.0, 23.0, 12.0, 12.0, 22.0, 9.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6693547964096069, -0.6482653021812439, -0.6271757483482361, -0.606086254119873, -0.5849967002868652, -0.5639072060585022, -0.5428177118301392, -0.5217281579971313, -0.5006386041641235, -0.4795490801334381, -0.4584595561027527, -0.43737006187438965, -0.41628050804138184, -0.3951910138130188, -0.3741014897823334, -0.35301196575164795, -0.3319224715232849, -0.3108329474925995, -0.28974342346191406, -0.268653929233551, -0.2475643903017044, -0.22647486627101898, -0.20538535714149475, -0.18429583311080933, -0.1632063090801239, -0.14211678504943848, -0.12102726846933365, -0.09993775188922882, -0.0788482278585434, -0.05775870382785797, -0.03666919469833374, -0.015579670667648315, 0.005509793758392334, 0.02659931406378746, 0.04768883436918259, 0.06877835094928741, 0.08986787497997284, 0.11095739901065826, 0.1320469081401825, 0.15313643217086792, 0.17422595620155334, 0.19531548023223877, 0.2164050042629242, 0.23749451339244843, 0.25858402252197266, 0.27967357635498047, 0.3007630705833435, 0.32185259461402893, 0.34294211864471436, 0.3640316426753998, 0.3851211667060852, 0.40621066093444824, 0.42730021476745605, 0.4483897089958191, 0.4694792330265045, 0.49056875705718994, 0.5116583108901978, 0.5327478051185608, 0.5538373589515686, 0.5749268531799316, 0.5960164070129395, 0.6171059012413025, 0.6381953954696655, 0.6592849493026733, 0.6803744435310364]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 15.0, 20.0, 47.0, 39.0, 73.0, 94.0, 131.0, 215.0, 309.0, 427.0, 604.0, 950.0, 1321.0, 1848.0, 2863.0, 4556.0, 6970.0, 11289.0, 18938.0, 32836.0, 62503.0, 147102.0, 353305.0, 217501.0, 82575.0, 41162.0, 23184.0, 13673.0, 8435.0, 5155.0, 3396.0, 2159.0, 1473.0, 1007.0, 737.0, 526.0, 339.0, 230.0, 164.0, 112.0, 87.0, 64.0, 38.0, 35.0, 17.0, 8.0, 4.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14596176147460938, -0.14104461669921875, -0.13612747192382812, -0.1312103271484375, -0.12629318237304688, -0.12137603759765625, -0.11645889282226562, -0.111541748046875, -0.10662460327148438, -0.10170745849609375, -0.09679031372070312, -0.0918731689453125, -0.08695602416992188, -0.08203887939453125, -0.07712173461914062, -0.07220458984375, -0.06728744506835938, -0.06237030029296875, -0.057453155517578125, -0.0525360107421875, -0.047618865966796875, -0.04270172119140625, -0.037784576416015625, -0.032867431640625, -0.027950286865234375, -0.02303314208984375, -0.018115997314453125, -0.0131988525390625, -0.008281707763671875, -0.00336456298828125, 0.001552581787109375, 0.0064697265625, 0.011386871337890625, 0.01630401611328125, 0.021221160888671875, 0.0261383056640625, 0.031055450439453125, 0.03597259521484375, 0.040889739990234375, 0.045806884765625, 0.050724029541015625, 0.05564117431640625, 0.060558319091796875, 0.0654754638671875, 0.07039260864257812, 0.07530975341796875, 0.08022689819335938, 0.08514404296875, 0.09006118774414062, 0.09497833251953125, 0.09989547729492188, 0.1048126220703125, 0.10972976684570312, 0.11464691162109375, 0.11956405639648438, 0.124481201171875, 0.12939834594726562, 0.13431549072265625, 0.13923263549804688, 0.1441497802734375, 0.14906692504882812, 0.15398406982421875, 0.15890121459960938, 0.163818359375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 8.0, 8.0, 8.0, 7.0, 13.0, 6.0, 12.0, 20.0, 25.0, 24.0, 28.0, 31.0, 42.0, 38.0, 43.0, 49.0, 46.0, 37.0, 44.0, 40.0, 44.0, 45.0, 47.0, 42.0, 47.0, 35.0, 27.0, 35.0, 24.0, 22.0, 20.0, 12.0, 16.0, 14.0, 8.0, 8.0, 4.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1011962890625, -0.09802627563476562, -0.09485626220703125, -0.09168624877929688, -0.0885162353515625, -0.08534622192382812, -0.08217620849609375, -0.07900619506835938, -0.075836181640625, -0.07266616821289062, -0.06949615478515625, -0.06632614135742188, -0.0631561279296875, -0.059986114501953125, -0.05681610107421875, -0.053646087646484375, -0.05047607421875, -0.047306060791015625, -0.04413604736328125, -0.040966033935546875, -0.0377960205078125, -0.034626007080078125, -0.03145599365234375, -0.028285980224609375, -0.025115966796875, -0.021945953369140625, -0.01877593994140625, -0.015605926513671875, -0.0124359130859375, -0.009265899658203125, -0.00609588623046875, -0.002925872802734375, 0.000244140625, 0.003414154052734375, 0.00658416748046875, 0.009754180908203125, 0.0129241943359375, 0.016094207763671875, 0.01926422119140625, 0.022434234619140625, 0.025604248046875, 0.028774261474609375, 0.03194427490234375, 0.035114288330078125, 0.0382843017578125, 0.041454315185546875, 0.04462432861328125, 0.047794342041015625, 0.05096435546875, 0.054134368896484375, 0.05730438232421875, 0.060474395751953125, 0.0636444091796875, 0.06681442260742188, 0.06998443603515625, 0.07315444946289062, 0.076324462890625, 0.07949447631835938, 0.08266448974609375, 0.08583450317382812, 0.0890045166015625, 0.09217453002929688, 0.09534454345703125, 0.09851455688476562, 0.1016845703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 9.0, 5.0, 4.0, 10.0, 19.0, 17.0, 15.0, 15.0, 25.0, 44.0, 71.0, 104.0, 149.0, 243.0, 440.0, 796.0, 1477.0, 2845.0, 5588.0, 10980.0, 22480.0, 50225.0, 141348.0, 465158.0, 222328.0, 67352.0, 28711.0, 13693.0, 6796.0, 3377.0, 1818.0, 1018.0, 516.0, 296.0, 200.0, 135.0, 80.0, 46.0, 34.0, 25.0, 16.0, 8.0, 13.0, 7.0, 8.0, 7.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2216796875, -0.2146778106689453, -0.20767593383789062, -0.20067405700683594, -0.19367218017578125, -0.18667030334472656, -0.17966842651367188, -0.1726665496826172, -0.1656646728515625, -0.1586627960205078, -0.15166091918945312, -0.14465904235839844, -0.13765716552734375, -0.13065528869628906, -0.12365341186523438, -0.11665153503417969, -0.109649658203125, -0.10264778137207031, -0.09564590454101562, -0.08864402770996094, -0.08164215087890625, -0.07464027404785156, -0.06763839721679688, -0.06063652038574219, -0.0536346435546875, -0.04663276672363281, -0.039630889892578125, -0.03262901306152344, -0.02562713623046875, -0.018625259399414062, -0.011623382568359375, -0.0046215057373046875, 0.00238037109375, 0.009382247924804688, 0.016384124755859375, 0.023386001586914062, 0.03038787841796875, 0.03738975524902344, 0.044391632080078125, 0.05139350891113281, 0.0583953857421875, 0.06539726257324219, 0.07239913940429688, 0.07940101623535156, 0.08640289306640625, 0.09340476989746094, 0.10040664672851562, 0.10740852355957031, 0.114410400390625, 0.12141227722167969, 0.12841415405273438, 0.13541603088378906, 0.14241790771484375, 0.14941978454589844, 0.15642166137695312, 0.1634235382080078, 0.1704254150390625, 0.1774272918701172, 0.18442916870117188, 0.19143104553222656, 0.19843292236328125, 0.20543479919433594, 0.21243667602539062, 0.2194385528564453, 0.2264404296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 10.0, 8.0, 4.0, 14.0, 12.0, 11.0, 16.0, 17.0, 24.0, 31.0, 23.0, 26.0, 26.0, 38.0, 40.0, 29.0, 39.0, 42.0, 49.0, 35.0, 28.0, 49.0, 37.0, 35.0, 36.0, 36.0, 30.0, 30.0, 30.0, 27.0, 21.0, 20.0, 20.0, 15.0, 19.0, 13.0, 9.0, 11.0, 6.0, 5.0, 7.0, 1.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.278564453125, -0.2702751159667969, -0.26198577880859375, -0.2536964416503906, -0.2454071044921875, -0.23711776733398438, -0.22882843017578125, -0.22053909301757812, -0.212249755859375, -0.20396041870117188, -0.19567108154296875, -0.18738174438476562, -0.1790924072265625, -0.17080307006835938, -0.16251373291015625, -0.15422439575195312, -0.14593505859375, -0.13764572143554688, -0.12935638427734375, -0.12106704711914062, -0.1127777099609375, -0.10448837280273438, -0.09619903564453125, -0.08790969848632812, -0.079620361328125, -0.07133102416992188, -0.06304168701171875, -0.054752349853515625, -0.0464630126953125, -0.038173675537109375, -0.02988433837890625, -0.021595001220703125, -0.0133056640625, -0.005016326904296875, 0.00327301025390625, 0.011562347412109375, 0.0198516845703125, 0.028141021728515625, 0.03643035888671875, 0.044719696044921875, 0.053009033203125, 0.061298370361328125, 0.06958770751953125, 0.07787704467773438, 0.0861663818359375, 0.09445571899414062, 0.10274505615234375, 0.11103439331054688, 0.11932373046875, 0.12761306762695312, 0.13590240478515625, 0.14419174194335938, 0.1524810791015625, 0.16077041625976562, 0.16905975341796875, 0.17734909057617188, 0.185638427734375, 0.19392776489257812, 0.20221710205078125, 0.21050643920898438, 0.2187957763671875, 0.22708511352539062, 0.23537445068359375, 0.24366378784179688, 0.251953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 1.0, 10.0, 6.0, 11.0, 19.0, 26.0, 32.0, 45.0, 78.0, 139.0, 250.0, 479.0, 970.0, 2028.0, 4339.0, 9366.0, 21464.0, 50408.0, 112413.0, 380932.0, 293519.0, 95379.0, 42457.0, 18797.0, 8182.0, 3546.0, 1755.0, 898.0, 441.0, 224.0, 117.0, 76.0, 50.0, 26.0, 17.0, 13.0, 7.0, 8.0, 7.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.11590576171875, -0.11238288879394531, -0.10886001586914062, -0.10533714294433594, -0.10181427001953125, -0.09829139709472656, -0.09476852416992188, -0.09124565124511719, -0.0877227783203125, -0.08419990539550781, -0.08067703247070312, -0.07715415954589844, -0.07363128662109375, -0.07010841369628906, -0.06658554077148438, -0.06306266784667969, -0.059539794921875, -0.05601692199707031, -0.052494049072265625, -0.04897117614746094, -0.04544830322265625, -0.04192543029785156, -0.038402557373046875, -0.03487968444824219, -0.0313568115234375, -0.027833938598632812, -0.024311065673828125, -0.020788192749023438, -0.01726531982421875, -0.013742446899414062, -0.010219573974609375, -0.0066967010498046875, -0.003173828125, 0.0003490447998046875, 0.003871917724609375, 0.0073947906494140625, 0.01091766357421875, 0.014440536499023438, 0.017963409423828125, 0.021486282348632812, 0.0250091552734375, 0.028532028198242188, 0.032054901123046875, 0.03557777404785156, 0.03910064697265625, 0.04262351989746094, 0.046146392822265625, 0.04966926574707031, 0.053192138671875, 0.05671501159667969, 0.060237884521484375, 0.06376075744628906, 0.06728363037109375, 0.07080650329589844, 0.07432937622070312, 0.07785224914550781, 0.0813751220703125, 0.08489799499511719, 0.08842086791992188, 0.09194374084472656, 0.09546661376953125, 0.09898948669433594, 0.10251235961914062, 0.10603523254394531, 0.10955810546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 2.0, 7.0, 4.0, 8.0, 6.0, 6.0, 10.0, 6.0, 16.0, 20.0, 29.0, 34.0, 38.0, 52.0, 93.0, 113.0, 131.0, 126.0, 76.0, 65.0, 43.0, 17.0, 27.0, 17.0, 6.0, 17.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0338764190673828e-05, -2.931244671344757e-05, -2.8286129236221313e-05, -2.7259811758995056e-05, -2.62334942817688e-05, -2.520717680454254e-05, -2.4180859327316284e-05, -2.3154541850090027e-05, -2.212822437286377e-05, -2.1101906895637512e-05, -2.0075589418411255e-05, -1.9049271941184998e-05, -1.802295446395874e-05, -1.6996636986732483e-05, -1.5970319509506226e-05, -1.4944002032279968e-05, -1.3917684555053711e-05, -1.2891367077827454e-05, -1.1865049600601196e-05, -1.0838732123374939e-05, -9.812414646148682e-06, -8.786097168922424e-06, -7.759779691696167e-06, -6.73346221446991e-06, -5.707144737243652e-06, -4.680827260017395e-06, -3.6545097827911377e-06, -2.6281923055648804e-06, -1.601874828338623e-06, -5.755573511123657e-07, 4.507601261138916e-07, 1.477077603340149e-06, 2.5033950805664062e-06, 3.5297125577926636e-06, 4.556030035018921e-06, 5.582347512245178e-06, 6.6086649894714355e-06, 7.634982466697693e-06, 8.66129994392395e-06, 9.687617421150208e-06, 1.0713934898376465e-05, 1.1740252375602722e-05, 1.276656985282898e-05, 1.3792887330055237e-05, 1.4819204807281494e-05, 1.584552228450775e-05, 1.687183976173401e-05, 1.7898157238960266e-05, 1.8924474716186523e-05, 1.995079219341278e-05, 2.0977109670639038e-05, 2.2003427147865295e-05, 2.3029744625091553e-05, 2.405606210231781e-05, 2.5082379579544067e-05, 2.6108697056770325e-05, 2.7135014533996582e-05, 2.816133201122284e-05, 2.9187649488449097e-05, 3.0213966965675354e-05, 3.124028444290161e-05, 3.226660192012787e-05, 3.3292919397354126e-05, 3.431923687458038e-05, 3.534555435180664e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 8.0, 10.0, 23.0, 23.0, 42.0, 59.0, 100.0, 170.0, 334.0, 634.0, 1227.0, 3069.0, 9571.0, 32321.0, 117542.0, 523646.0, 267619.0, 64704.0, 18081.0, 5428.0, 2010.0, 883.0, 453.0, 239.0, 121.0, 84.0, 45.0, 33.0, 20.0, 18.0, 11.0, 8.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.141357421875, -0.13626670837402344, -0.13117599487304688, -0.1260852813720703, -0.12099456787109375, -0.11590385437011719, -0.11081314086914062, -0.10572242736816406, -0.1006317138671875, -0.09554100036621094, -0.09045028686523438, -0.08535957336425781, -0.08026885986328125, -0.07517814636230469, -0.07008743286132812, -0.06499671936035156, -0.059906005859375, -0.05481529235839844, -0.049724578857421875, -0.04463386535644531, -0.03954315185546875, -0.03445243835449219, -0.029361724853515625, -0.024271011352539062, -0.0191802978515625, -0.014089584350585938, -0.008998870849609375, -0.0039081573486328125, 0.00118255615234375, 0.0062732696533203125, 0.011363983154296875, 0.016454696655273438, 0.02154541015625, 0.026636123657226562, 0.031726837158203125, 0.03681755065917969, 0.04190826416015625, 0.04699897766113281, 0.052089691162109375, 0.05718040466308594, 0.0622711181640625, 0.06736183166503906, 0.07245254516601562, 0.07754325866699219, 0.08263397216796875, 0.08772468566894531, 0.09281539916992188, 0.09790611267089844, 0.102996826171875, 0.10808753967285156, 0.11317825317382812, 0.11826896667480469, 0.12335968017578125, 0.1284503936767578, 0.13354110717773438, 0.13863182067871094, 0.1437225341796875, 0.14881324768066406, 0.15390396118164062, 0.1589946746826172, 0.16408538818359375, 0.1691761016845703, 0.17426681518554688, 0.17935752868652344, 0.1844482421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 8.0, 9.0, 15.0, 7.0, 17.0, 14.0, 20.0, 31.0, 26.0, 30.0, 46.0, 61.0, 98.0, 118.0, 99.0, 83.0, 71.0, 35.0, 39.0, 27.0, 21.0, 17.0, 23.0, 19.0, 9.0, 8.0, 7.0, 7.0, 6.0, 4.0, 3.0, 7.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.128662109375, -0.1252899169921875, -0.121917724609375, -0.1185455322265625, -0.11517333984375, -0.1118011474609375, -0.108428955078125, -0.1050567626953125, -0.1016845703125, -0.0983123779296875, -0.094940185546875, -0.0915679931640625, -0.08819580078125, -0.0848236083984375, -0.081451416015625, -0.0780792236328125, -0.07470703125, -0.0713348388671875, -0.067962646484375, -0.0645904541015625, -0.06121826171875, -0.0578460693359375, -0.054473876953125, -0.0511016845703125, -0.0477294921875, -0.0443572998046875, -0.040985107421875, -0.0376129150390625, -0.03424072265625, -0.0308685302734375, -0.027496337890625, -0.0241241455078125, -0.020751953125, -0.0173797607421875, -0.014007568359375, -0.0106353759765625, -0.00726318359375, -0.0038909912109375, -0.000518798828125, 0.0028533935546875, 0.0062255859375, 0.0095977783203125, 0.012969970703125, 0.0163421630859375, 0.01971435546875, 0.0230865478515625, 0.026458740234375, 0.0298309326171875, 0.033203125, 0.0365753173828125, 0.039947509765625, 0.0433197021484375, 0.04669189453125, 0.0500640869140625, 0.053436279296875, 0.0568084716796875, 0.0601806640625, 0.0635528564453125, 0.066925048828125, 0.0702972412109375, 0.07366943359375, 0.0770416259765625, 0.080413818359375, 0.0837860107421875, 0.087158203125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 20.0, 24.0, 39.0, 59.0, 90.0, 105.0, 117.0, 118.0, 97.0, 90.0, 77.0, 48.0, 36.0, 22.0, 20.0, 5.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0324938297271729, -0.9934993982315063, -0.9545049667358398, -0.9155104756355286, -0.8765160441398621, -0.8375216126441956, -0.7985271215438843, -0.7595326900482178, -0.7205382585525513, -0.6815438270568848, -0.6425493955612183, -0.603554904460907, -0.5645604729652405, -0.525566041469574, -0.4865715801715851, -0.4475771188735962, -0.4085826873779297, -0.3695882558822632, -0.3305937945842743, -0.2915993332862854, -0.2526049017906189, -0.2136104553937912, -0.1746160089969635, -0.1356215476989746, -0.0966271162033081, -0.05763266980648041, -0.01863822340965271, 0.020356222987174988, 0.059350669384002686, 0.09834511578083038, 0.13733956217765808, 0.17633402347564697, 0.21532845497131348, 0.25432288646698, 0.29331734776496887, 0.33231180906295776, 0.37130624055862427, 0.41030067205429077, 0.44929513335227966, 0.48828959465026855, 0.5272840261459351, 0.5662784576416016, 0.6052728891372681, 0.6442673802375793, 0.6832618117332458, 0.7222562432289124, 0.7612507343292236, 0.8002451658248901, 0.8392395973205566, 0.8782340288162231, 0.9172284603118896, 0.9562229514122009, 0.9952173829078674, 1.0342118740081787, 1.0732063055038452, 1.1122007369995117, 1.1511951684951782, 1.1901895999908447, 1.2291840314865112, 1.2681784629821777, 1.3071730136871338, 1.3461674451828003, 1.3851618766784668, 1.4241563081741333, 1.4631507396697998]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 9.0, 10.0, 8.0, 10.0, 20.0, 17.0, 14.0, 14.0, 29.0, 31.0, 28.0, 27.0, 33.0, 39.0, 49.0, 40.0, 33.0, 43.0, 57.0, 31.0, 33.0, 43.0, 44.0, 36.0, 43.0, 28.0, 39.0, 21.0, 27.0, 22.0, 23.0, 19.0, 12.0, 8.0, 12.0, 7.0, 6.0, 10.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6206184029579163, -0.5980514287948608, -0.5754845142364502, -0.5529175400733948, -0.5303506255149841, -0.5077836513519287, -0.48521673679351807, -0.46264976263046265, -0.440082848072052, -0.41751590371131897, -0.39494895935058594, -0.3723820149898529, -0.3498150706291199, -0.32724812626838684, -0.3046811819076538, -0.2821142077445984, -0.25954726338386536, -0.23698031902313232, -0.2144133746623993, -0.19184643030166626, -0.16927948594093323, -0.1467125415802002, -0.12414558231830597, -0.10157863795757294, -0.0790116935968399, -0.05644474923610687, -0.03387780115008354, -0.011310853064060211, 0.011256091296672821, 0.03382303565740585, 0.05638998746871948, 0.07895693182945251, 0.10152387619018555, 0.12409082055091858, 0.1466577649116516, 0.16922470927238464, 0.19179165363311768, 0.2143585979938507, 0.23692555725574493, 0.25949251651763916, 0.2820594310760498, 0.30462637543678284, 0.32719331979751587, 0.3497602641582489, 0.37232720851898193, 0.39489415287971497, 0.417461097240448, 0.4400280714035034, 0.46259501576423645, 0.4851619601249695, 0.5077289342880249, 0.5302958488464355, 0.552862823009491, 0.5754297375679016, 0.597996711730957, 0.6205636262893677, 0.6431306004524231, 0.6656975746154785, 0.6882644891738892, 0.7108314633369446, 0.7333983778953552, 0.7559653520584106, 0.7785322666168213, 0.8010992407798767, 0.8236661553382874]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 10.0, 14.0, 16.0, 31.0, 49.0, 46.0, 89.0, 124.0, 194.0, 318.0, 521.0, 907.0, 1715.0, 3285.0, 6469.0, 14219.0, 32130.0, 78334.0, 210576.0, 766389.0, 2188768.0, 592161.0, 177030.0, 67089.0, 28143.0, 12650.0, 6069.0, 3075.0, 1616.0, 856.0, 547.0, 306.0, 179.0, 112.0, 86.0, 56.0, 23.0, 26.0, 21.0, 8.0, 6.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165283203125, -0.1601848602294922, -0.15508651733398438, -0.14998817443847656, -0.14488983154296875, -0.13979148864746094, -0.13469314575195312, -0.1295948028564453, -0.1244964599609375, -0.11939811706542969, -0.11429977416992188, -0.10920143127441406, -0.10410308837890625, -0.09900474548339844, -0.09390640258789062, -0.08880805969238281, -0.083709716796875, -0.07861137390136719, -0.07351303100585938, -0.06841468811035156, -0.06331634521484375, -0.05821800231933594, -0.053119659423828125, -0.04802131652832031, -0.0429229736328125, -0.03782463073730469, -0.032726287841796875, -0.027627944946289062, -0.02252960205078125, -0.017431259155273438, -0.012332916259765625, -0.0072345733642578125, -0.00213623046875, 0.0029621124267578125, 0.008060455322265625, 0.013158798217773438, 0.01825714111328125, 0.023355484008789062, 0.028453826904296875, 0.03355216979980469, 0.0386505126953125, 0.04374885559082031, 0.048847198486328125, 0.05394554138183594, 0.05904388427734375, 0.06414222717285156, 0.06924057006835938, 0.07433891296386719, 0.079437255859375, 0.08453559875488281, 0.08963394165039062, 0.09473228454589844, 0.09983062744140625, 0.10492897033691406, 0.11002731323242188, 0.11512565612792969, 0.1202239990234375, 0.1253223419189453, 0.13042068481445312, 0.13551902770996094, 0.14061737060546875, 0.14571571350097656, 0.15081405639648438, 0.1559123992919922, 0.1610107421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 9.0, 7.0, 7.0, 11.0, 9.0, 16.0, 23.0, 23.0, 23.0, 20.0, 26.0, 24.0, 41.0, 40.0, 41.0, 45.0, 57.0, 38.0, 43.0, 50.0, 52.0, 45.0, 44.0, 36.0, 31.0, 32.0, 29.0, 26.0, 27.0, 17.0, 14.0, 13.0, 18.0, 12.0, 5.0, 8.0, 5.0, 10.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0970458984375, -0.09416961669921875, -0.0912933349609375, -0.08841705322265625, -0.085540771484375, -0.08266448974609375, -0.0797882080078125, -0.07691192626953125, -0.07403564453125, -0.07115936279296875, -0.0682830810546875, -0.06540679931640625, -0.062530517578125, -0.05965423583984375, -0.0567779541015625, -0.05390167236328125, -0.051025390625, -0.04814910888671875, -0.0452728271484375, -0.04239654541015625, -0.039520263671875, -0.03664398193359375, -0.0337677001953125, -0.03089141845703125, -0.02801513671875, -0.02513885498046875, -0.0222625732421875, -0.01938629150390625, -0.016510009765625, -0.01363372802734375, -0.0107574462890625, -0.00788116455078125, -0.0050048828125, -0.00212860107421875, 0.0007476806640625, 0.00362396240234375, 0.006500244140625, 0.00937652587890625, 0.0122528076171875, 0.01512908935546875, 0.01800537109375, 0.02088165283203125, 0.0237579345703125, 0.02663421630859375, 0.029510498046875, 0.03238677978515625, 0.0352630615234375, 0.03813934326171875, 0.041015625, 0.04389190673828125, 0.0467681884765625, 0.04964447021484375, 0.052520751953125, 0.05539703369140625, 0.0582733154296875, 0.06114959716796875, 0.06402587890625, 0.06690216064453125, 0.0697784423828125, 0.07265472412109375, 0.075531005859375, 0.07840728759765625, 0.0812835693359375, 0.08415985107421875, 0.0870361328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 8.0, 7.0, 14.0, 21.0, 30.0, 52.0, 67.0, 111.0, 164.0, 246.0, 433.0, 695.0, 1126.0, 2007.0, 3650.0, 6980.0, 14193.0, 29585.0, 65569.0, 157180.0, 438693.0, 1714570.0, 1209527.0, 324516.0, 123328.0, 52809.0, 24255.0, 11378.0, 5810.0, 3016.0, 1658.0, 958.0, 565.0, 367.0, 245.0, 165.0, 106.0, 75.0, 38.0, 16.0, 13.0, 15.0, 7.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.217529296875, -0.2112903594970703, -0.20505142211914062, -0.19881248474121094, -0.19257354736328125, -0.18633460998535156, -0.18009567260742188, -0.1738567352294922, -0.1676177978515625, -0.1613788604736328, -0.15513992309570312, -0.14890098571777344, -0.14266204833984375, -0.13642311096191406, -0.13018417358398438, -0.12394523620605469, -0.117706298828125, -0.11146736145019531, -0.10522842407226562, -0.09898948669433594, -0.09275054931640625, -0.08651161193847656, -0.08027267456054688, -0.07403373718261719, -0.0677947998046875, -0.06155586242675781, -0.055316925048828125, -0.04907798767089844, -0.04283905029296875, -0.03660011291503906, -0.030361175537109375, -0.024122238159179688, -0.01788330078125, -0.011644363403320312, -0.005405426025390625, 0.0008335113525390625, 0.00707244873046875, 0.013311386108398438, 0.019550323486328125, 0.025789260864257812, 0.0320281982421875, 0.03826713562011719, 0.044506072998046875, 0.05074501037597656, 0.05698394775390625, 0.06322288513183594, 0.06946182250976562, 0.07570075988769531, 0.081939697265625, 0.08817863464355469, 0.09441757202148438, 0.10065650939941406, 0.10689544677734375, 0.11313438415527344, 0.11937332153320312, 0.1256122589111328, 0.1318511962890625, 0.1380901336669922, 0.14432907104492188, 0.15056800842285156, 0.15680694580078125, 0.16304588317871094, 0.16928482055664062, 0.1755237579345703, 0.1817626953125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 14.0, 3.0, 5.0, 10.0, 9.0, 18.0, 20.0, 21.0, 30.0, 41.0, 45.0, 54.0, 83.0, 110.0, 135.0, 192.0, 279.0, 475.0, 646.0, 574.0, 356.0, 262.0, 171.0, 123.0, 94.0, 68.0, 64.0, 40.0, 17.0, 19.0, 26.0, 14.0, 20.0, 11.0, 4.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1895751953125, -0.1827411651611328, -0.17590713500976562, -0.16907310485839844, -0.16223907470703125, -0.15540504455566406, -0.14857101440429688, -0.1417369842529297, -0.1349029541015625, -0.1280689239501953, -0.12123489379882812, -0.11440086364746094, -0.10756683349609375, -0.10073280334472656, -0.09389877319335938, -0.08706474304199219, -0.080230712890625, -0.07339668273925781, -0.06656265258789062, -0.05972862243652344, -0.05289459228515625, -0.04606056213378906, -0.039226531982421875, -0.03239250183105469, -0.0255584716796875, -0.018724441528320312, -0.011890411376953125, -0.0050563812255859375, 0.00177764892578125, 0.008611679077148438, 0.015445709228515625, 0.022279739379882812, 0.02911376953125, 0.03594779968261719, 0.042781829833984375, 0.04961585998535156, 0.05644989013671875, 0.06328392028808594, 0.07011795043945312, 0.07695198059082031, 0.0837860107421875, 0.09062004089355469, 0.09745407104492188, 0.10428810119628906, 0.11112213134765625, 0.11795616149902344, 0.12479019165039062, 0.1316242218017578, 0.138458251953125, 0.1452922821044922, 0.15212631225585938, 0.15896034240722656, 0.16579437255859375, 0.17262840270996094, 0.17946243286132812, 0.1862964630126953, 0.1931304931640625, 0.1999645233154297, 0.20679855346679688, 0.21363258361816406, 0.22046661376953125, 0.22730064392089844, 0.23413467407226562, 0.2409687042236328, 0.247802734375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 15.0, 16.0, 47.0, 57.0, 115.0, 150.0, 199.0, 164.0, 123.0, 59.0, 22.0, 20.0, 7.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3207229375839233, -1.2530392408370972, -1.185355544090271, -1.1176718473434448, -1.0499881505966187, -0.9823044538497925, -0.9146208167076111, -0.8469371199607849, -0.7792534232139587, -0.7115697264671326, -0.6438860297203064, -0.576202392578125, -0.5085186958312988, -0.44083496928215027, -0.3731513023376465, -0.3054676055908203, -0.23778390884399414, -0.17010021209716797, -0.10241653025150299, -0.03473284840583801, 0.03295084834098816, 0.10063454508781433, 0.16831821203231812, 0.2360019087791443, 0.30368560552597046, 0.37136930227279663, 0.4390529990196228, 0.5067366361618042, 0.5744203329086304, 0.6421040296554565, 0.7097877264022827, 0.7774714231491089, 0.8451550006866455, 0.9128386974334717, 0.9805223941802979, 1.048206090927124, 1.1158897876739502, 1.1835734844207764, 1.2512571811676025, 1.3189408779144287, 1.3866245746612549, 1.454308271408081, 1.5219919681549072, 1.5896756649017334, 1.6573593616485596, 1.7250430583953857, 1.792726755142212, 1.860410451889038, 1.9280940294265747, 1.9957777261734009, 2.0634613037109375, 2.1311450004577637, 2.19882869720459, 2.266512393951416, 2.334196090698242, 2.4018797874450684, 2.4695634841918945, 2.5372471809387207, 2.604930877685547, 2.672614574432373, 2.740298271179199, 2.8079819679260254, 2.8756656646728516, 2.9433493614196777, 3.011033058166504]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 8.0, 3.0, 6.0, 4.0, 7.0, 14.0, 11.0, 10.0, 15.0, 22.0, 25.0, 27.0, 24.0, 44.0, 34.0, 29.0, 31.0, 51.0, 32.0, 41.0, 47.0, 42.0, 36.0, 32.0, 33.0, 38.0, 37.0, 44.0, 34.0, 33.0, 30.0, 24.0, 26.0, 10.0, 15.0, 17.0, 16.0, 12.0, 5.0, 2.0, 10.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8308234810829163, -0.8071470856666565, -0.7834707498550415, -0.7597943544387817, -0.736117959022522, -0.7124415636062622, -0.6887651681900024, -0.6650888323783875, -0.6414124369621277, -0.6177360415458679, -0.5940597057342529, -0.5703833103179932, -0.5467069149017334, -0.5230305194854736, -0.49935415387153625, -0.4756777882575989, -0.4520013928413391, -0.42832499742507935, -0.40464863181114197, -0.3809722661972046, -0.3572958707809448, -0.33361947536468506, -0.3099431097507477, -0.2862667441368103, -0.26259034872055054, -0.23891396820545197, -0.2152375876903534, -0.19156120717525482, -0.16788482666015625, -0.14420844614505768, -0.1205320656299591, -0.09685568511486053, -0.07317930459976196, -0.04950292408466339, -0.02582654356956482, -0.0021501630544662476, 0.021526217460632324, 0.045202597975730896, 0.06887897849082947, 0.09255535900592804, 0.11623173952102661, 0.13990812003612518, 0.16358450055122375, 0.18726088106632233, 0.2109372615814209, 0.23461364209651947, 0.25829002261161804, 0.2819663882255554, 0.3056427836418152, 0.32931917905807495, 0.35299554467201233, 0.3766719102859497, 0.4003483057022095, 0.42402470111846924, 0.4477010667324066, 0.471377432346344, 0.49505382776260376, 0.5187302231788635, 0.5424065589904785, 0.5660829544067383, 0.589759349822998, 0.6134357452392578, 0.6371121406555176, 0.6607884764671326, 0.6844648718833923]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 14.0, 13.0, 18.0, 24.0, 42.0, 56.0, 102.0, 175.0, 285.0, 443.0, 772.0, 1327.0, 2260.0, 3751.0, 6499.0, 11469.0, 21748.0, 47085.0, 135068.0, 375443.0, 279923.0, 88540.0, 34521.0, 16809.0, 9390.0, 5231.0, 3094.0, 1791.0, 1046.0, 648.0, 394.0, 204.0, 134.0, 82.0, 57.0, 38.0, 26.0, 11.0, 14.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1781005859375, -0.17169761657714844, -0.16529464721679688, -0.1588916778564453, -0.15248870849609375, -0.1460857391357422, -0.13968276977539062, -0.13327980041503906, -0.1268768310546875, -0.12047386169433594, -0.11407089233398438, -0.10766792297363281, -0.10126495361328125, -0.09486198425292969, -0.08845901489257812, -0.08205604553222656, -0.075653076171875, -0.06925010681152344, -0.06284713745117188, -0.05644416809082031, -0.05004119873046875, -0.04363822937011719, -0.037235260009765625, -0.030832290649414062, -0.0244293212890625, -0.018026351928710938, -0.011623382568359375, -0.0052204132080078125, 0.00118255615234375, 0.0075855255126953125, 0.013988494873046875, 0.020391464233398438, 0.02679443359375, 0.03319740295410156, 0.039600372314453125, 0.04600334167480469, 0.05240631103515625, 0.05880928039550781, 0.06521224975585938, 0.07161521911621094, 0.0780181884765625, 0.08442115783691406, 0.09082412719726562, 0.09722709655761719, 0.10363006591796875, 0.11003303527832031, 0.11643600463867188, 0.12283897399902344, 0.129241943359375, 0.13564491271972656, 0.14204788208007812, 0.1484508514404297, 0.15485382080078125, 0.1612567901611328, 0.16765975952148438, 0.17406272888183594, 0.1804656982421875, 0.18686866760253906, 0.19327163696289062, 0.1996746063232422, 0.20607757568359375, 0.2124805450439453, 0.21888351440429688, 0.22528648376464844, 0.231689453125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 7.0, 7.0, 7.0, 8.0, 12.0, 9.0, 12.0, 18.0, 21.0, 22.0, 34.0, 20.0, 16.0, 29.0, 44.0, 34.0, 37.0, 24.0, 40.0, 47.0, 31.0, 39.0, 38.0, 45.0, 37.0, 36.0, 39.0, 30.0, 35.0, 25.0, 20.0, 30.0, 27.0, 14.0, 18.0, 13.0, 16.0, 13.0, 11.0, 10.0, 9.0, 2.0, 5.0, 5.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.08966350555419922, -0.08661460876464844, -0.08356571197509766, -0.08051681518554688, -0.0774679183959961, -0.07441902160644531, -0.07137012481689453, -0.06832122802734375, -0.06527233123779297, -0.06222343444824219, -0.059174537658691406, -0.056125640869140625, -0.053076744079589844, -0.05002784729003906, -0.04697895050048828, -0.0439300537109375, -0.04088115692138672, -0.03783226013183594, -0.034783363342285156, -0.031734466552734375, -0.028685569763183594, -0.025636672973632812, -0.02258777618408203, -0.01953887939453125, -0.01648998260498047, -0.013441085815429688, -0.010392189025878906, -0.007343292236328125, -0.004294395446777344, -0.0012454986572265625, 0.0018033981323242188, 0.004852294921875, 0.007901191711425781, 0.010950088500976562, 0.013998985290527344, 0.017047882080078125, 0.020096778869628906, 0.023145675659179688, 0.02619457244873047, 0.02924346923828125, 0.03229236602783203, 0.03534126281738281, 0.038390159606933594, 0.041439056396484375, 0.044487953186035156, 0.04753684997558594, 0.05058574676513672, 0.0536346435546875, 0.05668354034423828, 0.05973243713378906, 0.06278133392333984, 0.06583023071289062, 0.0688791275024414, 0.07192802429199219, 0.07497692108154297, 0.07802581787109375, 0.08107471466064453, 0.08412361145019531, 0.0871725082397461, 0.09022140502929688, 0.09327030181884766, 0.09631919860839844, 0.09936809539794922, 0.1024169921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 6.0, 2.0, 11.0, 15.0, 18.0, 25.0, 51.0, 73.0, 149.0, 230.0, 418.0, 905.0, 1862.0, 4147.0, 10081.0, 29545.0, 140246.0, 608755.0, 194588.0, 36554.0, 11904.0, 4734.0, 2126.0, 964.0, 517.0, 235.0, 147.0, 89.0, 49.0, 26.0, 27.0, 16.0, 11.0, 4.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.38427734375, -0.3734779357910156, -0.36267852783203125, -0.3518791198730469, -0.3410797119140625, -0.3302803039550781, -0.31948089599609375, -0.3086814880371094, -0.297882080078125, -0.2870826721191406, -0.27628326416015625, -0.2654838562011719, -0.2546844482421875, -0.24388504028320312, -0.23308563232421875, -0.22228622436523438, -0.21148681640625, -0.20068740844726562, -0.18988800048828125, -0.17908859252929688, -0.1682891845703125, -0.15748977661132812, -0.14669036865234375, -0.13589096069335938, -0.125091552734375, -0.11429214477539062, -0.10349273681640625, -0.09269332885742188, -0.0818939208984375, -0.07109451293945312, -0.06029510498046875, -0.049495697021484375, -0.0386962890625, -0.027896881103515625, -0.01709747314453125, -0.006298065185546875, 0.0045013427734375, 0.015300750732421875, 0.02610015869140625, 0.036899566650390625, 0.047698974609375, 0.058498382568359375, 0.06929779052734375, 0.08009719848632812, 0.0908966064453125, 0.10169601440429688, 0.11249542236328125, 0.12329483032226562, 0.13409423828125, 0.14489364624023438, 0.15569305419921875, 0.16649246215820312, 0.1772918701171875, 0.18809127807617188, 0.19889068603515625, 0.20969009399414062, 0.220489501953125, 0.23128890991210938, 0.24208831787109375, 0.2528877258300781, 0.2636871337890625, 0.2744865417480469, 0.28528594970703125, 0.2960853576660156, 0.306884765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 4.0, 6.0, 5.0, 16.0, 8.0, 8.0, 13.0, 23.0, 15.0, 19.0, 30.0, 24.0, 25.0, 21.0, 35.0, 36.0, 44.0, 37.0, 33.0, 61.0, 40.0, 49.0, 39.0, 41.0, 39.0, 36.0, 30.0, 36.0, 20.0, 27.0, 20.0, 19.0, 28.0, 20.0, 20.0, 13.0, 10.0, 6.0, 9.0, 8.0, 5.0, 8.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.280517578125, -0.27118682861328125, -0.2618560791015625, -0.25252532958984375, -0.243194580078125, -0.23386383056640625, -0.2245330810546875, -0.21520233154296875, -0.20587158203125, -0.19654083251953125, -0.1872100830078125, -0.17787933349609375, -0.168548583984375, -0.15921783447265625, -0.1498870849609375, -0.14055633544921875, -0.1312255859375, -0.12189483642578125, -0.1125640869140625, -0.10323333740234375, -0.093902587890625, -0.08457183837890625, -0.0752410888671875, -0.06591033935546875, -0.05657958984375, -0.04724884033203125, -0.0379180908203125, -0.02858734130859375, -0.019256591796875, -0.00992584228515625, -0.0005950927734375, 0.00873565673828125, 0.01806640625, 0.02739715576171875, 0.0367279052734375, 0.04605865478515625, 0.055389404296875, 0.06472015380859375, 0.0740509033203125, 0.08338165283203125, 0.09271240234375, 0.10204315185546875, 0.1113739013671875, 0.12070465087890625, 0.130035400390625, 0.13936614990234375, 0.1486968994140625, 0.15802764892578125, 0.1673583984375, 0.17668914794921875, 0.1860198974609375, 0.19535064697265625, 0.204681396484375, 0.21401214599609375, 0.2233428955078125, 0.23267364501953125, 0.24200439453125, 0.25133514404296875, 0.2606658935546875, 0.26999664306640625, 0.279327392578125, 0.28865814208984375, 0.2979888916015625, 0.30731964111328125, 0.316650390625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 15.0, 13.0, 23.0, 30.0, 43.0, 82.0, 136.0, 221.0, 476.0, 924.0, 1824.0, 3901.0, 8697.0, 20349.0, 53922.0, 179532.0, 486835.0, 195224.0, 57679.0, 21448.0, 9070.0, 4096.0, 1987.0, 907.0, 498.0, 276.0, 139.0, 75.0, 48.0, 32.0, 17.0, 14.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11871337890625, -0.11494827270507812, -0.11118316650390625, -0.10741806030273438, -0.1036529541015625, -0.09988784790039062, -0.09612274169921875, -0.09235763549804688, -0.088592529296875, -0.08482742309570312, -0.08106231689453125, -0.07729721069335938, -0.0735321044921875, -0.06976699829101562, -0.06600189208984375, -0.062236785888671875, -0.0584716796875, -0.054706573486328125, -0.05094146728515625, -0.047176361083984375, -0.0434112548828125, -0.039646148681640625, -0.03588104248046875, -0.032115936279296875, -0.028350830078125, -0.024585723876953125, -0.02082061767578125, -0.017055511474609375, -0.0132904052734375, -0.009525299072265625, -0.00576019287109375, -0.001995086669921875, 0.00177001953125, 0.005535125732421875, 0.00930023193359375, 0.013065338134765625, 0.0168304443359375, 0.020595550537109375, 0.02436065673828125, 0.028125762939453125, 0.031890869140625, 0.035655975341796875, 0.03942108154296875, 0.043186187744140625, 0.0469512939453125, 0.050716400146484375, 0.05448150634765625, 0.058246612548828125, 0.06201171875, 0.06577682495117188, 0.06954193115234375, 0.07330703735351562, 0.0770721435546875, 0.08083724975585938, 0.08460235595703125, 0.08836746215820312, 0.092132568359375, 0.09589767456054688, 0.09966278076171875, 0.10342788696289062, 0.1071929931640625, 0.11095809936523438, 0.11472320556640625, 0.11848831176757812, 0.12225341796875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 9.0, 8.0, 15.0, 26.0, 33.0, 77.0, 161.0, 234.0, 193.0, 104.0, 71.0, 13.0, 12.0, 11.0, 10.0, 11.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.655122756958008e-05, -4.480872303247452e-05, -4.306621849536896e-05, -4.13237139582634e-05, -3.958120942115784e-05, -3.7838704884052277e-05, -3.6096200346946716e-05, -3.4353695809841156e-05, -3.2611191272735596e-05, -3.0868686735630035e-05, -2.9126182198524475e-05, -2.7383677661418915e-05, -2.5641173124313354e-05, -2.3898668587207794e-05, -2.2156164050102234e-05, -2.0413659512996674e-05, -1.8671154975891113e-05, -1.6928650438785553e-05, -1.5186145901679993e-05, -1.3443641364574432e-05, -1.1701136827468872e-05, -9.958632290363312e-06, -8.216127753257751e-06, -6.473623216152191e-06, -4.731118679046631e-06, -2.9886141419410706e-06, -1.2461096048355103e-06, 4.9639493227005e-07, 2.2388994693756104e-06, 3.981404006481171e-06, 5.723908543586731e-06, 7.466413080692291e-06, 9.208917617797852e-06, 1.0951422154903412e-05, 1.2693926692008972e-05, 1.4436431229114532e-05, 1.6178935766220093e-05, 1.7921440303325653e-05, 1.9663944840431213e-05, 2.1406449377536774e-05, 2.3148953914642334e-05, 2.4891458451747894e-05, 2.6633962988853455e-05, 2.8376467525959015e-05, 3.0118972063064575e-05, 3.1861476600170135e-05, 3.3603981137275696e-05, 3.5346485674381256e-05, 3.7088990211486816e-05, 3.883149474859238e-05, 4.057399928569794e-05, 4.23165038228035e-05, 4.405900835990906e-05, 4.580151289701462e-05, 4.754401743412018e-05, 4.928652197122574e-05, 5.10290265083313e-05, 5.277153104543686e-05, 5.451403558254242e-05, 5.625654011964798e-05, 5.799904465675354e-05, 5.97415491938591e-05, 6.148405373096466e-05, 6.322655826807022e-05, 6.496906280517578e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 4.0, 8.0, 13.0, 13.0, 18.0, 18.0, 39.0, 56.0, 96.0, 124.0, 176.0, 264.0, 372.0, 630.0, 1014.0, 1852.0, 3645.0, 7375.0, 17374.0, 45431.0, 139766.0, 387898.0, 292887.0, 92529.0, 31961.0, 12584.0, 5744.0, 2823.0, 1454.0, 871.0, 470.0, 354.0, 206.0, 137.0, 99.0, 77.0, 57.0, 38.0, 23.0, 20.0, 10.0, 9.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1021728515625, -0.09885787963867188, -0.09554290771484375, -0.09222793579101562, -0.0889129638671875, -0.08559799194335938, -0.08228302001953125, -0.07896804809570312, -0.075653076171875, -0.07233810424804688, -0.06902313232421875, -0.06570816040039062, -0.0623931884765625, -0.059078216552734375, -0.05576324462890625, -0.052448272705078125, -0.04913330078125, -0.045818328857421875, -0.04250335693359375, -0.039188385009765625, -0.0358734130859375, -0.032558441162109375, -0.02924346923828125, -0.025928497314453125, -0.022613525390625, -0.019298553466796875, -0.01598358154296875, -0.012668609619140625, -0.0093536376953125, -0.006038665771484375, -0.00272369384765625, 0.000591278076171875, 0.00390625, 0.007221221923828125, 0.01053619384765625, 0.013851165771484375, 0.0171661376953125, 0.020481109619140625, 0.02379608154296875, 0.027111053466796875, 0.030426025390625, 0.033740997314453125, 0.03705596923828125, 0.040370941162109375, 0.0436859130859375, 0.047000885009765625, 0.05031585693359375, 0.053630828857421875, 0.05694580078125, 0.060260772705078125, 0.06357574462890625, 0.06689071655273438, 0.0702056884765625, 0.07352066040039062, 0.07683563232421875, 0.08015060424804688, 0.083465576171875, 0.08678054809570312, 0.09009552001953125, 0.09341049194335938, 0.0967254638671875, 0.10004043579101562, 0.10335540771484375, 0.10667037963867188, 0.1099853515625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 6.0, 12.0, 12.0, 11.0, 11.0, 29.0, 40.0, 49.0, 76.0, 73.0, 107.0, 106.0, 95.0, 92.0, 83.0, 58.0, 44.0, 31.0, 16.0, 12.0, 10.0, 6.0, 7.0, 5.0, 5.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1246337890625, -0.12082958221435547, -0.11702537536621094, -0.1132211685180664, -0.10941696166992188, -0.10561275482177734, -0.10180854797363281, -0.09800434112548828, -0.09420013427734375, -0.09039592742919922, -0.08659172058105469, -0.08278751373291016, -0.07898330688476562, -0.0751791000366211, -0.07137489318847656, -0.06757068634033203, -0.0637664794921875, -0.05996227264404297, -0.05615806579589844, -0.052353858947753906, -0.048549652099609375, -0.044745445251464844, -0.04094123840332031, -0.03713703155517578, -0.03333282470703125, -0.02952861785888672, -0.025724411010742188, -0.021920204162597656, -0.018115997314453125, -0.014311790466308594, -0.010507583618164062, -0.006703376770019531, -0.002899169921875, 0.0009050369262695312, 0.0047092437744140625, 0.008513450622558594, 0.012317657470703125, 0.016121864318847656, 0.019926071166992188, 0.02373027801513672, 0.02753448486328125, 0.03133869171142578, 0.03514289855957031, 0.038947105407714844, 0.042751312255859375, 0.046555519104003906, 0.05035972595214844, 0.05416393280029297, 0.0579681396484375, 0.06177234649658203, 0.06557655334472656, 0.0693807601928711, 0.07318496704101562, 0.07698917388916016, 0.08079338073730469, 0.08459758758544922, 0.08840179443359375, 0.09220600128173828, 0.09601020812988281, 0.09981441497802734, 0.10361862182617188, 0.1074228286743164, 0.11122703552246094, 0.11503124237060547, 0.11883544921875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 9.0, 15.0, 19.0, 40.0, 52.0, 70.0, 88.0, 95.0, 104.0, 110.0, 105.0, 82.0, 81.0, 43.0, 22.0, 13.0, 18.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.081995964050293, -1.046774983406067, -1.0115540027618408, -0.9763329029083252, -0.9411119222640991, -0.905890941619873, -0.8706699013710022, -0.8354488611221313, -0.8002278804779053, -0.7650068998336792, -0.7297858595848083, -0.6945648193359375, -0.6593438386917114, -0.6241228580474854, -0.5889018177986145, -0.5536807775497437, -0.5184597969055176, -0.4832387864589691, -0.44801777601242065, -0.4127967655658722, -0.37757575511932373, -0.34235474467277527, -0.3071337342262268, -0.27191272377967834, -0.23669171333312988, -0.20147070288658142, -0.16624969244003296, -0.1310286819934845, -0.09580767154693604, -0.06058666110038757, -0.02536565065383911, 0.00985535979270935, 0.04507637023925781, 0.08029738068580627, 0.11551839113235474, 0.1507394015789032, 0.18596041202545166, 0.22118142247200012, 0.2564024329185486, 0.29162344336509705, 0.3268444538116455, 0.36206546425819397, 0.39728647470474243, 0.4325074851512909, 0.46772849559783936, 0.5029494762420654, 0.5381705164909363, 0.5733915567398071, 0.6086125373840332, 0.6438335180282593, 0.6790545582771301, 0.714275598526001, 0.749496579170227, 0.7847175598144531, 0.819938600063324, 0.8551596403121948, 0.8903806209564209, 0.925601601600647, 0.9608226418495178, 0.9960436820983887, 1.0312646627426147, 1.0664856433868408, 1.1017067432403564, 1.1369277238845825, 1.1721487045288086]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 6.0, 10.0, 16.0, 10.0, 9.0, 15.0, 23.0, 31.0, 26.0, 27.0, 29.0, 29.0, 35.0, 33.0, 36.0, 49.0, 31.0, 29.0, 41.0, 28.0, 39.0, 40.0, 44.0, 40.0, 33.0, 29.0, 29.0, 37.0, 29.0, 20.0, 26.0, 21.0, 18.0, 15.0, 6.0, 6.0, 15.0, 7.0, 7.0, 4.0, 3.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7232616543769836, -0.6990386247634888, -0.6748155951499939, -0.650592565536499, -0.6263695359230042, -0.6021465063095093, -0.5779235363006592, -0.5537004470825195, -0.5294774770736694, -0.5052544474601746, -0.4810314178466797, -0.4568083882331848, -0.43258535861968994, -0.40836232900619507, -0.3841393291950226, -0.3599162995815277, -0.33569324016571045, -0.3114702105522156, -0.2872471809387207, -0.26302415132522583, -0.23880113661289215, -0.21457810699939728, -0.1903550922870636, -0.16613206267356873, -0.14190903306007385, -0.11768600344657898, -0.0934629812836647, -0.06923995912075043, -0.045016929507255554, -0.02079389989376068, 0.003429114818572998, 0.02765214443206787, 0.051875174045562744, 0.07609820365905762, 0.1003212258219719, 0.12454424798488617, 0.14876727759838104, 0.17299030721187592, 0.1972133219242096, 0.22143635153770447, 0.24565938115119934, 0.2698824107646942, 0.2941054403781891, 0.3183284401893616, 0.34255146980285645, 0.3667744994163513, 0.3909975290298462, 0.41522055864334106, 0.43944358825683594, 0.4636666178703308, 0.4878896474838257, 0.5121126770973206, 0.5363357067108154, 0.5605587363243103, 0.5847817659378052, 0.6090047359466553, 0.6332278251647949, 0.6574508547782898, 0.6816738843917847, 0.7058969140052795, 0.7301199436187744, 0.7543429732322693, 0.7785660028457642, 0.8027889728546143, 0.8270120024681091]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 7.0, 6.0, 14.0, 20.0, 26.0, 53.0, 56.0, 72.0, 148.0, 207.0, 317.0, 549.0, 920.0, 1724.0, 3318.0, 6907.0, 14464.0, 35035.0, 87020.0, 247254.0, 878120.0, 1955461.0, 646171.0, 192525.0, 69884.0, 28841.0, 12506.0, 5884.0, 2959.0, 1586.0, 880.0, 477.0, 297.0, 192.0, 128.0, 74.0, 66.0, 43.0, 27.0, 28.0, 7.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.153564453125, -0.14815521240234375, -0.1427459716796875, -0.13733673095703125, -0.131927490234375, -0.12651824951171875, -0.1211090087890625, -0.11569976806640625, -0.11029052734375, -0.10488128662109375, -0.0994720458984375, -0.09406280517578125, -0.088653564453125, -0.08324432373046875, -0.0778350830078125, -0.07242584228515625, -0.0670166015625, -0.06160736083984375, -0.0561981201171875, -0.05078887939453125, -0.045379638671875, -0.03997039794921875, -0.0345611572265625, -0.02915191650390625, -0.02374267578125, -0.01833343505859375, -0.0129241943359375, -0.00751495361328125, -0.002105712890625, 0.00330352783203125, 0.0087127685546875, 0.01412200927734375, 0.01953125, 0.02494049072265625, 0.0303497314453125, 0.03575897216796875, 0.041168212890625, 0.04657745361328125, 0.0519866943359375, 0.05739593505859375, 0.06280517578125, 0.06821441650390625, 0.0736236572265625, 0.07903289794921875, 0.084442138671875, 0.08985137939453125, 0.0952606201171875, 0.10066986083984375, 0.1060791015625, 0.11148834228515625, 0.1168975830078125, 0.12230682373046875, 0.127716064453125, 0.13312530517578125, 0.1385345458984375, 0.14394378662109375, 0.14935302734375, 0.15476226806640625, 0.1601715087890625, 0.16558074951171875, 0.170989990234375, 0.17639923095703125, 0.1818084716796875, 0.18721771240234375, 0.192626953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 7.0, 11.0, 9.0, 7.0, 16.0, 17.0, 19.0, 33.0, 22.0, 35.0, 40.0, 34.0, 31.0, 46.0, 29.0, 44.0, 37.0, 43.0, 48.0, 37.0, 49.0, 41.0, 46.0, 43.0, 47.0, 20.0, 26.0, 16.0, 17.0, 24.0, 18.0, 10.0, 12.0, 15.0, 5.0, 5.0, 3.0, 8.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.11199951171875, -0.10868549346923828, -0.10537147521972656, -0.10205745697021484, -0.09874343872070312, -0.0954294204711914, -0.09211540222167969, -0.08880138397216797, -0.08548736572265625, -0.08217334747314453, -0.07885932922363281, -0.0755453109741211, -0.07223129272460938, -0.06891727447509766, -0.06560325622558594, -0.06228923797607422, -0.0589752197265625, -0.05566120147705078, -0.05234718322753906, -0.049033164978027344, -0.045719146728515625, -0.042405128479003906, -0.03909111022949219, -0.03577709197998047, -0.03246307373046875, -0.02914905548095703, -0.025835037231445312, -0.022521018981933594, -0.019207000732421875, -0.015892982482910156, -0.012578964233398438, -0.009264945983886719, -0.005950927734375, -0.0026369094848632812, 0.0006771087646484375, 0.003991127014160156, 0.007305145263671875, 0.010619163513183594, 0.013933181762695312, 0.01724720001220703, 0.02056121826171875, 0.02387523651123047, 0.027189254760742188, 0.030503273010253906, 0.033817291259765625, 0.037131309509277344, 0.04044532775878906, 0.04375934600830078, 0.0470733642578125, 0.05038738250732422, 0.05370140075683594, 0.057015419006347656, 0.060329437255859375, 0.0636434555053711, 0.06695747375488281, 0.07027149200439453, 0.07358551025390625, 0.07689952850341797, 0.08021354675292969, 0.0835275650024414, 0.08684158325195312, 0.09015560150146484, 0.09346961975097656, 0.09678363800048828, 0.10009765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 4.0, 6.0, 7.0, 9.0, 14.0, 16.0, 23.0, 22.0, 21.0, 27.0, 45.0, 66.0, 106.0, 148.0, 242.0, 420.0, 774.0, 1754.0, 4185.0, 12381.0, 40927.0, 166525.0, 960806.0, 2495399.0, 391180.0, 84165.0, 22562.0, 7071.0, 2748.0, 1173.0, 591.0, 321.0, 179.0, 97.0, 79.0, 45.0, 37.0, 13.0, 23.0, 19.0, 12.0, 7.0, 5.0, 6.0, 6.0, 8.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.275146484375, -0.26467132568359375, -0.2541961669921875, -0.24372100830078125, -0.233245849609375, -0.22277069091796875, -0.2122955322265625, -0.20182037353515625, -0.19134521484375, -0.18087005615234375, -0.1703948974609375, -0.15991973876953125, -0.149444580078125, -0.13896942138671875, -0.1284942626953125, -0.11801910400390625, -0.1075439453125, -0.09706878662109375, -0.0865936279296875, -0.07611846923828125, -0.065643310546875, -0.05516815185546875, -0.0446929931640625, -0.03421783447265625, -0.02374267578125, -0.01326751708984375, -0.0027923583984375, 0.00768280029296875, 0.018157958984375, 0.02863311767578125, 0.0391082763671875, 0.04958343505859375, 0.06005859375, 0.07053375244140625, 0.0810089111328125, 0.09148406982421875, 0.101959228515625, 0.11243438720703125, 0.1229095458984375, 0.13338470458984375, 0.14385986328125, 0.15433502197265625, 0.1648101806640625, 0.17528533935546875, 0.185760498046875, 0.19623565673828125, 0.2067108154296875, 0.21718597412109375, 0.2276611328125, 0.23813629150390625, 0.2486114501953125, 0.25908660888671875, 0.269561767578125, 0.28003692626953125, 0.2905120849609375, 0.30098724365234375, 0.31146240234375, 0.32193756103515625, 0.3324127197265625, 0.34288787841796875, 0.353363037109375, 0.36383819580078125, 0.3743133544921875, 0.38478851318359375, 0.395263671875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 8.0, 7.0, 18.0, 24.0, 39.0, 49.0, 77.0, 95.0, 154.0, 209.0, 364.0, 630.0, 882.0, 618.0, 304.0, 220.0, 139.0, 80.0, 57.0, 37.0, 33.0, 13.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.460693359375, -0.44899749755859375, -0.4373016357421875, -0.42560577392578125, -0.413909912109375, -0.40221405029296875, -0.3905181884765625, -0.37882232666015625, -0.36712646484375, -0.35543060302734375, -0.3437347412109375, -0.33203887939453125, -0.320343017578125, -0.30864715576171875, -0.2969512939453125, -0.28525543212890625, -0.2735595703125, -0.26186370849609375, -0.2501678466796875, -0.23847198486328125, -0.226776123046875, -0.21508026123046875, -0.2033843994140625, -0.19168853759765625, -0.17999267578125, -0.16829681396484375, -0.1566009521484375, -0.14490509033203125, -0.133209228515625, -0.12151336669921875, -0.1098175048828125, -0.09812164306640625, -0.08642578125, -0.07472991943359375, -0.0630340576171875, -0.05133819580078125, -0.039642333984375, -0.02794647216796875, -0.0162506103515625, -0.00455474853515625, 0.00714111328125, 0.01883697509765625, 0.0305328369140625, 0.04222869873046875, 0.053924560546875, 0.06562042236328125, 0.0773162841796875, 0.08901214599609375, 0.1007080078125, 0.11240386962890625, 0.1240997314453125, 0.13579559326171875, 0.147491455078125, 0.15918731689453125, 0.1708831787109375, 0.18257904052734375, 0.19427490234375, 0.20597076416015625, 0.2176666259765625, 0.22936248779296875, 0.241058349609375, 0.25275421142578125, 0.2644500732421875, 0.27614593505859375, 0.287841796875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 17.0, 46.0, 92.0, 166.0, 208.0, 193.0, 130.0, 77.0, 37.0, 10.0, 3.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6999917030334473, -2.607011318206787, -2.514031171798706, -2.421050786972046, -2.328070640563965, -2.2350902557373047, -2.1421101093292236, -2.0491297245025635, -1.9561495780944824, -1.8631693124771118, -1.7701890468597412, -1.6772087812423706, -1.584228515625, -1.4912482500076294, -1.3982679843902588, -1.3052875995635986, -1.212307333946228, -1.1193270683288574, -1.0263468027114868, -0.9333665370941162, -0.8403862714767456, -0.747406005859375, -0.6544256806373596, -0.561445415019989, -0.4684651494026184, -0.3754848837852478, -0.2825046181678772, -0.1895243227481842, -0.0965440571308136, -0.003563791513442993, 0.08941650390625, 0.1823967695236206, 0.2753770351409912, 0.3683573007583618, 0.4613375663757324, 0.554317831993103, 0.6472980976104736, 0.7402783632278442, 0.8332586884498596, 0.9262389540672302, 1.019219160079956, 1.1121994256973267, 1.2051796913146973, 1.2981599569320679, 1.3911402225494385, 1.484120488166809, 1.5771007537841797, 1.6700811386108398, 1.7630614042282104, 1.856041669845581, 1.9490219354629517, 2.0420022010803223, 2.1349825859069824, 2.2279627323150635, 2.3209431171417236, 2.4139232635498047, 2.506903648376465, 2.599884033203125, 2.692864179611206, 2.785844564437866, 2.8788247108459473, 2.9718050956726074, 3.0647852420806885, 3.1577656269073486, 3.2507457733154297]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 9.0, 9.0, 12.0, 13.0, 9.0, 24.0, 15.0, 14.0, 19.0, 23.0, 28.0, 29.0, 37.0, 34.0, 28.0, 46.0, 37.0, 47.0, 34.0, 42.0, 35.0, 42.0, 39.0, 38.0, 37.0, 28.0, 21.0, 23.0, 23.0, 27.0, 21.0, 22.0, 16.0, 16.0, 15.0, 16.0, 13.0, 13.0, 5.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.8448373079299927, -0.8209336400032043, -0.7970299124717712, -0.7731262445449829, -0.7492225170135498, -0.7253188490867615, -0.7014151811599731, -0.67751145362854, -0.6536077857017517, -0.6297041177749634, -0.6058003902435303, -0.5818967223167419, -0.5579930543899536, -0.5340893268585205, -0.5101856589317322, -0.48628196120262146, -0.46237826347351074, -0.4384745657444, -0.4145708680152893, -0.390667200088501, -0.36676350235939026, -0.34285980463027954, -0.3189561367034912, -0.2950524389743805, -0.2711487412452698, -0.24724504351615906, -0.22334136068820953, -0.19943767786026, -0.1755339801311493, -0.15163028240203857, -0.12772659957408905, -0.10382291674613953, -0.07991921901702881, -0.05601552873849869, -0.03211183845996857, -0.008208148181438446, 0.015695542097091675, 0.039599232375621796, 0.06350292265415192, 0.08740660548210144, 0.11131030321121216, 0.13521400094032288, 0.1591176837682724, 0.18302136659622192, 0.20692506432533264, 0.23082876205444336, 0.2547324299812317, 0.2786361277103424, 0.3025398254394531, 0.32644352316856384, 0.35034722089767456, 0.3742508888244629, 0.3981545865535736, 0.4220582842826843, 0.44596195220947266, 0.4698656499385834, 0.4937693476676941, 0.5176730155944824, 0.5415767431259155, 0.5654804110527039, 0.5893840789794922, 0.6132878065109253, 0.6371914744377136, 0.661095142364502, 0.6849988698959351]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 7.0, 17.0, 17.0, 27.0, 50.0, 88.0, 112.0, 186.0, 275.0, 448.0, 672.0, 1062.0, 1529.0, 2373.0, 3487.0, 4953.0, 7666.0, 11923.0, 22117.0, 52456.0, 180364.0, 445955.0, 197235.0, 56366.0, 23275.0, 12414.0, 7759.0, 5157.0, 3534.0, 2436.0, 1574.0, 1052.0, 731.0, 465.0, 276.0, 207.0, 108.0, 54.0, 43.0, 32.0, 24.0, 8.0, 12.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.298095703125, -0.2899360656738281, -0.28177642822265625, -0.2736167907714844, -0.2654571533203125, -0.2572975158691406, -0.24913787841796875, -0.24097824096679688, -0.232818603515625, -0.22465896606445312, -0.21649932861328125, -0.20833969116210938, -0.2001800537109375, -0.19202041625976562, -0.18386077880859375, -0.17570114135742188, -0.16754150390625, -0.15938186645507812, -0.15122222900390625, -0.14306259155273438, -0.1349029541015625, -0.12674331665039062, -0.11858367919921875, -0.11042404174804688, -0.102264404296875, -0.09410476684570312, -0.08594512939453125, -0.07778549194335938, -0.0696258544921875, -0.061466217041015625, -0.05330657958984375, -0.045146942138671875, -0.0369873046875, -0.028827667236328125, -0.02066802978515625, -0.012508392333984375, -0.0043487548828125, 0.003810882568359375, 0.01197052001953125, 0.020130157470703125, 0.028289794921875, 0.036449432373046875, 0.04460906982421875, 0.052768707275390625, 0.0609283447265625, 0.06908798217773438, 0.07724761962890625, 0.08540725708007812, 0.09356689453125, 0.10172653198242188, 0.10988616943359375, 0.11804580688476562, 0.1262054443359375, 0.13436508178710938, 0.14252471923828125, 0.15068435668945312, 0.158843994140625, 0.16700363159179688, 0.17516326904296875, 0.18332290649414062, 0.1914825439453125, 0.19964218139648438, 0.20780181884765625, 0.21596145629882812, 0.22412109375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 8.0, 7.0, 9.0, 5.0, 8.0, 19.0, 14.0, 21.0, 19.0, 15.0, 27.0, 28.0, 31.0, 23.0, 31.0, 39.0, 36.0, 49.0, 40.0, 37.0, 43.0, 39.0, 49.0, 35.0, 34.0, 36.0, 36.0, 38.0, 35.0, 27.0, 16.0, 15.0, 20.0, 19.0, 12.0, 9.0, 12.0, 6.0, 11.0, 8.0, 6.0, 9.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0], "bins": [-0.1163330078125, -0.11287498474121094, -0.10941696166992188, -0.10595893859863281, -0.10250091552734375, -0.09904289245605469, -0.09558486938476562, -0.09212684631347656, -0.0886688232421875, -0.08521080017089844, -0.08175277709960938, -0.07829475402832031, -0.07483673095703125, -0.07137870788574219, -0.06792068481445312, -0.06446266174316406, -0.061004638671875, -0.05754661560058594, -0.054088592529296875, -0.05063056945800781, -0.04717254638671875, -0.04371452331542969, -0.040256500244140625, -0.03679847717285156, -0.0333404541015625, -0.029882431030273438, -0.026424407958984375, -0.022966384887695312, -0.01950836181640625, -0.016050338745117188, -0.012592315673828125, -0.009134292602539062, -0.00567626953125, -0.0022182464599609375, 0.001239776611328125, 0.0046977996826171875, 0.00815582275390625, 0.011613845825195312, 0.015071868896484375, 0.018529891967773438, 0.0219879150390625, 0.025445938110351562, 0.028903961181640625, 0.03236198425292969, 0.03582000732421875, 0.03927803039550781, 0.042736053466796875, 0.04619407653808594, 0.049652099609375, 0.05311012268066406, 0.056568145751953125, 0.06002616882324219, 0.06348419189453125, 0.06694221496582031, 0.07040023803710938, 0.07385826110839844, 0.0773162841796875, 0.08077430725097656, 0.08423233032226562, 0.08769035339355469, 0.09114837646484375, 0.09460639953613281, 0.09806442260742188, 0.10152244567871094, 0.10498046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 12.0, 16.0, 16.0, 21.0, 27.0, 46.0, 62.0, 81.0, 164.0, 285.0, 513.0, 994.0, 2072.0, 4699.0, 10768.0, 25704.0, 77331.0, 493232.0, 337383.0, 57585.0, 20928.0, 8975.0, 3896.0, 1769.0, 863.0, 399.0, 243.0, 148.0, 100.0, 58.0, 42.0, 25.0, 21.0, 20.0, 13.0, 8.0, 6.0, 6.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.368408203125, -0.3556556701660156, -0.34290313720703125, -0.3301506042480469, -0.3173980712890625, -0.3046455383300781, -0.29189300537109375, -0.2791404724121094, -0.266387939453125, -0.2536354064941406, -0.24088287353515625, -0.22813034057617188, -0.2153778076171875, -0.20262527465820312, -0.18987274169921875, -0.17712020874023438, -0.16436767578125, -0.15161514282226562, -0.13886260986328125, -0.12611007690429688, -0.1133575439453125, -0.10060501098632812, -0.08785247802734375, -0.07509994506835938, -0.062347412109375, -0.049594879150390625, -0.03684234619140625, -0.024089813232421875, -0.0113372802734375, 0.001415252685546875, 0.01416778564453125, 0.026920318603515625, 0.0396728515625, 0.052425384521484375, 0.06517791748046875, 0.07793045043945312, 0.0906829833984375, 0.10343551635742188, 0.11618804931640625, 0.12894058227539062, 0.141693115234375, 0.15444564819335938, 0.16719818115234375, 0.17995071411132812, 0.1927032470703125, 0.20545578002929688, 0.21820831298828125, 0.23096084594726562, 0.24371337890625, 0.2564659118652344, 0.26921844482421875, 0.2819709777832031, 0.2947235107421875, 0.3074760437011719, 0.32022857666015625, 0.3329811096191406, 0.345733642578125, 0.3584861755371094, 0.37123870849609375, 0.3839912414550781, 0.3967437744140625, 0.4094963073730469, 0.42224884033203125, 0.4350013732910156, 0.44775390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 7.0, 6.0, 5.0, 8.0, 12.0, 13.0, 10.0, 23.0, 18.0, 15.0, 27.0, 22.0, 32.0, 22.0, 44.0, 42.0, 43.0, 38.0, 47.0, 44.0, 57.0, 49.0, 51.0, 47.0, 44.0, 41.0, 36.0, 33.0, 31.0, 18.0, 15.0, 19.0, 20.0, 10.0, 10.0, 8.0, 10.0, 7.0, 5.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3037109375, -0.29177093505859375, -0.2798309326171875, -0.26789093017578125, -0.255950927734375, -0.24401092529296875, -0.2320709228515625, -0.22013092041015625, -0.20819091796875, -0.19625091552734375, -0.1843109130859375, -0.17237091064453125, -0.160430908203125, -0.14849090576171875, -0.1365509033203125, -0.12461090087890625, -0.1126708984375, -0.10073089599609375, -0.0887908935546875, -0.07685089111328125, -0.064910888671875, -0.05297088623046875, -0.0410308837890625, -0.02909088134765625, -0.01715087890625, -0.00521087646484375, 0.0067291259765625, 0.01866912841796875, 0.030609130859375, 0.04254913330078125, 0.0544891357421875, 0.06642913818359375, 0.078369140625, 0.09030914306640625, 0.1022491455078125, 0.11418914794921875, 0.126129150390625, 0.13806915283203125, 0.1500091552734375, 0.16194915771484375, 0.17388916015625, 0.18582916259765625, 0.1977691650390625, 0.20970916748046875, 0.221649169921875, 0.23358917236328125, 0.2455291748046875, 0.25746917724609375, 0.2694091796875, 0.28134918212890625, 0.2932891845703125, 0.30522918701171875, 0.317169189453125, 0.32910919189453125, 0.3410491943359375, 0.35298919677734375, 0.36492919921875, 0.37686920166015625, 0.3888092041015625, 0.40074920654296875, 0.412689208984375, 0.42462921142578125, 0.4365692138671875, 0.44850921630859375, 0.46044921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 14.0, 11.0, 17.0, 17.0, 47.0, 82.0, 122.0, 174.0, 267.0, 505.0, 921.0, 1517.0, 2891.0, 4959.0, 9342.0, 18558.0, 41000.0, 119825.0, 476711.0, 250341.0, 66053.0, 26951.0, 12733.0, 6798.0, 3757.0, 2136.0, 1141.0, 673.0, 397.0, 228.0, 133.0, 80.0, 56.0, 32.0, 16.0, 15.0, 8.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.14501953125, -0.14072227478027344, -0.13642501831054688, -0.1321277618408203, -0.12783050537109375, -0.12353324890136719, -0.11923599243164062, -0.11493873596191406, -0.1106414794921875, -0.10634422302246094, -0.10204696655273438, -0.09774971008300781, -0.09345245361328125, -0.08915519714355469, -0.08485794067382812, -0.08056068420410156, -0.076263427734375, -0.07196617126464844, -0.06766891479492188, -0.06337165832519531, -0.05907440185546875, -0.05477714538574219, -0.050479888916015625, -0.04618263244628906, -0.0418853759765625, -0.03758811950683594, -0.033290863037109375, -0.028993606567382812, -0.02469635009765625, -0.020399093627929688, -0.016101837158203125, -0.011804580688476562, -0.00750732421875, -0.0032100677490234375, 0.001087188720703125, 0.0053844451904296875, 0.00968170166015625, 0.013978958129882812, 0.018276214599609375, 0.022573471069335938, 0.0268707275390625, 0.031167984008789062, 0.035465240478515625, 0.03976249694824219, 0.04405975341796875, 0.04835700988769531, 0.052654266357421875, 0.05695152282714844, 0.061248779296875, 0.06554603576660156, 0.06984329223632812, 0.07414054870605469, 0.07843780517578125, 0.08273506164550781, 0.08703231811523438, 0.09132957458496094, 0.0956268310546875, 0.09992408752441406, 0.10422134399414062, 0.10851860046386719, 0.11281585693359375, 0.11711311340332031, 0.12141036987304688, 0.12570762634277344, 0.1300048828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 4.0, 12.0, 12.0, 12.0, 28.0, 30.0, 82.0, 148.0, 196.0, 200.0, 97.0, 49.0, 37.0, 19.0, 9.0, 11.0, 9.0, 10.0, 6.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5180320739746094e-05, -4.349276423454285e-05, -4.18052077293396e-05, -4.011765122413635e-05, -3.8430094718933105e-05, -3.674253821372986e-05, -3.505498170852661e-05, -3.3367425203323364e-05, -3.167986869812012e-05, -2.999231219291687e-05, -2.8304755687713623e-05, -2.6617199182510376e-05, -2.492964267730713e-05, -2.3242086172103882e-05, -2.1554529666900635e-05, -1.9866973161697388e-05, -1.817941665649414e-05, -1.6491860151290894e-05, -1.4804303646087646e-05, -1.31167471408844e-05, -1.1429190635681152e-05, -9.741634130477905e-06, -8.054077625274658e-06, -6.366521120071411e-06, -4.678964614868164e-06, -2.991408109664917e-06, -1.30385160446167e-06, 3.8370490074157715e-07, 2.0712614059448242e-06, 3.7588179111480713e-06, 5.446374416351318e-06, 7.1339309215545654e-06, 8.821487426757812e-06, 1.050904393196106e-05, 1.2196600437164307e-05, 1.3884156942367554e-05, 1.55717134475708e-05, 1.7259269952774048e-05, 1.8946826457977295e-05, 2.0634382963180542e-05, 2.232193946838379e-05, 2.4009495973587036e-05, 2.5697052478790283e-05, 2.738460898399353e-05, 2.9072165489196777e-05, 3.0759721994400024e-05, 3.244727849960327e-05, 3.413483500480652e-05, 3.5822391510009766e-05, 3.750994801521301e-05, 3.919750452041626e-05, 4.088506102561951e-05, 4.2572617530822754e-05, 4.4260174036026e-05, 4.594773054122925e-05, 4.7635287046432495e-05, 4.932284355163574e-05, 5.101040005683899e-05, 5.2697956562042236e-05, 5.4385513067245483e-05, 5.607306957244873e-05, 5.776062607765198e-05, 5.9448182582855225e-05, 6.113573908805847e-05, 6.282329559326172e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 8.0, 13.0, 14.0, 21.0, 31.0, 49.0, 81.0, 113.0, 229.0, 400.0, 771.0, 1914.0, 4116.0, 10364.0, 27621.0, 90741.0, 367763.0, 395977.0, 99386.0, 29568.0, 11015.0, 4477.0, 1939.0, 914.0, 434.0, 229.0, 128.0, 64.0, 47.0, 36.0, 21.0, 10.0, 17.0, 11.0, 7.0, 9.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.165771484375, -0.16117095947265625, -0.1565704345703125, -0.15196990966796875, -0.147369384765625, -0.14276885986328125, -0.1381683349609375, -0.13356781005859375, -0.12896728515625, -0.12436676025390625, -0.1197662353515625, -0.11516571044921875, -0.110565185546875, -0.10596466064453125, -0.1013641357421875, -0.09676361083984375, -0.0921630859375, -0.08756256103515625, -0.0829620361328125, -0.07836151123046875, -0.073760986328125, -0.06916046142578125, -0.0645599365234375, -0.05995941162109375, -0.05535888671875, -0.05075836181640625, -0.0461578369140625, -0.04155731201171875, -0.036956787109375, -0.03235626220703125, -0.0277557373046875, -0.02315521240234375, -0.0185546875, -0.01395416259765625, -0.0093536376953125, -0.00475311279296875, -0.000152587890625, 0.00444793701171875, 0.0090484619140625, 0.01364898681640625, 0.01824951171875, 0.02285003662109375, 0.0274505615234375, 0.03205108642578125, 0.036651611328125, 0.04125213623046875, 0.0458526611328125, 0.05045318603515625, 0.0550537109375, 0.05965423583984375, 0.0642547607421875, 0.06885528564453125, 0.073455810546875, 0.07805633544921875, 0.0826568603515625, 0.08725738525390625, 0.09185791015625, 0.09645843505859375, 0.1010589599609375, 0.10565948486328125, 0.110260009765625, 0.11486053466796875, 0.1194610595703125, 0.12406158447265625, 0.128662109375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 2.0, 5.0, 7.0, 6.0, 15.0, 15.0, 10.0, 23.0, 31.0, 38.0, 49.0, 59.0, 76.0, 109.0, 89.0, 104.0, 84.0, 58.0, 46.0, 33.0, 27.0, 29.0, 18.0, 9.0, 12.0, 9.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1148681640625, -0.11110687255859375, -0.1073455810546875, -0.10358428955078125, -0.099822998046875, -0.09606170654296875, -0.0923004150390625, -0.08853912353515625, -0.08477783203125, -0.08101654052734375, -0.0772552490234375, -0.07349395751953125, -0.069732666015625, -0.06597137451171875, -0.0622100830078125, -0.05844879150390625, -0.0546875, -0.05092620849609375, -0.0471649169921875, -0.04340362548828125, -0.039642333984375, -0.03588104248046875, -0.0321197509765625, -0.02835845947265625, -0.02459716796875, -0.02083587646484375, -0.0170745849609375, -0.01331329345703125, -0.009552001953125, -0.00579071044921875, -0.0020294189453125, 0.00173187255859375, 0.0054931640625, 0.00925445556640625, 0.0130157470703125, 0.01677703857421875, 0.020538330078125, 0.02429962158203125, 0.0280609130859375, 0.03182220458984375, 0.03558349609375, 0.03934478759765625, 0.0431060791015625, 0.04686737060546875, 0.050628662109375, 0.05438995361328125, 0.0581512451171875, 0.06191253662109375, 0.065673828125, 0.06943511962890625, 0.0731964111328125, 0.07695770263671875, 0.080718994140625, 0.08448028564453125, 0.0882415771484375, 0.09200286865234375, 0.09576416015625, 0.09952545166015625, 0.1032867431640625, 0.10704803466796875, 0.110809326171875, 0.11457061767578125, 0.1183319091796875, 0.12209320068359375, 0.1258544921875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 16.0, 39.0, 53.0, 104.0, 125.0, 139.0, 158.0, 135.0, 87.0, 53.0, 39.0, 24.0, 11.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.616220474243164, -1.545584797859192, -1.4749491214752197, -1.404313325881958, -1.3336776494979858, -1.2630419731140137, -1.192406177520752, -1.1217705011367798, -1.0511348247528076, -0.9804991483688354, -0.9098634123802185, -0.8392276763916016, -0.7685920000076294, -0.6979563236236572, -0.6273205876350403, -0.5566848516464233, -0.48604917526245117, -0.4154134690761566, -0.34477776288986206, -0.2741420567035675, -0.20350635051727295, -0.1328706443309784, -0.06223493814468384, 0.008400768041610718, 0.07903647422790527, 0.14967218041419983, 0.22030788660049438, 0.29094359278678894, 0.3615792989730835, 0.43221500515937805, 0.5028507113456726, 0.5734864473342896, 0.6441221237182617, 0.7147578001022339, 0.7853935360908508, 0.8560292720794678, 0.9266649484634399, 0.9973006248474121, 1.0679364204406738, 1.138572096824646, 1.2092077732086182, 1.2798434495925903, 1.3504791259765625, 1.4211149215698242, 1.4917505979537964, 1.5623862743377686, 1.6330220699310303, 1.7036577463150024, 1.7742934226989746, 1.8449290990829468, 1.915564775466919, 1.9862005710601807, 2.0568361282348633, 2.127471923828125, 2.1981077194213867, 2.2687432765960693, 2.339379072189331, 2.4100148677825928, 2.4806504249572754, 2.551286220550537, 2.621922016143799, 2.6925575733184814, 2.763193368911743, 2.833828926086426, 2.9044647216796875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 8.0, 6.0, 10.0, 6.0, 9.0, 12.0, 7.0, 13.0, 14.0, 23.0, 13.0, 18.0, 22.0, 19.0, 35.0, 19.0, 32.0, 32.0, 39.0, 30.0, 30.0, 44.0, 39.0, 32.0, 37.0, 40.0, 29.0, 34.0, 31.0, 35.0, 32.0, 31.0, 25.0, 25.0, 21.0, 24.0, 16.0, 20.0, 11.0, 7.0, 17.0, 8.0, 9.0, 5.0, 12.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.7879053950309753, -0.7606739401817322, -0.7334424257278442, -0.7062109708786011, -0.6789795160293579, -0.6517480611801147, -0.6245166063308716, -0.5972850918769836, -0.5700536370277405, -0.5428221821784973, -0.5155906677246094, -0.4883592128753662, -0.46112775802612305, -0.4338963031768799, -0.40666481852531433, -0.3794333338737488, -0.3522018790245056, -0.32497042417526245, -0.2977389395236969, -0.27050745487213135, -0.24327600002288818, -0.21604453027248383, -0.18881306052207947, -0.1615815907716751, -0.13435012102127075, -0.1071186512708664, -0.07988718152046204, -0.05265571177005768, -0.02542424201965332, 0.0018072277307510376, 0.029038697481155396, 0.05627016723155975, 0.08350157737731934, 0.1107330471277237, 0.13796451687812805, 0.1651959866285324, 0.19242745637893677, 0.21965892612934113, 0.24689039587974548, 0.27412188053131104, 0.3013533353805542, 0.32858479022979736, 0.3558162748813629, 0.38304775953292847, 0.41027921438217163, 0.4375106692314148, 0.46474215388298035, 0.4919736385345459, 0.5192050933837891, 0.5464365482330322, 0.5736680030822754, 0.6008995175361633, 0.6281309723854065, 0.6553624272346497, 0.6825939416885376, 0.7098253965377808, 0.7370568513870239, 0.7642883062362671, 0.7915197610855103, 0.8187512755393982, 0.8459827303886414, 0.8732141852378845, 0.9004456996917725, 0.9276771545410156, 0.9549086093902588]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 9.0, 11.0, 19.0, 23.0, 44.0, 72.0, 123.0, 199.0, 332.0, 619.0, 1021.0, 2119.0, 4141.0, 8772.0, 20423.0, 51008.0, 146379.0, 533199.0, 1943044.0, 1086319.0, 259442.0, 81545.0, 30572.0, 13008.0, 5880.0, 2827.0, 1374.0, 733.0, 407.0, 229.0, 149.0, 95.0, 55.0, 43.0, 18.0, 14.0, 7.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.179931640625, -0.17366981506347656, -0.16740798950195312, -0.1611461639404297, -0.15488433837890625, -0.1486225128173828, -0.14236068725585938, -0.13609886169433594, -0.1298370361328125, -0.12357521057128906, -0.11731338500976562, -0.11105155944824219, -0.10478973388671875, -0.09852790832519531, -0.09226608276367188, -0.08600425720214844, -0.079742431640625, -0.07348060607910156, -0.06721878051757812, -0.06095695495605469, -0.05469512939453125, -0.04843330383300781, -0.042171478271484375, -0.03590965270996094, -0.0296478271484375, -0.023386001586914062, -0.017124176025390625, -0.010862350463867188, -0.00460052490234375, 0.0016613006591796875, 0.007923126220703125, 0.014184951782226562, 0.02044677734375, 0.026708602905273438, 0.032970428466796875, 0.03923225402832031, 0.04549407958984375, 0.05175590515136719, 0.058017730712890625, 0.06427955627441406, 0.0705413818359375, 0.07680320739746094, 0.08306503295898438, 0.08932685852050781, 0.09558868408203125, 0.10185050964355469, 0.10811233520507812, 0.11437416076660156, 0.120635986328125, 0.12689781188964844, 0.13315963745117188, 0.1394214630126953, 0.14568328857421875, 0.1519451141357422, 0.15820693969726562, 0.16446876525878906, 0.1707305908203125, 0.17699241638183594, 0.18325424194335938, 0.1895160675048828, 0.19577789306640625, 0.2020397186279297, 0.20830154418945312, 0.21456336975097656, 0.2208251953125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 5.0, 7.0, 11.0, 9.0, 14.0, 19.0, 22.0, 26.0, 26.0, 24.0, 29.0, 26.0, 32.0, 28.0, 34.0, 44.0, 46.0, 34.0, 39.0, 47.0, 36.0, 40.0, 34.0, 32.0, 36.0, 30.0, 38.0, 28.0, 21.0, 22.0, 20.0, 19.0, 17.0, 11.0, 12.0, 10.0, 9.0, 6.0, 8.0, 4.0, 6.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.11962890625, -0.1160116195678711, -0.11239433288574219, -0.10877704620361328, -0.10515975952148438, -0.10154247283935547, -0.09792518615722656, -0.09430789947509766, -0.09069061279296875, -0.08707332611083984, -0.08345603942871094, -0.07983875274658203, -0.07622146606445312, -0.07260417938232422, -0.06898689270019531, -0.0653696060180664, -0.0617523193359375, -0.058135032653808594, -0.05451774597167969, -0.05090045928955078, -0.047283172607421875, -0.04366588592529297, -0.04004859924316406, -0.036431312561035156, -0.03281402587890625, -0.029196739196777344, -0.025579452514648438, -0.02196216583251953, -0.018344879150390625, -0.014727592468261719, -0.011110305786132812, -0.007493019104003906, -0.003875732421875, -0.00025844573974609375, 0.0033588409423828125, 0.006976127624511719, 0.010593414306640625, 0.014210700988769531, 0.017827987670898438, 0.021445274353027344, 0.02506256103515625, 0.028679847717285156, 0.03229713439941406, 0.03591442108154297, 0.039531707763671875, 0.04314899444580078, 0.04676628112792969, 0.050383567810058594, 0.0540008544921875, 0.057618141174316406, 0.06123542785644531, 0.06485271453857422, 0.06847000122070312, 0.07208728790283203, 0.07570457458496094, 0.07932186126708984, 0.08293914794921875, 0.08655643463134766, 0.09017372131347656, 0.09379100799560547, 0.09740829467773438, 0.10102558135986328, 0.10464286804199219, 0.1082601547241211, 0.11187744140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 8.0, 9.0, 13.0, 21.0, 19.0, 33.0, 54.0, 97.0, 142.0, 224.0, 477.0, 1100.0, 3086.0, 9672.0, 40883.0, 239506.0, 2486836.0, 1238590.0, 137007.0, 25841.0, 6670.0, 2239.0, 872.0, 414.0, 181.0, 86.0, 53.0, 31.0, 28.0, 22.0, 18.0, 12.0, 8.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.427734375, -0.4134063720703125, -0.399078369140625, -0.3847503662109375, -0.37042236328125, -0.3560943603515625, -0.341766357421875, -0.3274383544921875, -0.3131103515625, -0.2987823486328125, -0.284454345703125, -0.2701263427734375, -0.25579833984375, -0.2414703369140625, -0.227142333984375, -0.2128143310546875, -0.198486328125, -0.1841583251953125, -0.169830322265625, -0.1555023193359375, -0.14117431640625, -0.1268463134765625, -0.112518310546875, -0.0981903076171875, -0.0838623046875, -0.0695343017578125, -0.055206298828125, -0.0408782958984375, -0.02655029296875, -0.0122222900390625, 0.002105712890625, 0.0164337158203125, 0.03076171875, 0.0450897216796875, 0.059417724609375, 0.0737457275390625, 0.08807373046875, 0.1024017333984375, 0.116729736328125, 0.1310577392578125, 0.1453857421875, 0.1597137451171875, 0.174041748046875, 0.1883697509765625, 0.20269775390625, 0.2170257568359375, 0.231353759765625, 0.2456817626953125, 0.260009765625, 0.2743377685546875, 0.288665771484375, 0.3029937744140625, 0.31732177734375, 0.3316497802734375, 0.345977783203125, 0.3603057861328125, 0.3746337890625, 0.3889617919921875, 0.403289794921875, 0.4176177978515625, 0.43194580078125, 0.4462738037109375, 0.460601806640625, 0.4749298095703125, 0.4892578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 13.0, 14.0, 13.0, 21.0, 29.0, 44.0, 95.0, 143.0, 216.0, 303.0, 633.0, 940.0, 698.0, 346.0, 185.0, 122.0, 97.0, 57.0, 44.0, 21.0, 8.0, 9.0, 10.0, 10.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.595703125, -0.5816993713378906, -0.5676956176757812, -0.5536918640136719, -0.5396881103515625, -0.5256843566894531, -0.5116806030273438, -0.4976768493652344, -0.483673095703125, -0.4696693420410156, -0.45566558837890625, -0.4416618347167969, -0.4276580810546875, -0.4136543273925781, -0.39965057373046875, -0.3856468200683594, -0.37164306640625, -0.3576393127441406, -0.34363555908203125, -0.3296318054199219, -0.3156280517578125, -0.3016242980957031, -0.28762054443359375, -0.2736167907714844, -0.259613037109375, -0.24560928344726562, -0.23160552978515625, -0.21760177612304688, -0.2035980224609375, -0.18959426879882812, -0.17559051513671875, -0.16158676147460938, -0.1475830078125, -0.13357925415039062, -0.11957550048828125, -0.10557174682617188, -0.0915679931640625, -0.07756423950195312, -0.06356048583984375, -0.049556732177734375, -0.035552978515625, -0.021549224853515625, -0.00754547119140625, 0.006458282470703125, 0.0204620361328125, 0.034465789794921875, 0.04846954345703125, 0.062473297119140625, 0.07647705078125, 0.09048080444335938, 0.10448455810546875, 0.11848831176757812, 0.1324920654296875, 0.14649581909179688, 0.16049957275390625, 0.17450332641601562, 0.188507080078125, 0.20251083374023438, 0.21651458740234375, 0.23051834106445312, 0.2445220947265625, 0.2585258483886719, 0.27252960205078125, 0.2865333557128906, 0.300537109375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 12.0, 32.0, 44.0, 48.0, 87.0, 129.0, 125.0, 153.0, 134.0, 94.0, 63.0, 36.0, 17.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5302045345306396, -2.459735631942749, -2.3892664909362793, -2.3187975883483887, -2.248328685760498, -2.1778595447540283, -2.1073906421661377, -2.036921739578247, -1.9664525985717773, -1.8959835767745972, -1.8255146741867065, -1.7550456523895264, -1.6845766305923462, -1.614107608795166, -1.5436387062072754, -1.4731696844100952, -1.4027007818222046, -1.3322317600250244, -1.2617628574371338, -1.1912938356399536, -1.1208248138427734, -1.0503559112548828, -0.9798868894577026, -0.9094178676605225, -0.8389489054679871, -0.7684799432754517, -0.6980109214782715, -0.6275419592857361, -0.5570729970932007, -0.4866039752960205, -0.4161350131034851, -0.3456660211086273, -0.27519702911376953, -0.20472803711891174, -0.13425906002521515, -0.06379008293151855, 0.006678909063339233, 0.07714790105819702, 0.14761686325073242, 0.2180858552455902, 0.288554847240448, 0.3590238392353058, 0.4294928312301636, 0.499961793422699, 0.5704307556152344, 0.6408997774124146, 0.71136873960495, 0.7818377017974854, 0.8523067235946655, 0.9227756857872009, 0.9932447075843811, 1.0637136697769165, 1.1341826915740967, 1.2046515941619873, 1.2751206159591675, 1.3455896377563477, 1.4160585403442383, 1.4865275621414185, 1.556996464729309, 1.6274654865264893, 1.6979345083236694, 1.7684035301208496, 1.8388724327087402, 1.9093414545059204, 1.9798104763031006]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 4.0, 6.0, 9.0, 11.0, 8.0, 16.0, 22.0, 15.0, 21.0, 18.0, 14.0, 28.0, 26.0, 22.0, 32.0, 27.0, 36.0, 44.0, 43.0, 39.0, 40.0, 37.0, 46.0, 37.0, 43.0, 41.0, 30.0, 37.0, 25.0, 27.0, 28.0, 21.0, 18.0, 17.0, 15.0, 15.0, 11.0, 14.0, 15.0, 1.0, 9.0, 3.0, 8.0, 5.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.9195284247398376, -0.8909602761268616, -0.8623921275138855, -0.8338240385055542, -0.8052558898925781, -0.776687741279602, -0.748119592666626, -0.7195514440536499, -0.6909832954406738, -0.6624151468276978, -0.6338469982147217, -0.6052788496017456, -0.5767107605934143, -0.5481426119804382, -0.5195744633674622, -0.4910063147544861, -0.4624382257461548, -0.4338700771331787, -0.405301958322525, -0.37673380970954895, -0.34816569089889526, -0.3195975422859192, -0.2910293936729431, -0.26246124505996704, -0.23389312624931335, -0.20532499253749847, -0.1767568588256836, -0.14818871021270752, -0.11962057650089264, -0.09105244278907776, -0.062484294176101685, -0.033916160464286804, -0.0053479671478271484, 0.02322017028927803, 0.05178830772638321, 0.08035644888877869, 0.10892458260059357, 0.13749271631240845, 0.16606086492538452, 0.1946289986371994, 0.22319713234901428, 0.25176528096199036, 0.28033339977264404, 0.3089015483856201, 0.3374696969985962, 0.3660378158092499, 0.39460596442222595, 0.42317408323287964, 0.4517422318458557, 0.4803103804588318, 0.5088785290718079, 0.5374466180801392, 0.5660147666931152, 0.5945829153060913, 0.6231510639190674, 0.6517192125320435, 0.6802873611450195, 0.7088555097579956, 0.7374236583709717, 0.7659918069839478, 0.794559895992279, 0.8231280446052551, 0.8516961932182312, 0.8802643418312073, 0.9088324308395386]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 7.0, 3.0, 8.0, 15.0, 12.0, 19.0, 35.0, 53.0, 78.0, 117.0, 185.0, 338.0, 584.0, 1055.0, 1844.0, 3171.0, 5722.0, 9951.0, 17516.0, 32010.0, 77926.0, 313031.0, 397359.0, 103721.0, 37453.0, 19871.0, 11340.0, 6431.0, 3643.0, 2135.0, 1232.0, 674.0, 393.0, 216.0, 146.0, 82.0, 45.0, 49.0, 18.0, 19.0, 10.0, 7.0, 8.0, 9.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.2958984375, -0.2863883972167969, -0.27687835693359375, -0.2673683166503906, -0.2578582763671875, -0.24834823608398438, -0.23883819580078125, -0.22932815551757812, -0.219818115234375, -0.21030807495117188, -0.20079803466796875, -0.19128799438476562, -0.1817779541015625, -0.17226791381835938, -0.16275787353515625, -0.15324783325195312, -0.14373779296875, -0.13422775268554688, -0.12471771240234375, -0.11520767211914062, -0.1056976318359375, -0.09618759155273438, -0.08667755126953125, -0.07716751098632812, -0.067657470703125, -0.058147430419921875, -0.04863739013671875, -0.039127349853515625, -0.0296173095703125, -0.020107269287109375, -0.01059722900390625, -0.001087188720703125, 0.0084228515625, 0.017932891845703125, 0.02744293212890625, 0.036952972412109375, 0.0464630126953125, 0.055973052978515625, 0.06548309326171875, 0.07499313354492188, 0.084503173828125, 0.09401321411132812, 0.10352325439453125, 0.11303329467773438, 0.1225433349609375, 0.13205337524414062, 0.14156341552734375, 0.15107345581054688, 0.16058349609375, 0.17009353637695312, 0.17960357666015625, 0.18911361694335938, 0.1986236572265625, 0.20813369750976562, 0.21764373779296875, 0.22715377807617188, 0.236663818359375, 0.24617385864257812, 0.25568389892578125, 0.2651939392089844, 0.2747039794921875, 0.2842140197753906, 0.29372406005859375, 0.3032341003417969, 0.312744140625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 4.0, 7.0, 8.0, 11.0, 13.0, 12.0, 16.0, 14.0, 29.0, 19.0, 33.0, 34.0, 44.0, 46.0, 39.0, 53.0, 46.0, 52.0, 54.0, 48.0, 47.0, 37.0, 55.0, 39.0, 41.0, 23.0, 28.0, 23.0, 24.0, 29.0, 17.0, 9.0, 8.0, 9.0, 6.0, 5.0, 5.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1380615234375, -0.1335010528564453, -0.12894058227539062, -0.12438011169433594, -0.11981964111328125, -0.11525917053222656, -0.11069869995117188, -0.10613822937011719, -0.1015777587890625, -0.09701728820800781, -0.09245681762695312, -0.08789634704589844, -0.08333587646484375, -0.07877540588378906, -0.07421493530273438, -0.06965446472167969, -0.065093994140625, -0.06053352355957031, -0.055973052978515625, -0.05141258239746094, -0.04685211181640625, -0.04229164123535156, -0.037731170654296875, -0.03317070007324219, -0.0286102294921875, -0.024049758911132812, -0.019489288330078125, -0.014928817749023438, -0.01036834716796875, -0.0058078765869140625, -0.001247406005859375, 0.0033130645751953125, 0.00787353515625, 0.012434005737304688, 0.016994476318359375, 0.021554946899414062, 0.02611541748046875, 0.030675888061523438, 0.035236358642578125, 0.03979682922363281, 0.0443572998046875, 0.04891777038574219, 0.053478240966796875, 0.05803871154785156, 0.06259918212890625, 0.06715965270996094, 0.07172012329101562, 0.07628059387207031, 0.080841064453125, 0.08540153503417969, 0.08996200561523438, 0.09452247619628906, 0.09908294677734375, 0.10364341735839844, 0.10820388793945312, 0.11276435852050781, 0.1173248291015625, 0.12188529968261719, 0.12644577026367188, 0.13100624084472656, 0.13556671142578125, 0.14012718200683594, 0.14468765258789062, 0.1492481231689453, 0.15380859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 8.0, 5.0, 9.0, 15.0, 32.0, 38.0, 61.0, 84.0, 117.0, 209.0, 383.0, 714.0, 1450.0, 3300.0, 7921.0, 19961.0, 67136.0, 581249.0, 298226.0, 41920.0, 14600.0, 6029.0, 2578.0, 1153.0, 550.0, 318.0, 148.0, 104.0, 60.0, 41.0, 34.0, 25.0, 10.0, 11.0, 18.0, 11.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4619140625, -0.4447021484375, -0.427490234375, -0.4102783203125, -0.39306640625, -0.3758544921875, -0.358642578125, -0.3414306640625, -0.32421875, -0.3070068359375, -0.289794921875, -0.2725830078125, -0.25537109375, -0.2381591796875, -0.220947265625, -0.2037353515625, -0.1865234375, -0.1693115234375, -0.152099609375, -0.1348876953125, -0.11767578125, -0.1004638671875, -0.083251953125, -0.0660400390625, -0.048828125, -0.0316162109375, -0.014404296875, 0.0028076171875, 0.02001953125, 0.0372314453125, 0.054443359375, 0.0716552734375, 0.0888671875, 0.1060791015625, 0.123291015625, 0.1405029296875, 0.15771484375, 0.1749267578125, 0.192138671875, 0.2093505859375, 0.2265625, 0.2437744140625, 0.260986328125, 0.2781982421875, 0.29541015625, 0.3126220703125, 0.329833984375, 0.3470458984375, 0.3642578125, 0.3814697265625, 0.398681640625, 0.4158935546875, 0.43310546875, 0.4503173828125, 0.467529296875, 0.4847412109375, 0.501953125, 0.5191650390625, 0.536376953125, 0.5535888671875, 0.57080078125, 0.5880126953125, 0.605224609375, 0.6224365234375, 0.6396484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 8.0, 3.0, 6.0, 15.0, 11.0, 16.0, 15.0, 26.0, 21.0, 28.0, 35.0, 37.0, 46.0, 52.0, 58.0, 62.0, 61.0, 49.0, 58.0, 48.0, 45.0, 44.0, 39.0, 45.0, 28.0, 37.0, 25.0, 21.0, 12.0, 10.0, 6.0, 10.0, 6.0, 4.0, 11.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.556640625, -0.539947509765625, -0.52325439453125, -0.506561279296875, -0.4898681640625, -0.473175048828125, -0.45648193359375, -0.439788818359375, -0.423095703125, -0.406402587890625, -0.38970947265625, -0.373016357421875, -0.3563232421875, -0.339630126953125, -0.32293701171875, -0.306243896484375, -0.28955078125, -0.272857666015625, -0.25616455078125, -0.239471435546875, -0.2227783203125, -0.206085205078125, -0.18939208984375, -0.172698974609375, -0.156005859375, -0.139312744140625, -0.12261962890625, -0.105926513671875, -0.0892333984375, -0.072540283203125, -0.05584716796875, -0.039154052734375, -0.0224609375, -0.005767822265625, 0.01092529296875, 0.027618408203125, 0.0443115234375, 0.061004638671875, 0.07769775390625, 0.094390869140625, 0.111083984375, 0.127777099609375, 0.14447021484375, 0.161163330078125, 0.1778564453125, 0.194549560546875, 0.21124267578125, 0.227935791015625, 0.24462890625, 0.261322021484375, 0.27801513671875, 0.294708251953125, 0.3114013671875, 0.328094482421875, 0.34478759765625, 0.361480712890625, 0.378173828125, 0.394866943359375, 0.41156005859375, 0.428253173828125, 0.4449462890625, 0.461639404296875, 0.47833251953125, 0.495025634765625, 0.51171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 13.0, 7.0, 13.0, 20.0, 27.0, 42.0, 65.0, 95.0, 136.0, 253.0, 353.0, 537.0, 812.0, 1264.0, 2082.0, 3584.0, 5706.0, 9358.0, 16596.0, 29515.0, 58130.0, 148712.0, 409029.0, 208166.0, 72191.0, 35058.0, 18821.0, 10947.0, 6548.0, 3848.0, 2458.0, 1530.0, 906.0, 591.0, 403.0, 247.0, 154.0, 113.0, 59.0, 53.0, 17.0, 24.0, 21.0, 15.0, 12.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.11041259765625, -0.10702896118164062, -0.10364532470703125, -0.10026168823242188, -0.0968780517578125, -0.09349441528320312, -0.09011077880859375, -0.08672714233398438, -0.083343505859375, -0.07995986938476562, -0.07657623291015625, -0.07319259643554688, -0.0698089599609375, -0.06642532348632812, -0.06304168701171875, -0.059658050537109375, -0.0562744140625, -0.052890777587890625, -0.04950714111328125, -0.046123504638671875, -0.0427398681640625, -0.039356231689453125, -0.03597259521484375, -0.032588958740234375, -0.029205322265625, -0.025821685791015625, -0.02243804931640625, -0.019054412841796875, -0.0156707763671875, -0.012287139892578125, -0.00890350341796875, -0.005519866943359375, -0.00213623046875, 0.001247406005859375, 0.00463104248046875, 0.008014678955078125, 0.0113983154296875, 0.014781951904296875, 0.01816558837890625, 0.021549224853515625, 0.024932861328125, 0.028316497802734375, 0.03170013427734375, 0.035083770751953125, 0.0384674072265625, 0.041851043701171875, 0.04523468017578125, 0.048618316650390625, 0.052001953125, 0.055385589599609375, 0.05876922607421875, 0.062152862548828125, 0.0655364990234375, 0.06892013549804688, 0.07230377197265625, 0.07568740844726562, 0.079071044921875, 0.08245468139648438, 0.08583831787109375, 0.08922195434570312, 0.0926055908203125, 0.09598922729492188, 0.09937286376953125, 0.10275650024414062, 0.10614013671875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 7.0, 12.0, 8.0, 8.0, 16.0, 11.0, 11.0, 31.0, 23.0, 69.0, 102.0, 142.0, 205.0, 143.0, 60.0, 38.0, 27.0, 11.0, 16.0, 7.0, 8.0, 10.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.3392181396484375e-05, -4.17931005358696e-05, -4.019401967525482e-05, -3.8594938814640045e-05, -3.699585795402527e-05, -3.539677709341049e-05, -3.3797696232795715e-05, -3.219861537218094e-05, -3.059953451156616e-05, -2.9000453650951385e-05, -2.740137279033661e-05, -2.5802291929721832e-05, -2.4203211069107056e-05, -2.260413020849228e-05, -2.1005049347877502e-05, -1.9405968487262726e-05, -1.780688762664795e-05, -1.6207806766033173e-05, -1.4608725905418396e-05, -1.300964504480362e-05, -1.1410564184188843e-05, -9.811483323574066e-06, -8.21240246295929e-06, -6.613321602344513e-06, -5.014240741729736e-06, -3.4151598811149597e-06, -1.816079020500183e-06, -2.169981598854065e-07, 1.3820827007293701e-06, 2.9811635613441467e-06, 4.580244421958923e-06, 6.1793252825737e-06, 7.778406143188477e-06, 9.377487003803253e-06, 1.097656786441803e-05, 1.2575648725032806e-05, 1.4174729585647583e-05, 1.577381044626236e-05, 1.7372891306877136e-05, 1.8971972167491913e-05, 2.057105302810669e-05, 2.2170133888721466e-05, 2.3769214749336243e-05, 2.536829560995102e-05, 2.6967376470565796e-05, 2.8566457331180573e-05, 3.016553819179535e-05, 3.1764619052410126e-05, 3.33636999130249e-05, 3.496278077363968e-05, 3.6561861634254456e-05, 3.816094249486923e-05, 3.976002335548401e-05, 4.1359104216098785e-05, 4.295818507671356e-05, 4.455726593732834e-05, 4.6156346797943115e-05, 4.775542765855789e-05, 4.935450851917267e-05, 5.0953589379787445e-05, 5.255267024040222e-05, 5.4151751101017e-05, 5.5750831961631775e-05, 5.734991282224655e-05, 5.894899368286133e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 7.0, 16.0, 19.0, 22.0, 43.0, 41.0, 84.0, 77.0, 150.0, 241.0, 360.0, 603.0, 1047.0, 1993.0, 4175.0, 8686.0, 18173.0, 38937.0, 92833.0, 271978.0, 368347.0, 139012.0, 53526.0, 24582.0, 11739.0, 5661.0, 2839.0, 1442.0, 702.0, 451.0, 237.0, 163.0, 121.0, 69.0, 47.0, 39.0, 16.0, 22.0, 15.0, 11.0, 7.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.11474609375, -0.11118221282958984, -0.10761833190917969, -0.10405445098876953, -0.10049057006835938, -0.09692668914794922, -0.09336280822753906, -0.0897989273071289, -0.08623504638671875, -0.0826711654663086, -0.07910728454589844, -0.07554340362548828, -0.07197952270507812, -0.06841564178466797, -0.06485176086425781, -0.061287879943847656, -0.0577239990234375, -0.054160118103027344, -0.05059623718261719, -0.04703235626220703, -0.043468475341796875, -0.03990459442138672, -0.03634071350097656, -0.032776832580566406, -0.02921295166015625, -0.025649070739746094, -0.022085189819335938, -0.01852130889892578, -0.014957427978515625, -0.011393547058105469, -0.007829666137695312, -0.004265785217285156, -0.000701904296875, 0.0028619766235351562, 0.0064258575439453125, 0.009989738464355469, 0.013553619384765625, 0.01711750030517578, 0.020681381225585938, 0.024245262145996094, 0.02780914306640625, 0.031373023986816406, 0.03493690490722656, 0.03850078582763672, 0.042064666748046875, 0.04562854766845703, 0.04919242858886719, 0.052756309509277344, 0.0563201904296875, 0.059884071350097656, 0.06344795227050781, 0.06701183319091797, 0.07057571411132812, 0.07413959503173828, 0.07770347595214844, 0.0812673568725586, 0.08483123779296875, 0.0883951187133789, 0.09195899963378906, 0.09552288055419922, 0.09908676147460938, 0.10265064239501953, 0.10621452331542969, 0.10977840423583984, 0.11334228515625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 10.0, 5.0, 3.0, 3.0, 6.0, 16.0, 10.0, 16.0, 28.0, 32.0, 34.0, 54.0, 65.0, 82.0, 82.0, 96.0, 110.0, 78.0, 61.0, 44.0, 34.0, 22.0, 22.0, 14.0, 9.0, 8.0, 8.0, 14.0, 4.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.168701171875, -0.1643085479736328, -0.15991592407226562, -0.15552330017089844, -0.15113067626953125, -0.14673805236816406, -0.14234542846679688, -0.1379528045654297, -0.1335601806640625, -0.1291675567626953, -0.12477493286132812, -0.12038230895996094, -0.11598968505859375, -0.11159706115722656, -0.10720443725585938, -0.10281181335449219, -0.098419189453125, -0.09402656555175781, -0.08963394165039062, -0.08524131774902344, -0.08084869384765625, -0.07645606994628906, -0.07206344604492188, -0.06767082214355469, -0.0632781982421875, -0.05888557434082031, -0.054492950439453125, -0.05010032653808594, -0.04570770263671875, -0.04131507873535156, -0.036922454833984375, -0.03252983093261719, -0.02813720703125, -0.023744583129882812, -0.019351959228515625, -0.014959335327148438, -0.01056671142578125, -0.0061740875244140625, -0.001781463623046875, 0.0026111602783203125, 0.0070037841796875, 0.011396408081054688, 0.015789031982421875, 0.020181655883789062, 0.02457427978515625, 0.028966903686523438, 0.033359527587890625, 0.03775215148925781, 0.042144775390625, 0.04653739929199219, 0.050930023193359375, 0.05532264709472656, 0.05971527099609375, 0.06410789489746094, 0.06850051879882812, 0.07289314270019531, 0.0772857666015625, 0.08167839050292969, 0.08607101440429688, 0.09046363830566406, 0.09485626220703125, 0.09924888610839844, 0.10364151000976562, 0.10803413391113281, 0.1124267578125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 13.0, 37.0, 64.0, 119.0, 149.0, 190.0, 173.0, 113.0, 57.0, 38.0, 16.0, 11.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.663025140762329, -2.5725982189178467, -2.4821712970733643, -2.391744375228882, -2.3013172149658203, -2.210890293121338, -2.1204633712768555, -2.030036449432373, -1.9396095275878906, -1.8491826057434082, -1.7587556838989258, -1.6683286428451538, -1.5779017210006714, -1.487474799156189, -1.397047758102417, -1.3066208362579346, -1.2161939144134521, -1.1257669925689697, -1.0353400707244873, -0.9449130296707153, -0.8544861078262329, -0.7640591859817505, -0.6736322045326233, -0.5832052230834961, -0.49277830123901367, -0.40235134959220886, -0.31192439794540405, -0.22149744629859924, -0.13107049465179443, -0.040643543004989624, 0.049783408641815186, 0.14021039009094238, 0.2306370735168457, 0.3210640251636505, 0.4114909768104553, 0.5019179582595825, 0.5923448801040649, 0.6827718019485474, 0.7731987833976746, 0.8636257648468018, 0.9540526866912842, 1.0444796085357666, 1.134906530380249, 1.225333571434021, 1.3157604932785034, 1.4061874151229858, 1.4966144561767578, 1.5870413780212402, 1.6774682998657227, 1.767895221710205, 1.8583221435546875, 1.9487491846084595, 2.0391759872436523, 2.129603147506714, 2.2200300693511963, 2.3104569911956787, 2.400883913040161, 2.4913108348846436, 2.581737756729126, 2.6721646785736084, 2.76259183883667, 2.8530187606811523, 2.9434456825256348, 3.033872604370117, 3.1242995262145996]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 6.0, 1.0, 8.0, 10.0, 11.0, 11.0, 13.0, 13.0, 16.0, 13.0, 19.0, 18.0, 32.0, 37.0, 38.0, 25.0, 37.0, 43.0, 43.0, 38.0, 47.0, 29.0, 38.0, 44.0, 42.0, 40.0, 38.0, 26.0, 33.0, 38.0, 25.0, 27.0, 28.0, 20.0, 15.0, 17.0, 13.0, 11.0, 10.0, 16.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.254845142364502, -1.2192962169647217, -1.1837472915649414, -1.1481983661651611, -1.1126494407653809, -1.0771005153656006, -1.0415515899658203, -1.0060027837753296, -0.9704538583755493, -0.934904932975769, -0.8993560075759888, -0.8638070821762085, -0.828258216381073, -0.7927092909812927, -0.7571603655815125, -0.7216114401817322, -0.6860625147819519, -0.6505135893821716, -0.6149646639823914, -0.5794157981872559, -0.5438668727874756, -0.5083179473876953, -0.47276902198791504, -0.43722009658813477, -0.4016712009906769, -0.3661222755908966, -0.3305733799934387, -0.29502445459365845, -0.2594755291938782, -0.2239266335964203, -0.18837770819664001, -0.15282879769802094, -0.11727988719940186, -0.08173097670078278, -0.0461820587515831, -0.010633140802383423, 0.024915769696235657, 0.060464680194854736, 0.09601360559463501, 0.1315625160932541, 0.16711142659187317, 0.20266033709049225, 0.23820924758911133, 0.2737581729888916, 0.3093070983886719, 0.34485599398612976, 0.38040491938591003, 0.4159538149833679, 0.4515027403831482, 0.48705166578292847, 0.5226005911827087, 0.5581494569778442, 0.5936983823776245, 0.6292473077774048, 0.6647962331771851, 0.7003451585769653, 0.7358940839767456, 0.7714430093765259, 0.8069919347763062, 0.8425408601760864, 0.8780897259712219, 0.9136386513710022, 0.9491875767707825, 0.9847365021705627, 1.0202853679656982]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 11.0, 19.0, 33.0, 55.0, 74.0, 116.0, 224.0, 372.0, 782.0, 1335.0, 2810.0, 5942.0, 13682.0, 31872.0, 79055.0, 221849.0, 760038.0, 1766394.0, 889425.0, 262015.0, 92797.0, 36555.0, 15643.0, 6887.0, 3196.0, 1463.0, 748.0, 418.0, 188.0, 122.0, 63.0, 30.0, 23.0, 19.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2301025390625, -0.22397804260253906, -0.21785354614257812, -0.2117290496826172, -0.20560455322265625, -0.1994800567626953, -0.19335556030273438, -0.18723106384277344, -0.1811065673828125, -0.17498207092285156, -0.16885757446289062, -0.1627330780029297, -0.15660858154296875, -0.1504840850830078, -0.14435958862304688, -0.13823509216308594, -0.132110595703125, -0.12598609924316406, -0.11986160278320312, -0.11373710632324219, -0.10761260986328125, -0.10148811340332031, -0.09536361694335938, -0.08923912048339844, -0.0831146240234375, -0.07699012756347656, -0.07086563110351562, -0.06474113464355469, -0.05861663818359375, -0.05249214172363281, -0.046367645263671875, -0.04024314880371094, -0.03411865234375, -0.027994155883789062, -0.021869659423828125, -0.015745162963867188, -0.00962066650390625, -0.0034961700439453125, 0.002628326416015625, 0.008752822875976562, 0.0148773193359375, 0.021001815795898438, 0.027126312255859375, 0.03325080871582031, 0.03937530517578125, 0.04549980163574219, 0.051624298095703125, 0.05774879455566406, 0.063873291015625, 0.06999778747558594, 0.07612228393554688, 0.08224678039550781, 0.08837127685546875, 0.09449577331542969, 0.10062026977539062, 0.10674476623535156, 0.1128692626953125, 0.11899375915527344, 0.12511825561523438, 0.1312427520751953, 0.13736724853515625, 0.1434917449951172, 0.14961624145507812, 0.15574073791503906, 0.161865234375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 11.0, 6.0, 10.0, 9.0, 10.0, 16.0, 21.0, 19.0, 23.0, 35.0, 25.0, 34.0, 29.0, 35.0, 45.0, 42.0, 56.0, 56.0, 51.0, 40.0, 41.0, 46.0, 42.0, 40.0, 36.0, 37.0, 37.0, 17.0, 16.0, 14.0, 21.0, 18.0, 15.0, 10.0, 13.0, 9.0, 4.0, 4.0, 4.0, 2.0, 3.0], "bins": [-0.1878662109375, -0.18329715728759766, -0.1787281036376953, -0.17415904998779297, -0.16958999633789062, -0.16502094268798828, -0.16045188903808594, -0.1558828353881836, -0.15131378173828125, -0.1467447280883789, -0.14217567443847656, -0.13760662078857422, -0.13303756713867188, -0.12846851348876953, -0.12389945983886719, -0.11933040618896484, -0.1147613525390625, -0.11019229888916016, -0.10562324523925781, -0.10105419158935547, -0.09648513793945312, -0.09191608428955078, -0.08734703063964844, -0.0827779769897461, -0.07820892333984375, -0.0736398696899414, -0.06907081604003906, -0.06450176239013672, -0.059932708740234375, -0.05536365509033203, -0.05079460144042969, -0.046225547790527344, -0.041656494140625, -0.037087440490722656, -0.03251838684082031, -0.02794933319091797, -0.023380279541015625, -0.01881122589111328, -0.014242172241210938, -0.009673118591308594, -0.00510406494140625, -0.0005350112915039062, 0.0040340423583984375, 0.008603096008300781, 0.013172149658203125, 0.01774120330810547, 0.022310256958007812, 0.026879310607910156, 0.0314483642578125, 0.036017417907714844, 0.04058647155761719, 0.04515552520751953, 0.049724578857421875, 0.05429363250732422, 0.05886268615722656, 0.0634317398071289, 0.06800079345703125, 0.0725698471069336, 0.07713890075683594, 0.08170795440673828, 0.08627700805664062, 0.09084606170654297, 0.09541511535644531, 0.09998416900634766, 0.10455322265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 8.0, 1.0, 6.0, 15.0, 25.0, 33.0, 40.0, 65.0, 97.0, 160.0, 271.0, 493.0, 889.0, 1914.0, 4890.0, 15944.0, 68064.0, 384735.0, 2620131.0, 918965.0, 136174.0, 28182.0, 7682.0, 2805.0, 1178.0, 618.0, 350.0, 203.0, 99.0, 71.0, 59.0, 36.0, 30.0, 18.0, 12.0, 3.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.413818359375, -0.3988838195800781, -0.38394927978515625, -0.3690147399902344, -0.3540802001953125, -0.3391456604003906, -0.32421112060546875, -0.3092765808105469, -0.294342041015625, -0.2794075012207031, -0.26447296142578125, -0.24953842163085938, -0.2346038818359375, -0.21966934204101562, -0.20473480224609375, -0.18980026245117188, -0.17486572265625, -0.15993118286132812, -0.14499664306640625, -0.13006210327148438, -0.1151275634765625, -0.10019302368164062, -0.08525848388671875, -0.07032394409179688, -0.055389404296875, -0.040454864501953125, -0.02552032470703125, -0.010585784912109375, 0.0043487548828125, 0.019283294677734375, 0.03421783447265625, 0.049152374267578125, 0.0640869140625, 0.07902145385742188, 0.09395599365234375, 0.10889053344726562, 0.1238250732421875, 0.13875961303710938, 0.15369415283203125, 0.16862869262695312, 0.183563232421875, 0.19849777221679688, 0.21343231201171875, 0.22836685180664062, 0.2433013916015625, 0.2582359313964844, 0.27317047119140625, 0.2881050109863281, 0.30303955078125, 0.3179740905761719, 0.33290863037109375, 0.3478431701660156, 0.3627777099609375, 0.3777122497558594, 0.39264678955078125, 0.4075813293457031, 0.422515869140625, 0.4374504089355469, 0.45238494873046875, 0.4673194885253906, 0.4822540283203125, 0.4971885681152344, 0.5121231079101562, 0.5270576477050781, 0.5419921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 11.0, 15.0, 17.0, 23.0, 29.0, 50.0, 66.0, 104.0, 137.0, 223.0, 354.0, 616.0, 800.0, 600.0, 330.0, 225.0, 155.0, 114.0, 73.0, 54.0, 31.0, 14.0, 13.0, 13.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55126953125, -0.5361518859863281, -0.5210342407226562, -0.5059165954589844, -0.4907989501953125, -0.4756813049316406, -0.46056365966796875, -0.4454460144042969, -0.430328369140625, -0.4152107238769531, -0.40009307861328125, -0.3849754333496094, -0.3698577880859375, -0.3547401428222656, -0.33962249755859375, -0.3245048522949219, -0.30938720703125, -0.2942695617675781, -0.27915191650390625, -0.2640342712402344, -0.2489166259765625, -0.23379898071289062, -0.21868133544921875, -0.20356369018554688, -0.188446044921875, -0.17332839965820312, -0.15821075439453125, -0.14309310913085938, -0.1279754638671875, -0.11285781860351562, -0.09774017333984375, -0.08262252807617188, -0.0675048828125, -0.052387237548828125, -0.03726959228515625, -0.022151947021484375, -0.0070343017578125, 0.008083343505859375, 0.02320098876953125, 0.038318634033203125, 0.053436279296875, 0.06855392456054688, 0.08367156982421875, 0.09878921508789062, 0.1139068603515625, 0.12902450561523438, 0.14414215087890625, 0.15925979614257812, 0.17437744140625, 0.18949508666992188, 0.20461273193359375, 0.21973037719726562, 0.2348480224609375, 0.24996566772460938, 0.26508331298828125, 0.2802009582519531, 0.295318603515625, 0.3104362487792969, 0.32555389404296875, 0.3406715393066406, 0.3557891845703125, 0.3709068298339844, 0.38602447509765625, 0.4011421203613281, 0.416259765625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 12.0, 23.0, 56.0, 101.0, 149.0, 196.0, 180.0, 124.0, 73.0, 37.0, 25.0, 8.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9030795097351074, -2.798339605331421, -2.6935997009277344, -2.588859796524048, -2.4841198921203613, -2.3793797492980957, -2.2746400833129883, -2.1698999404907227, -2.065160036087036, -1.9604201316833496, -1.855680227279663, -1.7509403228759766, -1.6462002992630005, -1.541460394859314, -1.4367204904556274, -1.3319804668426514, -1.2272406816482544, -1.1225007772445679, -1.0177608728408813, -0.91302090883255, -0.8082809448242188, -0.7035410404205322, -0.5988011360168457, -0.4940611720085144, -0.3893212676048279, -0.28458133339881897, -0.17984141409397125, -0.07510149478912354, 0.029638439416885376, 0.1343783736228943, 0.2391182780265808, 0.3438582420349121, 0.44859814643859863, 0.5533380508422852, 0.6580780148506165, 0.762817919254303, 0.8675578832626343, 0.9722977876663208, 1.0770376920700073, 1.1817777156829834, 1.28651762008667, 1.3912575244903564, 1.495997428894043, 1.6007373332977295, 1.7054773569107056, 1.810217261314392, 1.9149571657180786, 2.0196971893310547, 2.124436855316162, 2.2291767597198486, 2.333916664123535, 2.4386565685272217, 2.543396472930908, 2.648136615753174, 2.7528762817382812, 2.857616424560547, 2.9623563289642334, 3.06709623336792, 3.1718361377716064, 3.276576042175293, 3.3813159465789795, 3.486055850982666, 3.5907959938049316, 3.695535898208618, 3.8002758026123047]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 6.0, 11.0, 11.0, 9.0, 13.0, 12.0, 19.0, 16.0, 18.0, 17.0, 22.0, 20.0, 30.0, 28.0, 34.0, 39.0, 36.0, 49.0, 47.0, 45.0, 39.0, 35.0, 30.0, 36.0, 32.0, 40.0, 38.0, 27.0, 28.0, 18.0, 27.0, 28.0, 21.0, 18.0, 14.0, 10.0, 15.0, 7.0, 8.0, 5.0, 7.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9802557826042175, -0.9464905261993408, -0.9127253293991089, -0.8789600729942322, -0.8451948761940002, -0.8114296197891235, -0.7776644229888916, -0.7438991665840149, -0.7101339101791382, -0.6763686537742615, -0.6426034569740295, -0.6088382005691528, -0.5750730037689209, -0.5413077473640442, -0.5075424909591675, -0.47377729415893555, -0.4400120973587036, -0.4062468707561493, -0.37248164415359497, -0.33871638774871826, -0.30495119094848633, -0.2711859345436096, -0.2374207079410553, -0.20365548133850098, -0.16989025473594666, -0.13612502813339233, -0.10235979408025742, -0.0685945600271225, -0.034829333424568176, -0.001064106822013855, 0.03270113468170166, 0.06646636128425598, 0.10023164749145508, 0.1339968740940094, 0.16776210069656372, 0.20152734220027924, 0.23529256880283356, 0.2690578103065491, 0.3028230369091034, 0.3365882635116577, 0.37035349011421204, 0.40411871671676636, 0.4378839433193207, 0.471649169921875, 0.5054144263267517, 0.5391796231269836, 0.5729448795318604, 0.6067100763320923, 0.640475332736969, 0.6742405891418457, 0.7080057859420776, 0.7417710423469543, 0.7755362391471863, 0.809301495552063, 0.8430666923522949, 0.8768319487571716, 0.9105972051620483, 0.944362461566925, 0.978127658367157, 1.0118929147720337, 1.0456581115722656, 1.0794233083724976, 1.113188624382019, 1.146953821182251, 1.180719017982483]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 8.0, 15.0, 23.0, 20.0, 40.0, 61.0, 79.0, 141.0, 212.0, 330.0, 571.0, 847.0, 1520.0, 2559.0, 4409.0, 7874.0, 14485.0, 26984.0, 56398.0, 141540.0, 342971.0, 261100.0, 96722.0, 41947.0, 21306.0, 11212.0, 6446.0, 3545.0, 2028.0, 1167.0, 708.0, 473.0, 294.0, 165.0, 111.0, 95.0, 54.0, 36.0, 22.0, 17.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.30322265625, -0.2936897277832031, -0.28415679931640625, -0.2746238708496094, -0.2650909423828125, -0.2555580139160156, -0.24602508544921875, -0.23649215698242188, -0.226959228515625, -0.21742630004882812, -0.20789337158203125, -0.19836044311523438, -0.1888275146484375, -0.17929458618164062, -0.16976165771484375, -0.16022872924804688, -0.15069580078125, -0.14116287231445312, -0.13162994384765625, -0.12209701538085938, -0.1125640869140625, -0.10303115844726562, -0.09349822998046875, -0.08396530151367188, -0.074432373046875, -0.06489944458007812, -0.05536651611328125, -0.045833587646484375, -0.0363006591796875, -0.026767730712890625, -0.01723480224609375, -0.007701873779296875, 0.0018310546875, 0.011363983154296875, 0.02089691162109375, 0.030429840087890625, 0.0399627685546875, 0.049495697021484375, 0.05902862548828125, 0.06856155395507812, 0.078094482421875, 0.08762741088867188, 0.09716033935546875, 0.10669326782226562, 0.1162261962890625, 0.12575912475585938, 0.13529205322265625, 0.14482498168945312, 0.15435791015625, 0.16389083862304688, 0.17342376708984375, 0.18295669555664062, 0.1924896240234375, 0.20202255249023438, 0.21155548095703125, 0.22108840942382812, 0.230621337890625, 0.24015426635742188, 0.24968719482421875, 0.2592201232910156, 0.2687530517578125, 0.2782859802246094, 0.28781890869140625, 0.2973518371582031, 0.306884765625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 6.0, 4.0, 9.0, 8.0, 7.0, 13.0, 12.0, 9.0, 19.0, 18.0, 25.0, 33.0, 28.0, 33.0, 43.0, 36.0, 33.0, 53.0, 49.0, 39.0, 44.0, 42.0, 49.0, 50.0, 48.0, 46.0, 31.0, 37.0, 23.0, 26.0, 23.0, 18.0, 13.0, 9.0, 10.0, 12.0, 8.0, 9.0, 4.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.1815185546875, -0.1764965057373047, -0.17147445678710938, -0.16645240783691406, -0.16143035888671875, -0.15640830993652344, -0.15138626098632812, -0.1463642120361328, -0.1413421630859375, -0.1363201141357422, -0.13129806518554688, -0.12627601623535156, -0.12125396728515625, -0.11623191833496094, -0.11120986938476562, -0.10618782043457031, -0.101165771484375, -0.09614372253417969, -0.09112167358398438, -0.08609962463378906, -0.08107757568359375, -0.07605552673339844, -0.07103347778320312, -0.06601142883300781, -0.0609893798828125, -0.05596733093261719, -0.050945281982421875, -0.04592323303222656, -0.04090118408203125, -0.03587913513183594, -0.030857086181640625, -0.025835037231445312, -0.02081298828125, -0.015790939331054688, -0.010768890380859375, -0.0057468414306640625, -0.00072479248046875, 0.0042972564697265625, 0.009319305419921875, 0.014341354370117188, 0.0193634033203125, 0.024385452270507812, 0.029407501220703125, 0.03442955017089844, 0.03945159912109375, 0.04447364807128906, 0.049495697021484375, 0.05451774597167969, 0.059539794921875, 0.06456184387207031, 0.06958389282226562, 0.07460594177246094, 0.07962799072265625, 0.08465003967285156, 0.08967208862304688, 0.09469413757324219, 0.0997161865234375, 0.10473823547363281, 0.10976028442382812, 0.11478233337402344, 0.11980438232421875, 0.12482643127441406, 0.12984848022460938, 0.1348705291748047, 0.139892578125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 4.0, 10.0, 21.0, 26.0, 49.0, 55.0, 77.0, 145.0, 218.0, 430.0, 812.0, 1600.0, 3705.0, 9746.0, 30362.0, 152243.0, 672667.0, 132208.0, 28203.0, 9098.0, 3447.0, 1612.0, 783.0, 380.0, 244.0, 121.0, 93.0, 53.0, 31.0, 31.0, 23.0, 12.0, 9.0, 6.0, 4.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.66455078125, -0.641998291015625, -0.61944580078125, -0.596893310546875, -0.5743408203125, -0.551788330078125, -0.52923583984375, -0.506683349609375, -0.484130859375, -0.461578369140625, -0.43902587890625, -0.416473388671875, -0.3939208984375, -0.371368408203125, -0.34881591796875, -0.326263427734375, -0.3037109375, -0.281158447265625, -0.25860595703125, -0.236053466796875, -0.2135009765625, -0.190948486328125, -0.16839599609375, -0.145843505859375, -0.123291015625, -0.100738525390625, -0.07818603515625, -0.055633544921875, -0.0330810546875, -0.010528564453125, 0.01202392578125, 0.034576416015625, 0.05712890625, 0.079681396484375, 0.10223388671875, 0.124786376953125, 0.1473388671875, 0.169891357421875, 0.19244384765625, 0.214996337890625, 0.237548828125, 0.260101318359375, 0.28265380859375, 0.305206298828125, 0.3277587890625, 0.350311279296875, 0.37286376953125, 0.395416259765625, 0.41796875, 0.440521240234375, 0.46307373046875, 0.485626220703125, 0.5081787109375, 0.530731201171875, 0.55328369140625, 0.575836181640625, 0.598388671875, 0.620941162109375, 0.64349365234375, 0.666046142578125, 0.6885986328125, 0.711151123046875, 0.73370361328125, 0.756256103515625, 0.77880859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 5.0, 4.0, 7.0, 8.0, 4.0, 8.0, 11.0, 14.0, 15.0, 26.0, 17.0, 36.0, 35.0, 36.0, 37.0, 41.0, 48.0, 52.0, 53.0, 65.0, 52.0, 50.0, 54.0, 50.0, 36.0, 38.0, 36.0, 30.0, 32.0, 20.0, 16.0, 15.0, 12.0, 9.0, 7.0, 1.0, 5.0, 3.0, 4.0, 6.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.541015625, -0.5224609375, -0.50390625, -0.4853515625, -0.466796875, -0.4482421875, -0.4296875, -0.4111328125, -0.392578125, -0.3740234375, -0.35546875, -0.3369140625, -0.318359375, -0.2998046875, -0.28125, -0.2626953125, -0.244140625, -0.2255859375, -0.20703125, -0.1884765625, -0.169921875, -0.1513671875, -0.1328125, -0.1142578125, -0.095703125, -0.0771484375, -0.05859375, -0.0400390625, -0.021484375, -0.0029296875, 0.015625, 0.0341796875, 0.052734375, 0.0712890625, 0.08984375, 0.1083984375, 0.126953125, 0.1455078125, 0.1640625, 0.1826171875, 0.201171875, 0.2197265625, 0.23828125, 0.2568359375, 0.275390625, 0.2939453125, 0.3125, 0.3310546875, 0.349609375, 0.3681640625, 0.38671875, 0.4052734375, 0.423828125, 0.4423828125, 0.4609375, 0.4794921875, 0.498046875, 0.5166015625, 0.53515625, 0.5537109375, 0.572265625, 0.5908203125, 0.609375, 0.6279296875, 0.646484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 9.0, 4.0, 4.0, 7.0, 7.0, 12.0, 25.0, 34.0, 60.0, 87.0, 128.0, 237.0, 418.0, 672.0, 1250.0, 2208.0, 4020.0, 7489.0, 14341.0, 29056.0, 64393.0, 187013.0, 460129.0, 162554.0, 58755.0, 26699.0, 13317.0, 6958.0, 3797.0, 2062.0, 1165.0, 681.0, 359.0, 223.0, 151.0, 86.0, 53.0, 41.0, 15.0, 11.0, 5.0, 13.0, 10.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1434326171875, -0.13820648193359375, -0.1329803466796875, -0.12775421142578125, -0.122528076171875, -0.11730194091796875, -0.1120758056640625, -0.10684967041015625, -0.10162353515625, -0.09639739990234375, -0.0911712646484375, -0.08594512939453125, -0.080718994140625, -0.07549285888671875, -0.0702667236328125, -0.06504058837890625, -0.059814453125, -0.05458831787109375, -0.0493621826171875, -0.04413604736328125, -0.038909912109375, -0.03368377685546875, -0.0284576416015625, -0.02323150634765625, -0.01800537109375, -0.01277923583984375, -0.0075531005859375, -0.00232696533203125, 0.002899169921875, 0.00812530517578125, 0.0133514404296875, 0.01857757568359375, 0.0238037109375, 0.02902984619140625, 0.0342559814453125, 0.03948211669921875, 0.044708251953125, 0.04993438720703125, 0.0551605224609375, 0.06038665771484375, 0.06561279296875, 0.07083892822265625, 0.0760650634765625, 0.08129119873046875, 0.086517333984375, 0.09174346923828125, 0.0969696044921875, 0.10219573974609375, 0.107421875, 0.11264801025390625, 0.1178741455078125, 0.12310028076171875, 0.128326416015625, 0.13355255126953125, 0.1387786865234375, 0.14400482177734375, 0.14923095703125, 0.15445709228515625, 0.1596832275390625, 0.16490936279296875, 0.170135498046875, 0.17536163330078125, 0.1805877685546875, 0.18581390380859375, 0.1910400390625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 7.0, 5.0, 2.0, 10.0, 8.0, 20.0, 28.0, 24.0, 41.0, 42.0, 71.0, 111.0, 170.0, 141.0, 93.0, 52.0, 36.0, 35.0, 9.0, 17.0, 18.0, 12.0, 7.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9948692321777344e-05, -4.8073939979076385e-05, -4.619918763637543e-05, -4.432443529367447e-05, -4.244968295097351e-05, -4.057493060827255e-05, -3.8700178265571594e-05, -3.6825425922870636e-05, -3.495067358016968e-05, -3.307592123746872e-05, -3.120116889476776e-05, -2.9326416552066803e-05, -2.7451664209365845e-05, -2.5576911866664886e-05, -2.3702159523963928e-05, -2.182740718126297e-05, -1.9952654838562012e-05, -1.8077902495861053e-05, -1.6203150153160095e-05, -1.4328397810459137e-05, -1.2453645467758179e-05, -1.057889312505722e-05, -8.704140782356262e-06, -6.829388439655304e-06, -4.954636096954346e-06, -3.0798837542533875e-06, -1.2051314115524292e-06, 6.69620931148529e-07, 2.5443732738494873e-06, 4.4191256165504456e-06, 6.293877959251404e-06, 8.168630301952362e-06, 1.004338264465332e-05, 1.1918134987354279e-05, 1.3792887330055237e-05, 1.5667639672756195e-05, 1.7542392015457153e-05, 1.941714435815811e-05, 2.129189670085907e-05, 2.3166649043560028e-05, 2.5041401386260986e-05, 2.6916153728961945e-05, 2.8790906071662903e-05, 3.066565841436386e-05, 3.254041075706482e-05, 3.441516309976578e-05, 3.6289915442466736e-05, 3.8164667785167694e-05, 4.003942012786865e-05, 4.191417247056961e-05, 4.378892481327057e-05, 4.566367715597153e-05, 4.7538429498672485e-05, 4.9413181841373444e-05, 5.12879341840744e-05, 5.316268652677536e-05, 5.503743886947632e-05, 5.6912191212177277e-05, 5.8786943554878235e-05, 6.066169589757919e-05, 6.253644824028015e-05, 6.441120058298111e-05, 6.628595292568207e-05, 6.816070526838303e-05, 7.003545761108398e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 6.0, 7.0, 22.0, 28.0, 38.0, 38.0, 99.0, 135.0, 209.0, 360.0, 667.0, 1432.0, 3021.0, 7535.0, 21071.0, 65769.0, 289174.0, 491760.0, 114363.0, 33160.0, 11427.0, 4320.0, 1865.0, 854.0, 473.0, 281.0, 165.0, 81.0, 49.0, 44.0, 34.0, 21.0, 13.0, 6.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2269287109375, -0.2200946807861328, -0.21326065063476562, -0.20642662048339844, -0.19959259033203125, -0.19275856018066406, -0.18592453002929688, -0.1790904998779297, -0.1722564697265625, -0.1654224395751953, -0.15858840942382812, -0.15175437927246094, -0.14492034912109375, -0.13808631896972656, -0.13125228881835938, -0.12441825866699219, -0.117584228515625, -0.11075019836425781, -0.10391616821289062, -0.09708213806152344, -0.09024810791015625, -0.08341407775878906, -0.07658004760742188, -0.06974601745605469, -0.0629119873046875, -0.05607795715332031, -0.049243927001953125, -0.04240989685058594, -0.03557586669921875, -0.028741836547851562, -0.021907806396484375, -0.015073776245117188, -0.00823974609375, -0.0014057159423828125, 0.005428314208984375, 0.012262344360351562, 0.01909637451171875, 0.025930404663085938, 0.032764434814453125, 0.03959846496582031, 0.0464324951171875, 0.05326652526855469, 0.060100555419921875, 0.06693458557128906, 0.07376861572265625, 0.08060264587402344, 0.08743667602539062, 0.09427070617675781, 0.101104736328125, 0.10793876647949219, 0.11477279663085938, 0.12160682678222656, 0.12844085693359375, 0.13527488708496094, 0.14210891723632812, 0.1489429473876953, 0.1557769775390625, 0.1626110076904297, 0.16944503784179688, 0.17627906799316406, 0.18311309814453125, 0.18994712829589844, 0.19678115844726562, 0.2036151885986328, 0.21044921875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 5.0, 4.0, 3.0, 9.0, 7.0, 14.0, 7.0, 11.0, 17.0, 17.0, 26.0, 36.0, 46.0, 54.0, 69.0, 80.0, 87.0, 84.0, 87.0, 69.0, 55.0, 41.0, 31.0, 28.0, 22.0, 21.0, 16.0, 8.0, 9.0, 12.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1385498046875, -0.13326644897460938, -0.12798309326171875, -0.12269973754882812, -0.1174163818359375, -0.11213302612304688, -0.10684967041015625, -0.10156631469726562, -0.096282958984375, -0.09099960327148438, -0.08571624755859375, -0.08043289184570312, -0.0751495361328125, -0.06986618041992188, -0.06458282470703125, -0.059299468994140625, -0.05401611328125, -0.048732757568359375, -0.04344940185546875, -0.038166046142578125, -0.0328826904296875, -0.027599334716796875, -0.02231597900390625, -0.017032623291015625, -0.011749267578125, -0.006465911865234375, -0.00118255615234375, 0.004100799560546875, 0.0093841552734375, 0.014667510986328125, 0.01995086669921875, 0.025234222412109375, 0.030517578125, 0.035800933837890625, 0.04108428955078125, 0.046367645263671875, 0.0516510009765625, 0.056934356689453125, 0.06221771240234375, 0.06750106811523438, 0.072784423828125, 0.07806777954101562, 0.08335113525390625, 0.08863449096679688, 0.0939178466796875, 0.09920120239257812, 0.10448455810546875, 0.10976791381835938, 0.11505126953125, 0.12033462524414062, 0.12561798095703125, 0.13090133666992188, 0.1361846923828125, 0.14146804809570312, 0.14675140380859375, 0.15203475952148438, 0.157318115234375, 0.16260147094726562, 0.16788482666015625, 0.17316818237304688, 0.1784515380859375, 0.18373489379882812, 0.18901824951171875, 0.19430160522460938, 0.1995849609375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 10.0, 26.0, 51.0, 100.0, 167.0, 189.0, 174.0, 130.0, 72.0, 33.0, 19.0, 11.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6679210662841797, -2.5510668754577637, -2.4342126846313477, -2.3173584938049316, -2.2005043029785156, -2.0836501121520996, -1.966795802116394, -1.849941611289978, -1.733087420463562, -1.616233229637146, -1.49937903881073, -1.3825247287750244, -1.2656705379486084, -1.1488163471221924, -1.0319621562957764, -0.9151079654693604, -0.7982537746429443, -0.6813995838165283, -0.5645453929901123, -0.4476911425590515, -0.3308369517326355, -0.21398276090621948, -0.09712851047515869, 0.019725680351257324, 0.13657987117767334, 0.25343406200408936, 0.37028828263282776, 0.48714250326156616, 0.6039966940879822, 0.7208508849143982, 0.837705135345459, 0.954559326171875, 1.071413516998291, 1.188267707824707, 1.305121898651123, 1.421976089477539, 1.538830280303955, 1.655684471130371, 1.7725387811660767, 1.8893929719924927, 2.006247043609619, 2.123101234436035, 2.239955425262451, 2.356809616088867, 2.473663806915283, 2.590517997741699, 2.7073721885681152, 2.8242263793945312, 2.9410808086395264, 3.0579349994659424, 3.1747891902923584, 3.2916433811187744, 3.4084975719451904, 3.5253517627716064, 3.6422061920166016, 3.7590603828430176, 3.8759145736694336, 3.9927687644958496, 4.109622955322266, 4.226477146148682, 4.343331336975098, 4.460185527801514, 4.57703971862793, 4.693893909454346, 4.810748100280762]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 7.0, 8.0, 10.0, 12.0, 10.0, 23.0, 17.0, 25.0, 16.0, 29.0, 31.0, 40.0, 38.0, 42.0, 34.0, 49.0, 42.0, 46.0, 46.0, 59.0, 45.0, 47.0, 40.0, 43.0, 26.0, 38.0, 29.0, 30.0, 18.0, 13.0, 15.0, 24.0, 11.0, 7.0, 4.0, 6.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1940765380859375, -1.1514370441436768, -1.108797550201416, -1.0661580562591553, -1.023518443107605, -0.9808789491653442, -0.9382394552230835, -0.8955999612808228, -0.8529604077339172, -0.8103209137916565, -0.767681360244751, -0.7250418663024902, -0.6824023723602295, -0.639762818813324, -0.5971233248710632, -0.5544837713241577, -0.511844277381897, -0.46920475363731384, -0.4265652298927307, -0.38392573595046997, -0.34128621220588684, -0.2986466884613037, -0.25600719451904297, -0.21336767077445984, -0.1707281470298767, -0.12808862328529358, -0.08544911444187164, -0.04280960559844971, -0.00017008185386657715, 0.04246944189071655, 0.0851089358329773, 0.12774845957756042, 0.17038798332214355, 0.21302750706672668, 0.2556670308113098, 0.29830652475357056, 0.3409460484981537, 0.3835855722427368, 0.42622506618499756, 0.4688645899295807, 0.5115041136741638, 0.5541436076164246, 0.5967831611633301, 0.6394226551055908, 0.6820621490478516, 0.7247017025947571, 0.7673411965370178, 0.8099807500839233, 0.8526202440261841, 0.8952597379684448, 0.9378992915153503, 0.9805387854576111, 1.0231783390045166, 1.0658178329467773, 1.108457326889038, 1.1510968208312988, 1.1937363147735596, 1.2363758087158203, 1.279015302658081, 1.3216547966003418, 1.364294409751892, 1.4069339036941528, 1.4495733976364136, 1.4922128915786743, 1.5348525047302246]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 4.0, 5.0, 7.0, 16.0, 16.0, 13.0, 36.0, 43.0, 70.0, 114.0, 172.0, 325.0, 547.0, 1067.0, 2169.0, 4920.0, 12402.0, 35932.0, 126108.0, 574099.0, 2177728.0, 982409.0, 196702.0, 51431.0, 16377.0, 6122.0, 2601.0, 1265.0, 693.0, 324.0, 193.0, 127.0, 73.0, 56.0, 31.0, 25.0, 14.0, 8.0, 6.0, 10.0, 3.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27294921875, -0.2637443542480469, -0.25453948974609375, -0.24533462524414062, -0.2361297607421875, -0.22692489624023438, -0.21772003173828125, -0.20851516723632812, -0.199310302734375, -0.19010543823242188, -0.18090057373046875, -0.17169570922851562, -0.1624908447265625, -0.15328598022460938, -0.14408111572265625, -0.13487625122070312, -0.12567138671875, -0.11646652221679688, -0.10726165771484375, -0.09805679321289062, -0.0888519287109375, -0.07964706420898438, -0.07044219970703125, -0.061237335205078125, -0.052032470703125, -0.042827606201171875, -0.03362274169921875, -0.024417877197265625, -0.0152130126953125, -0.006008148193359375, 0.00319671630859375, 0.012401580810546875, 0.0216064453125, 0.030811309814453125, 0.04001617431640625, 0.049221038818359375, 0.0584259033203125, 0.06763076782226562, 0.07683563232421875, 0.08604049682617188, 0.095245361328125, 0.10445022583007812, 0.11365509033203125, 0.12285995483398438, 0.1320648193359375, 0.14126968383789062, 0.15047454833984375, 0.15967941284179688, 0.16888427734375, 0.17808914184570312, 0.18729400634765625, 0.19649887084960938, 0.2057037353515625, 0.21490859985351562, 0.22411346435546875, 0.23331832885742188, 0.242523193359375, 0.2517280578613281, 0.26093292236328125, 0.2701377868652344, 0.2793426513671875, 0.2885475158691406, 0.29775238037109375, 0.3069572448730469, 0.316162109375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 6.0, 7.0, 14.0, 10.0, 9.0, 8.0, 18.0, 22.0, 19.0, 21.0, 36.0, 26.0, 35.0, 36.0, 40.0, 45.0, 54.0, 42.0, 49.0, 39.0, 35.0, 45.0, 40.0, 33.0, 33.0, 43.0, 20.0, 30.0, 25.0, 16.0, 16.0, 27.0, 17.0, 17.0, 5.0, 13.0, 8.0, 7.0, 4.0, 5.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1500244140625, -0.1452198028564453, -0.14041519165039062, -0.13561058044433594, -0.13080596923828125, -0.12600135803222656, -0.12119674682617188, -0.11639213562011719, -0.1115875244140625, -0.10678291320800781, -0.10197830200195312, -0.09717369079589844, -0.09236907958984375, -0.08756446838378906, -0.08275985717773438, -0.07795524597167969, -0.073150634765625, -0.06834602355957031, -0.06354141235351562, -0.05873680114746094, -0.05393218994140625, -0.04912757873535156, -0.044322967529296875, -0.03951835632324219, -0.0347137451171875, -0.029909133911132812, -0.025104522705078125, -0.020299911499023438, -0.01549530029296875, -0.010690689086914062, -0.005886077880859375, -0.0010814666748046875, 0.00372314453125, 0.008527755737304688, 0.013332366943359375, 0.018136978149414062, 0.02294158935546875, 0.027746200561523438, 0.032550811767578125, 0.03735542297363281, 0.0421600341796875, 0.04696464538574219, 0.051769256591796875, 0.05657386779785156, 0.06137847900390625, 0.06618309020996094, 0.07098770141601562, 0.07579231262207031, 0.080596923828125, 0.08540153503417969, 0.09020614624023438, 0.09501075744628906, 0.09981536865234375, 0.10461997985839844, 0.10942459106445312, 0.11422920227050781, 0.1190338134765625, 0.12383842468261719, 0.12864303588867188, 0.13344764709472656, 0.13825225830078125, 0.14305686950683594, 0.14786148071289062, 0.1526660919189453, 0.157470703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 2.0, 5.0, 6.0, 4.0, 12.0, 20.0, 20.0, 35.0, 36.0, 56.0, 81.0, 134.0, 275.0, 567.0, 1213.0, 3223.0, 10885.0, 68548.0, 1591558.0, 2410642.0, 88037.0, 12695.0, 3630.0, 1275.0, 612.0, 280.0, 147.0, 98.0, 53.0, 27.0, 30.0, 20.0, 18.0, 14.0, 6.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.90185546875, -0.8718490600585938, -0.8418426513671875, -0.8118362426757812, -0.781829833984375, -0.7518234252929688, -0.7218170166015625, -0.6918106079101562, -0.66180419921875, -0.6317977905273438, -0.6017913818359375, -0.5717849731445312, -0.541778564453125, -0.5117721557617188, -0.4817657470703125, -0.45175933837890625, -0.4217529296875, -0.39174652099609375, -0.3617401123046875, -0.33173370361328125, -0.301727294921875, -0.27172088623046875, -0.2417144775390625, -0.21170806884765625, -0.18170166015625, -0.15169525146484375, -0.1216888427734375, -0.09168243408203125, -0.061676025390625, -0.03166961669921875, -0.0016632080078125, 0.02834320068359375, 0.058349609375, 0.08835601806640625, 0.1183624267578125, 0.14836883544921875, 0.178375244140625, 0.20838165283203125, 0.2383880615234375, 0.26839447021484375, 0.29840087890625, 0.32840728759765625, 0.3584136962890625, 0.38842010498046875, 0.418426513671875, 0.44843292236328125, 0.4784393310546875, 0.5084457397460938, 0.5384521484375, 0.5684585571289062, 0.5984649658203125, 0.6284713745117188, 0.658477783203125, 0.6884841918945312, 0.7184906005859375, 0.7484970092773438, 0.77850341796875, 0.8085098266601562, 0.8385162353515625, 0.8685226440429688, 0.898529052734375, 0.9285354614257812, 0.9585418701171875, 0.9885482788085938, 1.0185546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 11.0, 21.0, 30.0, 62.0, 91.0, 192.0, 325.0, 755.0, 1287.0, 659.0, 307.0, 155.0, 70.0, 46.0, 29.0, 9.0, 9.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1357421875, -1.1089706420898438, -1.0821990966796875, -1.0554275512695312, -1.028656005859375, -1.0018844604492188, -0.9751129150390625, -0.9483413696289062, -0.92156982421875, -0.8947982788085938, -0.8680267333984375, -0.8412551879882812, -0.814483642578125, -0.7877120971679688, -0.7609405517578125, -0.7341690063476562, -0.7073974609375, -0.6806259155273438, -0.6538543701171875, -0.6270828247070312, -0.600311279296875, -0.5735397338867188, -0.5467681884765625, -0.5199966430664062, -0.49322509765625, -0.46645355224609375, -0.4396820068359375, -0.41291046142578125, -0.386138916015625, -0.35936737060546875, -0.3325958251953125, -0.30582427978515625, -0.279052734375, -0.25228118896484375, -0.2255096435546875, -0.19873809814453125, -0.171966552734375, -0.14519500732421875, -0.1184234619140625, -0.09165191650390625, -0.06488037109375, -0.03810882568359375, -0.0113372802734375, 0.01543426513671875, 0.042205810546875, 0.06897735595703125, 0.0957489013671875, 0.12252044677734375, 0.1492919921875, 0.17606353759765625, 0.2028350830078125, 0.22960662841796875, 0.256378173828125, 0.28314971923828125, 0.3099212646484375, 0.33669281005859375, 0.36346435546875, 0.39023590087890625, 0.4170074462890625, 0.44377899169921875, 0.470550537109375, 0.49732208251953125, 0.5240936279296875, 0.5508651733398438, 0.57763671875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 7.0, 11.0, 21.0, 45.0, 65.0, 131.0, 157.0, 165.0, 158.0, 110.0, 70.0, 21.0, 14.0, 9.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.241469383239746, -6.104079246520996, -5.966689586639404, -5.829299449920654, -5.6919097900390625, -5.5545196533203125, -5.4171295166015625, -5.279739856719971, -5.142349720001221, -5.004959583282471, -4.867569923400879, -4.730179786682129, -4.592789649963379, -4.455399990081787, -4.318009853363037, -4.180620193481445, -4.043230056762695, -3.9058401584625244, -3.7684502601623535, -3.6310601234436035, -3.4936702251434326, -3.3562803268432617, -3.2188901901245117, -3.081500291824341, -2.94411039352417, -2.806720495223999, -2.669330596923828, -2.531940460205078, -2.3945505619049072, -2.2571606636047363, -2.1197705268859863, -1.9823806285858154, -1.8449907302856445, -1.7076008319854736, -1.5702108144760132, -1.4328207969665527, -1.2954308986663818, -1.158041000366211, -1.0206509828567505, -0.8832610249519348, -0.7458710670471191, -0.6084811091423035, -0.4710911512374878, -0.3337011933326721, -0.19631123542785645, -0.05892127752304077, 0.0784686803817749, 0.21585863828659058, 0.35324859619140625, 0.4906385540962219, 0.6280285120010376, 0.7654184699058533, 0.902808427810669, 1.0401983261108398, 1.1775883436203003, 1.3149783611297607, 1.4523682594299316, 1.5897581577301025, 1.727148175239563, 1.8645381927490234, 2.0019280910491943, 2.1393179893493652, 2.2767081260681152, 2.414098024368286, 2.551487922668457]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 9.0, 6.0, 14.0, 9.0, 11.0, 13.0, 21.0, 29.0, 18.0, 21.0, 31.0, 19.0, 27.0, 33.0, 39.0, 37.0, 32.0, 43.0, 41.0, 43.0, 32.0, 30.0, 47.0, 46.0, 29.0, 42.0, 29.0, 37.0, 28.0, 28.0, 9.0, 19.0, 20.0, 19.0, 16.0, 9.0, 10.0, 8.0, 14.0, 9.0, 5.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2509021759033203, -1.2080273628234863, -1.1651525497436523, -1.1222777366638184, -1.0794029235839844, -1.03652822971344, -0.993653416633606, -0.950778603553772, -0.907903790473938, -0.865028977394104, -0.82215416431427, -0.7792794108390808, -0.7364045977592468, -0.6935297846794128, -0.6506550312042236, -0.6077802181243896, -0.5649054050445557, -0.5220305919647217, -0.4791558086872101, -0.4362810254096985, -0.3934062123298645, -0.3505313992500305, -0.3076566159725189, -0.2647818326950073, -0.22190701961517334, -0.17903222143650055, -0.13615742325782776, -0.09328262507915497, -0.05040782690048218, -0.007533028721809387, 0.0353417694568634, 0.078216552734375, 0.12109136581420898, 0.16396616399288177, 0.20684096217155457, 0.24971576035022736, 0.29259055852890015, 0.33546537160873413, 0.3783401548862457, 0.4212149381637573, 0.4640897512435913, 0.5069645643234253, 0.5498393774032593, 0.5927141308784485, 0.6355889439582825, 0.6784637570381165, 0.7213385105133057, 0.7642133235931396, 0.8070881366729736, 0.8499629497528076, 0.8928377628326416, 0.9357125163078308, 0.9785873293876648, 1.021462082862854, 1.064336895942688, 1.107211709022522, 1.150086522102356, 1.19296133518219, 1.235836148262024, 1.278710961341858, 1.3215856552124023, 1.3644604682922363, 1.4073352813720703, 1.4502100944519043, 1.4930849075317383]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 10.0, 16.0, 30.0, 41.0, 67.0, 115.0, 217.0, 370.0, 688.0, 1408.0, 3055.0, 7280.0, 20885.0, 77673.0, 289393.0, 426563.0, 159512.0, 40089.0, 12206.0, 4728.0, 2056.0, 969.0, 523.0, 273.0, 129.0, 90.0, 55.0, 31.0, 15.0, 15.0, 13.0, 8.0, 10.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.432373046875, -0.41854095458984375, -0.4047088623046875, -0.39087677001953125, -0.377044677734375, -0.36321258544921875, -0.3493804931640625, -0.33554840087890625, -0.32171630859375, -0.30788421630859375, -0.2940521240234375, -0.28022003173828125, -0.266387939453125, -0.25255584716796875, -0.2387237548828125, -0.22489166259765625, -0.2110595703125, -0.19722747802734375, -0.1833953857421875, -0.16956329345703125, -0.155731201171875, -0.14189910888671875, -0.1280670166015625, -0.11423492431640625, -0.10040283203125, -0.08657073974609375, -0.0727386474609375, -0.05890655517578125, -0.045074462890625, -0.03124237060546875, -0.0174102783203125, -0.00357818603515625, 0.01025390625, 0.02408599853515625, 0.0379180908203125, 0.05175018310546875, 0.065582275390625, 0.07941436767578125, 0.0932464599609375, 0.10707855224609375, 0.12091064453125, 0.13474273681640625, 0.1485748291015625, 0.16240692138671875, 0.176239013671875, 0.19007110595703125, 0.2039031982421875, 0.21773529052734375, 0.2315673828125, 0.24539947509765625, 0.2592315673828125, 0.27306365966796875, 0.286895751953125, 0.30072784423828125, 0.3145599365234375, 0.32839202880859375, 0.34222412109375, 0.35605621337890625, 0.3698883056640625, 0.38372039794921875, 0.397552490234375, 0.41138458251953125, 0.4252166748046875, 0.43904876708984375, 0.452880859375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 7.0, 7.0, 11.0, 18.0, 13.0, 9.0, 22.0, 16.0, 24.0, 24.0, 26.0, 27.0, 34.0, 35.0, 32.0, 49.0, 37.0, 50.0, 35.0, 33.0, 35.0, 38.0, 38.0, 34.0, 39.0, 35.0, 31.0, 34.0, 30.0, 27.0, 16.0, 20.0, 10.0, 19.0, 20.0, 13.0, 10.0, 6.0, 3.0, 6.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.1795654296875, -0.17431259155273438, -0.16905975341796875, -0.16380691528320312, -0.1585540771484375, -0.15330123901367188, -0.14804840087890625, -0.14279556274414062, -0.137542724609375, -0.13228988647460938, -0.12703704833984375, -0.12178421020507812, -0.1165313720703125, -0.11127853393554688, -0.10602569580078125, -0.10077285766601562, -0.09552001953125, -0.09026718139648438, -0.08501434326171875, -0.07976150512695312, -0.0745086669921875, -0.06925582885742188, -0.06400299072265625, -0.058750152587890625, -0.053497314453125, -0.048244476318359375, -0.04299163818359375, -0.037738800048828125, -0.0324859619140625, -0.027233123779296875, -0.02198028564453125, -0.016727447509765625, -0.011474609375, -0.006221771240234375, -0.00096893310546875, 0.004283905029296875, 0.0095367431640625, 0.014789581298828125, 0.02004241943359375, 0.025295257568359375, 0.030548095703125, 0.035800933837890625, 0.04105377197265625, 0.046306610107421875, 0.0515594482421875, 0.056812286376953125, 0.06206512451171875, 0.06731796264648438, 0.07257080078125, 0.07782363891601562, 0.08307647705078125, 0.08832931518554688, 0.0935821533203125, 0.09883499145507812, 0.10408782958984375, 0.10934066772460938, 0.114593505859375, 0.11984634399414062, 0.12509918212890625, 0.13035202026367188, 0.1356048583984375, 0.14085769653320312, 0.14611053466796875, 0.15136337280273438, 0.1566162109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 7.0, 10.0, 16.0, 25.0, 35.0, 73.0, 149.0, 305.0, 684.0, 1655.0, 4915.0, 17382.0, 74259.0, 342551.0, 453863.0, 116445.0, 25156.0, 7115.0, 2349.0, 863.0, 334.0, 158.0, 81.0, 36.0, 25.0, 13.0, 16.0, 4.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453369140625, -0.4366645812988281, -0.41996002197265625, -0.4032554626464844, -0.3865509033203125, -0.3698463439941406, -0.35314178466796875, -0.3364372253417969, -0.319732666015625, -0.3030281066894531, -0.28632354736328125, -0.2696189880371094, -0.2529144287109375, -0.23620986938476562, -0.21950531005859375, -0.20280075073242188, -0.18609619140625, -0.16939163208007812, -0.15268707275390625, -0.13598251342773438, -0.1192779541015625, -0.10257339477539062, -0.08586883544921875, -0.06916427612304688, -0.052459716796875, -0.035755157470703125, -0.01905059814453125, -0.002346038818359375, 0.0143585205078125, 0.031063079833984375, 0.04776763916015625, 0.06447219848632812, 0.0811767578125, 0.09788131713867188, 0.11458587646484375, 0.13129043579101562, 0.1479949951171875, 0.16469955444335938, 0.18140411376953125, 0.19810867309570312, 0.214813232421875, 0.23151779174804688, 0.24822235107421875, 0.2649269104003906, 0.2816314697265625, 0.2983360290527344, 0.31504058837890625, 0.3317451477050781, 0.34844970703125, 0.3651542663574219, 0.38185882568359375, 0.3985633850097656, 0.4152679443359375, 0.4319725036621094, 0.44867706298828125, 0.4653816223144531, 0.482086181640625, 0.4987907409667969, 0.5154953002929688, 0.5321998596191406, 0.5489044189453125, 0.5656089782714844, 0.5823135375976562, 0.5990180969238281, 0.61572265625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 7.0, 12.0, 3.0, 16.0, 13.0, 16.0, 14.0, 22.0, 28.0, 19.0, 30.0, 44.0, 38.0, 45.0, 48.0, 51.0, 52.0, 41.0, 49.0, 36.0, 39.0, 51.0, 49.0, 31.0, 27.0, 38.0, 30.0, 30.0, 22.0, 19.0, 20.0, 12.0, 10.0, 13.0, 2.0, 5.0, 1.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56591796875, -0.5464859008789062, -0.5270538330078125, -0.5076217651367188, -0.488189697265625, -0.46875762939453125, -0.4493255615234375, -0.42989349365234375, -0.41046142578125, -0.39102935791015625, -0.3715972900390625, -0.35216522216796875, -0.332733154296875, -0.31330108642578125, -0.2938690185546875, -0.27443695068359375, -0.2550048828125, -0.23557281494140625, -0.2161407470703125, -0.19670867919921875, -0.177276611328125, -0.15784454345703125, -0.1384124755859375, -0.11898040771484375, -0.09954833984375, -0.08011627197265625, -0.0606842041015625, -0.04125213623046875, -0.021820068359375, -0.00238800048828125, 0.0170440673828125, 0.03647613525390625, 0.055908203125, 0.07534027099609375, 0.0947723388671875, 0.11420440673828125, 0.133636474609375, 0.15306854248046875, 0.1725006103515625, 0.19193267822265625, 0.21136474609375, 0.23079681396484375, 0.2502288818359375, 0.26966094970703125, 0.289093017578125, 0.30852508544921875, 0.3279571533203125, 0.34738922119140625, 0.3668212890625, 0.38625335693359375, 0.4056854248046875, 0.42511749267578125, 0.444549560546875, 0.46398162841796875, 0.4834136962890625, 0.5028457641601562, 0.52227783203125, 0.5417098999023438, 0.5611419677734375, 0.5805740356445312, 0.600006103515625, 0.6194381713867188, 0.6388702392578125, 0.6583023071289062, 0.677734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 18.0, 18.0, 28.0, 42.0, 72.0, 116.0, 191.0, 321.0, 530.0, 1016.0, 1835.0, 3721.0, 7628.0, 17017.0, 43313.0, 135000.0, 388760.0, 300624.0, 91115.0, 31741.0, 12969.0, 6079.0, 2925.0, 1491.0, 831.0, 459.0, 270.0, 160.0, 90.0, 56.0, 43.0, 27.0, 16.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.267822265625, -0.2603492736816406, -0.25287628173828125, -0.24540328979492188, -0.2379302978515625, -0.23045730590820312, -0.22298431396484375, -0.21551132202148438, -0.208038330078125, -0.20056533813476562, -0.19309234619140625, -0.18561935424804688, -0.1781463623046875, -0.17067337036132812, -0.16320037841796875, -0.15572738647460938, -0.14825439453125, -0.14078140258789062, -0.13330841064453125, -0.12583541870117188, -0.1183624267578125, -0.11088943481445312, -0.10341644287109375, -0.09594345092773438, -0.088470458984375, -0.08099746704101562, -0.07352447509765625, -0.06605148315429688, -0.0585784912109375, -0.051105499267578125, -0.04363250732421875, -0.036159515380859375, -0.0286865234375, -0.021213531494140625, -0.01374053955078125, -0.006267547607421875, 0.0012054443359375, 0.008678436279296875, 0.01615142822265625, 0.023624420166015625, 0.031097412109375, 0.038570404052734375, 0.04604339599609375, 0.053516387939453125, 0.0609893798828125, 0.06846237182617188, 0.07593536376953125, 0.08340835571289062, 0.09088134765625, 0.09835433959960938, 0.10582733154296875, 0.11330032348632812, 0.1207733154296875, 0.12824630737304688, 0.13571929931640625, 0.14319229125976562, 0.150665283203125, 0.15813827514648438, 0.16561126708984375, 0.17308425903320312, 0.1805572509765625, 0.18803024291992188, 0.19550323486328125, 0.20297622680664062, 0.21044921875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 9.0, 10.0, 2.0, 8.0, 18.0, 24.0, 37.0, 56.0, 75.0, 97.0, 114.0, 137.0, 134.0, 90.0, 47.0, 31.0, 34.0, 29.0, 13.0, 14.0, 10.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.449222564697266e-05, -6.221514195203781e-05, -5.9938058257102966e-05, -5.766097456216812e-05, -5.5383890867233276e-05, -5.310680717229843e-05, -5.0829723477363586e-05, -4.855263978242874e-05, -4.6275556087493896e-05, -4.399847239255905e-05, -4.1721388697624207e-05, -3.944430500268936e-05, -3.7167221307754517e-05, -3.489013761281967e-05, -3.261305391788483e-05, -3.033597022294998e-05, -2.8058886528015137e-05, -2.5781802833080292e-05, -2.3504719138145447e-05, -2.1227635443210602e-05, -1.8950551748275757e-05, -1.6673468053340912e-05, -1.4396384358406067e-05, -1.2119300663471222e-05, -9.842216968536377e-06, -7.565133273601532e-06, -5.288049578666687e-06, -3.010965883731842e-06, -7.338821887969971e-07, 1.543201506137848e-06, 3.820285201072693e-06, 6.097368896007538e-06, 8.374452590942383e-06, 1.0651536285877228e-05, 1.2928619980812073e-05, 1.5205703675746918e-05, 1.7482787370681763e-05, 1.9759871065616608e-05, 2.2036954760551453e-05, 2.4314038455486298e-05, 2.6591122150421143e-05, 2.8868205845355988e-05, 3.114528954029083e-05, 3.342237323522568e-05, 3.569945693016052e-05, 3.797654062509537e-05, 4.025362432003021e-05, 4.253070801496506e-05, 4.48077917098999e-05, 4.708487540483475e-05, 4.936195909976959e-05, 5.163904279470444e-05, 5.391612648963928e-05, 5.619321018457413e-05, 5.847029387950897e-05, 6.074737757444382e-05, 6.302446126937866e-05, 6.530154496431351e-05, 6.757862865924835e-05, 6.98557123541832e-05, 7.213279604911804e-05, 7.440987974405289e-05, 7.668696343898773e-05, 7.896404713392258e-05, 8.124113082885742e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 7.0, 9.0, 12.0, 17.0, 16.0, 33.0, 44.0, 81.0, 141.0, 210.0, 360.0, 686.0, 1342.0, 2564.0, 5529.0, 12895.0, 36999.0, 146561.0, 469310.0, 272449.0, 64565.0, 19515.0, 7857.0, 3464.0, 1800.0, 900.0, 463.0, 250.0, 176.0, 99.0, 67.0, 33.0, 21.0, 20.0, 19.0, 9.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307373046875, -0.2979774475097656, -0.28858184814453125, -0.2791862487792969, -0.2697906494140625, -0.2603950500488281, -0.25099945068359375, -0.24160385131835938, -0.232208251953125, -0.22281265258789062, -0.21341705322265625, -0.20402145385742188, -0.1946258544921875, -0.18523025512695312, -0.17583465576171875, -0.16643905639648438, -0.15704345703125, -0.14764785766601562, -0.13825225830078125, -0.12885665893554688, -0.1194610595703125, -0.11006546020507812, -0.10066986083984375, -0.09127426147460938, -0.081878662109375, -0.07248306274414062, -0.06308746337890625, -0.053691864013671875, -0.0442962646484375, -0.034900665283203125, -0.02550506591796875, -0.016109466552734375, -0.0067138671875, 0.002681732177734375, 0.01207733154296875, 0.021472930908203125, 0.0308685302734375, 0.040264129638671875, 0.04965972900390625, 0.059055328369140625, 0.068450927734375, 0.07784652709960938, 0.08724212646484375, 0.09663772583007812, 0.1060333251953125, 0.11542892456054688, 0.12482452392578125, 0.13422012329101562, 0.14361572265625, 0.15301132202148438, 0.16240692138671875, 0.17180252075195312, 0.1811981201171875, 0.19059371948242188, 0.19998931884765625, 0.20938491821289062, 0.218780517578125, 0.22817611694335938, 0.23757171630859375, 0.24696731567382812, 0.2563629150390625, 0.2657585144042969, 0.27515411376953125, 0.2845497131347656, 0.2939453125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 6.0, 8.0, 12.0, 9.0, 19.0, 17.0, 23.0, 23.0, 42.0, 50.0, 51.0, 62.0, 82.0, 81.0, 93.0, 75.0, 69.0, 58.0, 34.0, 33.0, 23.0, 26.0, 19.0, 13.0, 12.0, 16.0, 7.0, 4.0, 6.0, 4.0, 1.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.194580078125, -0.18806076049804688, -0.18154144287109375, -0.17502212524414062, -0.1685028076171875, -0.16198348999023438, -0.15546417236328125, -0.14894485473632812, -0.142425537109375, -0.13590621948242188, -0.12938690185546875, -0.12286758422851562, -0.1163482666015625, -0.10982894897460938, -0.10330963134765625, -0.09679031372070312, -0.09027099609375, -0.08375167846679688, -0.07723236083984375, -0.07071304321289062, -0.0641937255859375, -0.057674407958984375, -0.05115509033203125, -0.044635772705078125, -0.038116455078125, -0.031597137451171875, -0.02507781982421875, -0.018558502197265625, -0.0120391845703125, -0.005519866943359375, 0.00099945068359375, 0.007518768310546875, 0.0140380859375, 0.020557403564453125, 0.02707672119140625, 0.033596038818359375, 0.0401153564453125, 0.046634674072265625, 0.05315399169921875, 0.059673309326171875, 0.066192626953125, 0.07271194458007812, 0.07923126220703125, 0.08575057983398438, 0.0922698974609375, 0.09878921508789062, 0.10530853271484375, 0.11182785034179688, 0.11834716796875, 0.12486648559570312, 0.13138580322265625, 0.13790512084960938, 0.1444244384765625, 0.15094375610351562, 0.15746307373046875, 0.16398239135742188, 0.170501708984375, 0.17702102661132812, 0.18354034423828125, 0.19005966186523438, 0.1965789794921875, 0.20309829711914062, 0.20961761474609375, 0.21613693237304688, 0.22265625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 14.0, 38.0, 89.0, 172.0, 234.0, 220.0, 124.0, 64.0, 22.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.845476150512695, -5.6986165046691895, -5.551756858825684, -5.404897689819336, -5.25803804397583, -5.111178398132324, -4.964318752288818, -4.8174591064453125, -4.670599460601807, -4.523739814758301, -4.376880168914795, -4.230020523071289, -4.083161354064941, -3.9363017082214355, -3.7894420623779297, -3.642582416534424, -3.495723009109497, -3.348863363265991, -3.2020039558410645, -3.0551443099975586, -2.9082846641540527, -2.761425018310547, -2.61456561088562, -2.4677059650421143, -2.3208465576171875, -2.1739869117736816, -2.027127504348755, -1.880267858505249, -1.7334082126617432, -1.5865486860275269, -1.4396891593933105, -1.2928295135498047, -1.145970106124878, -0.9991105198860168, -0.8522509336471558, -0.7053914070129395, -0.5585318207740784, -0.4116722345352173, -0.264812707901001, -0.11795306205749512, 0.02890646457672119, 0.17576603591442108, 0.32262560725212097, 0.46948516368865967, 0.6163447499275208, 0.7632043361663818, 0.9100638628005981, 1.056923508644104, 1.2037830352783203, 1.3506425619125366, 1.4975022077560425, 1.6443617343902588, 1.7912213802337646, 1.938080906867981, 2.0849404335021973, 2.231800079345703, 2.378659725189209, 2.525519371032715, 2.6723787784576416, 2.8192384243011475, 2.9660980701446533, 3.11295747756958, 3.259817123413086, 3.406676769256592, 3.5535361766815186]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 6.0, 9.0, 8.0, 12.0, 11.0, 18.0, 16.0, 11.0, 16.0, 21.0, 38.0, 29.0, 31.0, 26.0, 34.0, 32.0, 42.0, 26.0, 42.0, 43.0, 47.0, 38.0, 39.0, 33.0, 45.0, 39.0, 38.0, 26.0, 32.0, 18.0, 23.0, 22.0, 22.0, 15.0, 20.0, 15.0, 10.0, 5.0, 8.0, 10.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.6498146057128906, -1.5995581150054932, -1.5493016242980957, -1.4990451335906982, -1.4487886428833008, -1.3985321521759033, -1.3482756614685059, -1.2980191707611084, -1.247762680053711, -1.1975061893463135, -1.147249698638916, -1.0969932079315186, -1.046736717224121, -0.9964802265167236, -0.9462236762046814, -0.8959671854972839, -0.8457106351852417, -0.7954541444778442, -0.7451976537704468, -0.6949411630630493, -0.6446846723556519, -0.5944281816482544, -0.5441716313362122, -0.4939151406288147, -0.44365864992141724, -0.3934021592140198, -0.3431456685066223, -0.29288914799690247, -0.242632657289505, -0.19237616658210754, -0.1421196460723877, -0.09186315536499023, -0.04160666465759277, 0.008649833500385284, 0.05890633165836334, 0.109162837266922, 0.15941932797431946, 0.20967581868171692, 0.25993233919143677, 0.31018882989883423, 0.3604453206062317, 0.41070181131362915, 0.4609583020210266, 0.5112148523330688, 0.5614713430404663, 0.6117278337478638, 0.6619843244552612, 0.7122408151626587, 0.7624973058700562, 0.8127537965774536, 0.8630102872848511, 0.9132667779922485, 0.963523268699646, 1.0137797594070435, 1.0640363693237305, 1.114292860031128, 1.1645493507385254, 1.2148058414459229, 1.2650623321533203, 1.3153188228607178, 1.3655753135681152, 1.4158318042755127, 1.4660882949829102, 1.5163447856903076, 1.566601276397705]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 12.0, 15.0, 26.0, 18.0, 39.0, 43.0, 68.0, 85.0, 135.0, 193.0, 275.0, 433.0, 644.0, 998.0, 1691.0, 2833.0, 5192.0, 10374.0, 24255.0, 74940.0, 327328.0, 1555616.0, 1696971.0, 357166.0, 84006.0, 27261.0, 11080.0, 5392.0, 2824.0, 1601.0, 1031.0, 612.0, 352.0, 250.0, 166.0, 107.0, 75.0, 57.0, 44.0, 22.0, 14.0, 9.0, 8.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0], "bins": [-0.35546875, -0.34560394287109375, -0.3357391357421875, -0.32587432861328125, -0.316009521484375, -0.30614471435546875, -0.2962799072265625, -0.28641510009765625, -0.27655029296875, -0.26668548583984375, -0.2568206787109375, -0.24695587158203125, -0.237091064453125, -0.22722625732421875, -0.2173614501953125, -0.20749664306640625, -0.1976318359375, -0.18776702880859375, -0.1779022216796875, -0.16803741455078125, -0.158172607421875, -0.14830780029296875, -0.1384429931640625, -0.12857818603515625, -0.11871337890625, -0.10884857177734375, -0.0989837646484375, -0.08911895751953125, -0.079254150390625, -0.06938934326171875, -0.0595245361328125, -0.04965972900390625, -0.039794921875, -0.02993011474609375, -0.0200653076171875, -0.01020050048828125, -0.000335693359375, 0.00952911376953125, 0.0193939208984375, 0.02925872802734375, 0.03912353515625, 0.04898834228515625, 0.0588531494140625, 0.06871795654296875, 0.078582763671875, 0.08844757080078125, 0.0983123779296875, 0.10817718505859375, 0.1180419921875, 0.12790679931640625, 0.1377716064453125, 0.14763641357421875, 0.157501220703125, 0.16736602783203125, 0.1772308349609375, 0.18709564208984375, 0.19696044921875, 0.20682525634765625, 0.2166900634765625, 0.22655487060546875, 0.236419677734375, 0.24628448486328125, 0.2561492919921875, 0.26601409912109375, 0.27587890625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 5.0, 5.0, 12.0, 8.0, 18.0, 16.0, 12.0, 17.0, 27.0, 31.0, 36.0, 31.0, 44.0, 36.0, 49.0, 50.0, 60.0, 50.0, 48.0, 36.0, 32.0, 42.0, 45.0, 43.0, 37.0, 32.0, 18.0, 29.0, 25.0, 12.0, 17.0, 15.0, 11.0, 13.0, 8.0, 4.0, 10.0, 4.0, 5.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-0.2454833984375, -0.23904037475585938, -0.23259735107421875, -0.22615432739257812, -0.2197113037109375, -0.21326828002929688, -0.20682525634765625, -0.20038223266601562, -0.193939208984375, -0.18749618530273438, -0.18105316162109375, -0.17461013793945312, -0.1681671142578125, -0.16172409057617188, -0.15528106689453125, -0.14883804321289062, -0.14239501953125, -0.13595199584960938, -0.12950897216796875, -0.12306594848632812, -0.1166229248046875, -0.11017990112304688, -0.10373687744140625, -0.09729385375976562, -0.090850830078125, -0.08440780639648438, -0.07796478271484375, -0.07152175903320312, -0.0650787353515625, -0.058635711669921875, -0.05219268798828125, -0.045749664306640625, -0.039306640625, -0.032863616943359375, -0.02642059326171875, -0.019977569580078125, -0.0135345458984375, -0.007091522216796875, -0.00064849853515625, 0.005794525146484375, 0.012237548828125, 0.018680572509765625, 0.02512359619140625, 0.031566619873046875, 0.0380096435546875, 0.044452667236328125, 0.05089569091796875, 0.057338714599609375, 0.06378173828125, 0.07022476196289062, 0.07666778564453125, 0.08311080932617188, 0.0895538330078125, 0.09599685668945312, 0.10243988037109375, 0.10888290405273438, 0.115325927734375, 0.12176895141601562, 0.12821197509765625, 0.13465499877929688, 0.1410980224609375, 0.14754104614257812, 0.15398406982421875, 0.16042709350585938, 0.1668701171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 14.0, 9.0, 12.0, 24.0, 18.0, 36.0, 48.0, 57.0, 106.0, 147.0, 234.0, 349.0, 549.0, 913.0, 1730.0, 3723.0, 9052.0, 28752.0, 146011.0, 1909489.0, 1902036.0, 145253.0, 28707.0, 9085.0, 3670.0, 1724.0, 985.0, 553.0, 304.0, 234.0, 143.0, 93.0, 57.0, 34.0, 39.0, 23.0, 22.0, 15.0, 12.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.57861328125, -0.5563583374023438, -0.5341033935546875, -0.5118484497070312, -0.489593505859375, -0.46733856201171875, -0.4450836181640625, -0.42282867431640625, -0.40057373046875, -0.37831878662109375, -0.3560638427734375, -0.33380889892578125, -0.311553955078125, -0.28929901123046875, -0.2670440673828125, -0.24478912353515625, -0.2225341796875, -0.20027923583984375, -0.1780242919921875, -0.15576934814453125, -0.133514404296875, -0.11125946044921875, -0.0890045166015625, -0.06674957275390625, -0.04449462890625, -0.02223968505859375, 1.52587890625e-05, 0.02227020263671875, 0.044525146484375, 0.06678009033203125, 0.0890350341796875, 0.11128997802734375, 0.133544921875, 0.15579986572265625, 0.1780548095703125, 0.20030975341796875, 0.222564697265625, 0.24481964111328125, 0.2670745849609375, 0.28932952880859375, 0.31158447265625, 0.33383941650390625, 0.3560943603515625, 0.37834930419921875, 0.400604248046875, 0.42285919189453125, 0.4451141357421875, 0.46736907958984375, 0.4896240234375, 0.5118789672851562, 0.5341339111328125, 0.5563888549804688, 0.578643798828125, 0.6008987426757812, 0.6231536865234375, 0.6454086303710938, 0.66766357421875, 0.6899185180664062, 0.7121734619140625, 0.7344284057617188, 0.756683349609375, 0.7789382934570312, 0.8011932373046875, 0.8234481811523438, 0.845703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 8.0, 3.0, 4.0, 13.0, 29.0, 34.0, 38.0, 82.0, 103.0, 175.0, 266.0, 487.0, 804.0, 866.0, 494.0, 239.0, 141.0, 96.0, 69.0, 34.0, 22.0, 23.0, 12.0, 12.0, 0.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.7998046875, -0.7802886962890625, -0.760772705078125, -0.7412567138671875, -0.72174072265625, -0.7022247314453125, -0.682708740234375, -0.6631927490234375, -0.6436767578125, -0.6241607666015625, -0.604644775390625, -0.5851287841796875, -0.56561279296875, -0.5460968017578125, -0.526580810546875, -0.5070648193359375, -0.487548828125, -0.4680328369140625, -0.448516845703125, -0.4290008544921875, -0.40948486328125, -0.3899688720703125, -0.370452880859375, -0.3509368896484375, -0.3314208984375, -0.3119049072265625, -0.292388916015625, -0.2728729248046875, -0.25335693359375, -0.2338409423828125, -0.214324951171875, -0.1948089599609375, -0.17529296875, -0.1557769775390625, -0.136260986328125, -0.1167449951171875, -0.09722900390625, -0.0777130126953125, -0.058197021484375, -0.0386810302734375, -0.0191650390625, 0.0003509521484375, 0.019866943359375, 0.0393829345703125, 0.05889892578125, 0.0784149169921875, 0.097930908203125, 0.1174468994140625, 0.136962890625, 0.1564788818359375, 0.175994873046875, 0.1955108642578125, 0.21502685546875, 0.2345428466796875, 0.254058837890625, 0.2735748291015625, 0.2930908203125, 0.3126068115234375, 0.332122802734375, 0.3516387939453125, 0.37115478515625, 0.3906707763671875, 0.410186767578125, 0.4297027587890625, 0.44921875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 7.0, 16.0, 13.0, 30.0, 42.0, 136.0, 238.0, 243.0, 155.0, 81.0, 28.0, 11.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.802663803100586, -7.630014419555664, -7.457364559173584, -7.284715175628662, -7.11206579208374, -6.939416408538818, -6.766766548156738, -6.594117164611816, -6.4214677810668945, -6.248818397521973, -6.076168537139893, -5.903519153594971, -5.730869770050049, -5.558220386505127, -5.385570526123047, -5.212921142578125, -5.040271759033203, -4.867622375488281, -4.694972515106201, -4.522323131561279, -4.349673748016357, -4.1770243644714355, -4.0043745040893555, -3.8317251205444336, -3.6590752601623535, -3.4864256381988525, -3.3137762546539307, -3.1411266326904297, -2.968477249145508, -2.795827627182007, -2.623178005218506, -2.450528621673584, -2.277879238128662, -2.105229616165161, -1.9325802326202393, -1.7599306106567383, -1.5872812271118164, -1.4146316051483154, -1.241982102394104, -1.0693325996398926, -0.8966830968856812, -0.7240335941314697, -0.5513840913772583, -0.3787345290184021, -0.20608502626419067, -0.03343552350997925, 0.13921403884887695, 0.3118635416030884, 0.4845130443572998, 0.6571625471115112, 0.8298120498657227, 1.0024616718292236, 1.1751110553741455, 1.3477606773376465, 1.520410180091858, 1.6930596828460693, 1.8657091856002808, 2.038358688354492, 2.211008310317993, 2.383657693862915, 2.556307315826416, 2.728956699371338, 2.901606321334839, 3.07425594329834, 3.2469053268432617]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 1.0, 3.0, 4.0, 2.0, 13.0, 9.0, 11.0, 6.0, 17.0, 10.0, 20.0, 18.0, 19.0, 28.0, 33.0, 32.0, 29.0, 24.0, 29.0, 41.0, 33.0, 44.0, 37.0, 30.0, 38.0, 44.0, 45.0, 30.0, 40.0, 38.0, 30.0, 31.0, 24.0, 25.0, 23.0, 19.0, 22.0, 21.0, 12.0, 13.0, 8.0, 12.0, 6.0, 8.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.2920538187026978, -1.2525336742401123, -1.2130136489868164, -1.173493504524231, -1.1339733600616455, -1.0944533348083496, -1.0549331903457642, -1.0154130458831787, -0.9758930206298828, -0.9363729357719421, -0.8968528509140015, -0.857332706451416, -0.8178126215934753, -0.7782925367355347, -0.7387723922729492, -0.6992523074150085, -0.6597322225570679, -0.6202121376991272, -0.5806920528411865, -0.5411719083786011, -0.5016518235206604, -0.4621317386627197, -0.42261162400245667, -0.3830915093421936, -0.34357142448425293, -0.30405133962631226, -0.2645312249660492, -0.22501112520694733, -0.18549102544784546, -0.1459709256887436, -0.10645082592964172, -0.06693071126937866, -0.02741062641143799, 0.01210947334766388, 0.05162957310676575, 0.09114967286586761, 0.13066977262496948, 0.17018987238407135, 0.20970997214317322, 0.24923008680343628, 0.28875017166137695, 0.3282702565193176, 0.3677903711795807, 0.40731048583984375, 0.4468305706977844, 0.4863506555557251, 0.5258708000183105, 0.5653908848762512, 0.6049109697341919, 0.6444310545921326, 0.6839511394500732, 0.7234712839126587, 0.7629913687705994, 0.80251145362854, 0.8420315980911255, 0.8815516829490662, 0.9210717678070068, 0.9605918526649475, 1.0001119375228882, 1.0396320819854736, 1.0791521072387695, 1.118672251701355, 1.1581923961639404, 1.1977124214172363, 1.2372325658798218]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 16.0, 23.0, 20.0, 36.0, 79.0, 112.0, 172.0, 276.0, 443.0, 725.0, 1314.0, 2350.0, 4350.0, 8770.0, 18687.0, 45650.0, 134330.0, 346117.0, 306532.0, 107597.0, 38025.0, 16371.0, 7787.0, 3883.0, 2042.0, 1147.0, 631.0, 414.0, 240.0, 127.0, 95.0, 71.0, 46.0, 29.0, 15.0, 12.0, 9.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.45361328125, -0.4393959045410156, -0.42517852783203125, -0.4109611511230469, -0.3967437744140625, -0.3825263977050781, -0.36830902099609375, -0.3540916442871094, -0.339874267578125, -0.3256568908691406, -0.31143951416015625, -0.2972221374511719, -0.2830047607421875, -0.2687873840332031, -0.25457000732421875, -0.24035263061523438, -0.22613525390625, -0.21191787719726562, -0.19770050048828125, -0.18348312377929688, -0.1692657470703125, -0.15504837036132812, -0.14083099365234375, -0.12661361694335938, -0.112396240234375, -0.09817886352539062, -0.08396148681640625, -0.06974411010742188, -0.0555267333984375, -0.041309356689453125, -0.02709197998046875, -0.012874603271484375, 0.0013427734375, 0.015560150146484375, 0.02977752685546875, 0.043994903564453125, 0.0582122802734375, 0.07242965698242188, 0.08664703369140625, 0.10086441040039062, 0.115081787109375, 0.12929916381835938, 0.14351654052734375, 0.15773391723632812, 0.1719512939453125, 0.18616867065429688, 0.20038604736328125, 0.21460342407226562, 0.22882080078125, 0.24303817749023438, 0.25725555419921875, 0.2714729309082031, 0.2856903076171875, 0.2999076843261719, 0.31412506103515625, 0.3283424377441406, 0.342559814453125, 0.3567771911621094, 0.37099456787109375, 0.3852119445800781, 0.3994293212890625, 0.4136466979980469, 0.42786407470703125, 0.4420814514160156, 0.456298828125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 3.0, 2.0, 12.0, 9.0, 12.0, 11.0, 21.0, 20.0, 19.0, 24.0, 32.0, 28.0, 28.0, 50.0, 31.0, 43.0, 52.0, 43.0, 35.0, 49.0, 44.0, 54.0, 39.0, 41.0, 34.0, 35.0, 28.0, 28.0, 29.0, 22.0, 23.0, 20.0, 19.0, 10.0, 10.0, 7.0, 6.0, 3.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0], "bins": [-0.248779296875, -0.241973876953125, -0.23516845703125, -0.228363037109375, -0.2215576171875, -0.214752197265625, -0.20794677734375, -0.201141357421875, -0.1943359375, -0.187530517578125, -0.18072509765625, -0.173919677734375, -0.1671142578125, -0.160308837890625, -0.15350341796875, -0.146697998046875, -0.139892578125, -0.133087158203125, -0.12628173828125, -0.119476318359375, -0.1126708984375, -0.105865478515625, -0.09906005859375, -0.092254638671875, -0.08544921875, -0.078643798828125, -0.07183837890625, -0.065032958984375, -0.0582275390625, -0.051422119140625, -0.04461669921875, -0.037811279296875, -0.031005859375, -0.024200439453125, -0.01739501953125, -0.010589599609375, -0.0037841796875, 0.003021240234375, 0.00982666015625, 0.016632080078125, 0.0234375, 0.030242919921875, 0.03704833984375, 0.043853759765625, 0.0506591796875, 0.057464599609375, 0.06427001953125, 0.071075439453125, 0.077880859375, 0.084686279296875, 0.09149169921875, 0.098297119140625, 0.1051025390625, 0.111907958984375, 0.11871337890625, 0.125518798828125, 0.13232421875, 0.139129638671875, 0.14593505859375, 0.152740478515625, 0.1595458984375, 0.166351318359375, 0.17315673828125, 0.179962158203125, 0.186767578125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 8.0, 14.0, 28.0, 33.0, 58.0, 88.0, 135.0, 176.0, 266.0, 407.0, 675.0, 1087.0, 1806.0, 3180.0, 5323.0, 9886.0, 19250.0, 46786.0, 142864.0, 383623.0, 280472.0, 88077.0, 31695.0, 14467.0, 7502.0, 4125.0, 2466.0, 1492.0, 890.0, 592.0, 351.0, 214.0, 157.0, 106.0, 88.0, 46.0, 40.0, 24.0, 10.0, 14.0, 8.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.474853515625, -0.4599189758300781, -0.44498443603515625, -0.4300498962402344, -0.4151153564453125, -0.4001808166503906, -0.38524627685546875, -0.3703117370605469, -0.355377197265625, -0.3404426574707031, -0.32550811767578125, -0.3105735778808594, -0.2956390380859375, -0.2807044982910156, -0.26576995849609375, -0.2508354187011719, -0.23590087890625, -0.22096633911132812, -0.20603179931640625, -0.19109725952148438, -0.1761627197265625, -0.16122817993164062, -0.14629364013671875, -0.13135910034179688, -0.116424560546875, -0.10149002075195312, -0.08655548095703125, -0.07162094116210938, -0.0566864013671875, -0.041751861572265625, -0.02681732177734375, -0.011882781982421875, 0.0030517578125, 0.017986297607421875, 0.03292083740234375, 0.047855377197265625, 0.0627899169921875, 0.07772445678710938, 0.09265899658203125, 0.10759353637695312, 0.122528076171875, 0.13746261596679688, 0.15239715576171875, 0.16733169555664062, 0.1822662353515625, 0.19720077514648438, 0.21213531494140625, 0.22706985473632812, 0.24200439453125, 0.2569389343261719, 0.27187347412109375, 0.2868080139160156, 0.3017425537109375, 0.3166770935058594, 0.33161163330078125, 0.3465461730957031, 0.361480712890625, 0.3764152526855469, 0.39134979248046875, 0.4062843322753906, 0.4212188720703125, 0.4361534118652344, 0.45108795166015625, 0.4660224914550781, 0.48095703125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 8.0, 7.0, 11.0, 14.0, 8.0, 16.0, 15.0, 19.0, 21.0, 28.0, 36.0, 27.0, 34.0, 43.0, 43.0, 34.0, 52.0, 39.0, 44.0, 59.0, 40.0, 46.0, 32.0, 34.0, 32.0, 48.0, 42.0, 34.0, 20.0, 20.0, 8.0, 17.0, 7.0, 14.0, 7.0, 11.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75, -0.7263717651367188, -0.7027435302734375, -0.6791152954101562, -0.655487060546875, -0.6318588256835938, -0.6082305908203125, -0.5846023559570312, -0.56097412109375, -0.5373458862304688, -0.5137176513671875, -0.49008941650390625, -0.466461181640625, -0.44283294677734375, -0.4192047119140625, -0.39557647705078125, -0.3719482421875, -0.34832000732421875, -0.3246917724609375, -0.30106353759765625, -0.277435302734375, -0.25380706787109375, -0.2301788330078125, -0.20655059814453125, -0.18292236328125, -0.15929412841796875, -0.1356658935546875, -0.11203765869140625, -0.088409423828125, -0.06478118896484375, -0.0411529541015625, -0.01752471923828125, 0.006103515625, 0.02973175048828125, 0.0533599853515625, 0.07698822021484375, 0.100616455078125, 0.12424468994140625, 0.1478729248046875, 0.17150115966796875, 0.19512939453125, 0.21875762939453125, 0.2423858642578125, 0.26601409912109375, 0.289642333984375, 0.31327056884765625, 0.3368988037109375, 0.36052703857421875, 0.3841552734375, 0.40778350830078125, 0.4314117431640625, 0.45503997802734375, 0.478668212890625, 0.5022964477539062, 0.5259246826171875, 0.5495529174804688, 0.57318115234375, 0.5968093872070312, 0.6204376220703125, 0.6440658569335938, 0.667694091796875, 0.6913223266601562, 0.7149505615234375, 0.7385787963867188, 0.76220703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 12.0, 21.0, 21.0, 42.0, 56.0, 92.0, 129.0, 188.0, 255.0, 403.0, 588.0, 937.0, 1380.0, 2200.0, 3424.0, 5399.0, 8973.0, 15350.0, 27956.0, 55244.0, 124366.0, 299346.0, 275702.0, 112154.0, 51022.0, 26213.0, 14349.0, 8458.0, 5058.0, 3141.0, 2111.0, 1347.0, 898.0, 614.0, 343.0, 248.0, 175.0, 105.0, 84.0, 50.0, 37.0, 20.0, 11.0, 7.0, 12.0, 6.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1513671875, -0.1459503173828125, -0.140533447265625, -0.1351165771484375, -0.12969970703125, -0.1242828369140625, -0.118865966796875, -0.1134490966796875, -0.1080322265625, -0.1026153564453125, -0.097198486328125, -0.0917816162109375, -0.08636474609375, -0.0809478759765625, -0.075531005859375, -0.0701141357421875, -0.064697265625, -0.0592803955078125, -0.053863525390625, -0.0484466552734375, -0.04302978515625, -0.0376129150390625, -0.032196044921875, -0.0267791748046875, -0.0213623046875, -0.0159454345703125, -0.010528564453125, -0.0051116943359375, 0.00030517578125, 0.0057220458984375, 0.011138916015625, 0.0165557861328125, 0.02197265625, 0.0273895263671875, 0.032806396484375, 0.0382232666015625, 0.04364013671875, 0.0490570068359375, 0.054473876953125, 0.0598907470703125, 0.0653076171875, 0.0707244873046875, 0.076141357421875, 0.0815582275390625, 0.08697509765625, 0.0923919677734375, 0.097808837890625, 0.1032257080078125, 0.108642578125, 0.1140594482421875, 0.119476318359375, 0.1248931884765625, 0.13031005859375, 0.1357269287109375, 0.141143798828125, 0.1465606689453125, 0.1519775390625, 0.1573944091796875, 0.162811279296875, 0.1682281494140625, 0.17364501953125, 0.1790618896484375, 0.184478759765625, 0.1898956298828125, 0.1953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 4.0, 7.0, 14.0, 16.0, 24.0, 28.0, 38.0, 50.0, 72.0, 135.0, 161.0, 121.0, 88.0, 53.0, 40.0, 23.0, 26.0, 16.0, 15.0, 11.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.022785186767578e-05, -7.783900946378708e-05, -7.545016705989838e-05, -7.306132465600967e-05, -7.067248225212097e-05, -6.828363984823227e-05, -6.589479744434357e-05, -6.350595504045486e-05, -6.111711263656616e-05, -5.872827023267746e-05, -5.633942782878876e-05, -5.3950585424900055e-05, -5.156174302101135e-05, -4.917290061712265e-05, -4.678405821323395e-05, -4.4395215809345245e-05, -4.200637340545654e-05, -3.961753100156784e-05, -3.722868859767914e-05, -3.4839846193790436e-05, -3.2451003789901733e-05, -3.006216138601303e-05, -2.767331898212433e-05, -2.5284476578235626e-05, -2.2895634174346924e-05, -2.050679177045822e-05, -1.811794936656952e-05, -1.5729106962680817e-05, -1.3340264558792114e-05, -1.0951422154903412e-05, -8.56257975101471e-06, -6.173737347126007e-06, -3.7848949432373047e-06, -1.3960525393486023e-06, 9.927898645401e-07, 3.3816322684288025e-06, 5.770474672317505e-06, 8.159317076206207e-06, 1.054815948009491e-05, 1.2937001883983612e-05, 1.5325844287872314e-05, 1.7714686691761017e-05, 2.010352909564972e-05, 2.249237149953842e-05, 2.4881213903427124e-05, 2.7270056307315826e-05, 2.965889871120453e-05, 3.204774111509323e-05, 3.4436583518981934e-05, 3.6825425922870636e-05, 3.921426832675934e-05, 4.160311073064804e-05, 4.399195313453674e-05, 4.6380795538425446e-05, 4.876963794231415e-05, 5.115848034620285e-05, 5.354732275009155e-05, 5.5936165153980255e-05, 5.832500755786896e-05, 6.071384996175766e-05, 6.310269236564636e-05, 6.549153476953506e-05, 6.788037717342377e-05, 7.026921957731247e-05, 7.265806198120117e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 13.0, 9.0, 11.0, 34.0, 34.0, 57.0, 92.0, 139.0, 207.0, 337.0, 529.0, 949.0, 1511.0, 2569.0, 4637.0, 8431.0, 16506.0, 34166.0, 74069.0, 166784.0, 312321.0, 229342.0, 102582.0, 46522.0, 22004.0, 10924.0, 5726.0, 3317.0, 1820.0, 1101.0, 663.0, 416.0, 247.0, 158.0, 98.0, 79.0, 37.0, 36.0, 22.0, 17.0, 11.0, 8.0, 5.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.17626953125, -0.17087936401367188, -0.16548919677734375, -0.16009902954101562, -0.1547088623046875, -0.14931869506835938, -0.14392852783203125, -0.13853836059570312, -0.133148193359375, -0.12775802612304688, -0.12236785888671875, -0.11697769165039062, -0.1115875244140625, -0.10619735717773438, -0.10080718994140625, -0.09541702270507812, -0.09002685546875, -0.08463668823242188, -0.07924652099609375, -0.07385635375976562, -0.0684661865234375, -0.06307601928710938, -0.05768585205078125, -0.052295684814453125, -0.046905517578125, -0.041515350341796875, -0.03612518310546875, -0.030735015869140625, -0.0253448486328125, -0.019954681396484375, -0.01456451416015625, -0.009174346923828125, -0.0037841796875, 0.001605987548828125, 0.00699615478515625, 0.012386322021484375, 0.0177764892578125, 0.023166656494140625, 0.02855682373046875, 0.033946990966796875, 0.039337158203125, 0.044727325439453125, 0.05011749267578125, 0.055507659912109375, 0.0608978271484375, 0.06628799438476562, 0.07167816162109375, 0.07706832885742188, 0.08245849609375, 0.08784866333007812, 0.09323883056640625, 0.09862899780273438, 0.1040191650390625, 0.10940933227539062, 0.11479949951171875, 0.12018966674804688, 0.125579833984375, 0.13097000122070312, 0.13636016845703125, 0.14175033569335938, 0.1471405029296875, 0.15253067016601562, 0.15792083740234375, 0.16331100463867188, 0.168701171875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 4.0, 6.0, 9.0, 14.0, 14.0, 23.0, 33.0, 29.0, 35.0, 44.0, 48.0, 73.0, 80.0, 64.0, 91.0, 82.0, 61.0, 47.0, 49.0, 34.0, 28.0, 23.0, 19.0, 18.0, 11.0, 13.0, 6.0, 6.0, 1.0, 3.0, 5.0, 8.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.200927734375, -0.1944255828857422, -0.18792343139648438, -0.18142127990722656, -0.17491912841796875, -0.16841697692871094, -0.16191482543945312, -0.1554126739501953, -0.1489105224609375, -0.1424083709716797, -0.13590621948242188, -0.12940406799316406, -0.12290191650390625, -0.11639976501464844, -0.10989761352539062, -0.10339546203613281, -0.096893310546875, -0.09039115905761719, -0.08388900756835938, -0.07738685607910156, -0.07088470458984375, -0.06438255310058594, -0.057880401611328125, -0.05137825012207031, -0.0448760986328125, -0.03837394714355469, -0.031871795654296875, -0.025369644165039062, -0.01886749267578125, -0.012365341186523438, -0.005863189697265625, 0.0006389617919921875, 0.00714111328125, 0.013643264770507812, 0.020145416259765625, 0.026647567749023438, 0.03314971923828125, 0.03965187072753906, 0.046154022216796875, 0.05265617370605469, 0.0591583251953125, 0.06566047668457031, 0.07216262817382812, 0.07866477966308594, 0.08516693115234375, 0.09166908264160156, 0.09817123413085938, 0.10467338562011719, 0.111175537109375, 0.11767768859863281, 0.12417984008789062, 0.13068199157714844, 0.13718414306640625, 0.14368629455566406, 0.15018844604492188, 0.1566905975341797, 0.1631927490234375, 0.1696949005126953, 0.17619705200195312, 0.18269920349121094, 0.18920135498046875, 0.19570350646972656, 0.20220565795898438, 0.2087078094482422, 0.2152099609375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 9.0, 6.0, 12.0, 27.0, 45.0, 64.0, 98.0, 125.0, 132.0, 129.0, 108.0, 74.0, 57.0, 44.0, 27.0, 12.0, 6.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.774855613708496, -2.675018310546875, -2.575181007385254, -2.475343704223633, -2.3755064010620117, -2.2756690979003906, -2.1758317947387695, -2.0759944915771484, -1.9761570692062378, -1.8763197660446167, -1.7764824628829956, -1.676645040512085, -1.5768077373504639, -1.4769704341888428, -1.3771331310272217, -1.2772958278656006, -1.1774585247039795, -1.0776212215423584, -0.9777839183807373, -0.8779465556144714, -0.7781092524528503, -0.6782719492912292, -0.5784345865249634, -0.4785972833633423, -0.3787599802017212, -0.2789226770401001, -0.17908534407615662, -0.07924801111221313, 0.02058929204940796, 0.12042659521102905, 0.22026395797729492, 0.320101261138916, 0.4199388027191162, 0.5197761058807373, 0.6196134090423584, 0.7194507718086243, 0.8192880749702454, 0.9191253781318665, 1.0189627408981323, 1.1188000440597534, 1.2186373472213745, 1.3184746503829956, 1.4183119535446167, 1.5181493759155273, 1.6179866790771484, 1.7178239822387695, 1.8176612854003906, 1.9174985885620117, 2.017335891723633, 2.117173194885254, 2.217010498046875, 2.316847801208496, 2.416685104370117, 2.5165224075317383, 2.6163597106933594, 2.7161970138549805, 2.8160343170166016, 2.9158716201782227, 3.0157089233398438, 3.115546226501465, 3.215383529663086, 3.315220832824707, 3.415058135986328, 3.514895439147949, 3.6147329807281494]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 5.0, 3.0, 5.0, 4.0, 7.0, 10.0, 12.0, 21.0, 18.0, 16.0, 23.0, 24.0, 36.0, 35.0, 26.0, 27.0, 28.0, 39.0, 37.0, 50.0, 45.0, 43.0, 43.0, 38.0, 34.0, 34.0, 34.0, 31.0, 30.0, 30.0, 28.0, 22.0, 23.0, 25.0, 16.0, 10.0, 17.0, 10.0, 13.0, 10.0, 8.0, 9.0, 5.0, 6.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5864137411117554, -1.5318446159362793, -1.4772756099700928, -1.4227064847946167, -1.3681373596191406, -1.313568353652954, -1.258999228477478, -1.204430103302002, -1.1498610973358154, -1.0952919721603394, -1.0407229661941528, -0.9861538410186768, -0.9315847754478455, -0.8770157098770142, -0.8224465847015381, -0.7678775191307068, -0.7133084535598755, -0.6587393879890442, -0.6041703224182129, -0.5496011972427368, -0.4950321316719055, -0.4404630661010742, -0.38589397072792053, -0.33132487535476685, -0.27675580978393555, -0.22218672931194305, -0.16761764883995056, -0.11304856836795807, -0.058479487895965576, -0.003910422325134277, 0.05065867304801941, 0.1052277684211731, 0.1597968339920044, 0.2143659144639969, 0.2689349949359894, 0.32350409030914307, 0.37807315587997437, 0.43264222145080566, 0.48721131682395935, 0.541780412197113, 0.5963494777679443, 0.6509185433387756, 0.7054876089096069, 0.760056734085083, 0.8146257996559143, 0.8691948652267456, 0.9237639904022217, 0.978333055973053, 1.0329021215438843, 1.0874712467193604, 1.1420402526855469, 1.196609377861023, 1.251178503036499, 1.3057475090026855, 1.3603166341781616, 1.4148857593536377, 1.4694547653198242, 1.5240238904953003, 1.5785928964614868, 1.633162021636963, 1.6877310276031494, 1.7423001527786255, 1.7968692779541016, 1.851438283920288, 1.9060074090957642]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 6.0, 8.0, 18.0, 15.0, 33.0, 20.0, 44.0, 66.0, 80.0, 79.0, 122.0, 171.0, 208.0, 333.0, 444.0, 740.0, 1287.0, 2007.0, 3771.0, 7148.0, 15882.0, 40382.0, 126260.0, 459388.0, 1507619.0, 1411146.0, 430578.0, 120045.0, 37909.0, 14326.0, 6274.0, 3131.0, 1657.0, 971.0, 702.0, 421.0, 277.0, 167.0, 152.0, 110.0, 65.0, 67.0, 23.0, 25.0, 24.0, 25.0, 12.0, 15.0, 8.0, 4.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.2958984375, -0.2863426208496094, -0.27678680419921875, -0.2672309875488281, -0.2576751708984375, -0.24811935424804688, -0.23856353759765625, -0.22900772094726562, -0.219451904296875, -0.20989608764648438, -0.20034027099609375, -0.19078445434570312, -0.1812286376953125, -0.17167282104492188, -0.16211700439453125, -0.15256118774414062, -0.14300537109375, -0.13344955444335938, -0.12389373779296875, -0.11433792114257812, -0.1047821044921875, -0.09522628784179688, -0.08567047119140625, -0.07611465454101562, -0.066558837890625, -0.057003021240234375, -0.04744720458984375, -0.037891387939453125, -0.0283355712890625, -0.018779754638671875, -0.00922393798828125, 0.000331878662109375, 0.0098876953125, 0.019443511962890625, 0.02899932861328125, 0.038555145263671875, 0.0481109619140625, 0.057666778564453125, 0.06722259521484375, 0.07677841186523438, 0.086334228515625, 0.09589004516601562, 0.10544586181640625, 0.11500167846679688, 0.1245574951171875, 0.13411331176757812, 0.14366912841796875, 0.15322494506835938, 0.16278076171875, 0.17233657836914062, 0.18189239501953125, 0.19144821166992188, 0.2010040283203125, 0.21055984497070312, 0.22011566162109375, 0.22967147827148438, 0.239227294921875, 0.24878311157226562, 0.25833892822265625, 0.2678947448730469, 0.2774505615234375, 0.2870063781738281, 0.29656219482421875, 0.3061180114746094, 0.315673828125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 4.0, 5.0, 4.0, 17.0, 15.0, 22.0, 21.0, 17.0, 20.0, 22.0, 25.0, 27.0, 30.0, 36.0, 40.0, 41.0, 44.0, 53.0, 42.0, 47.0, 38.0, 51.0, 40.0, 28.0, 37.0, 37.0, 36.0, 28.0, 37.0, 22.0, 15.0, 22.0, 12.0, 12.0, 14.0, 5.0, 7.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19873046875, -0.19141387939453125, -0.1840972900390625, -0.17678070068359375, -0.169464111328125, -0.16214752197265625, -0.1548309326171875, -0.14751434326171875, -0.14019775390625, -0.13288116455078125, -0.1255645751953125, -0.11824798583984375, -0.110931396484375, -0.10361480712890625, -0.0962982177734375, -0.08898162841796875, -0.0816650390625, -0.07434844970703125, -0.0670318603515625, -0.05971527099609375, -0.052398681640625, -0.04508209228515625, -0.0377655029296875, -0.03044891357421875, -0.02313232421875, -0.01581573486328125, -0.0084991455078125, -0.00118255615234375, 0.006134033203125, 0.01345062255859375, 0.0207672119140625, 0.02808380126953125, 0.035400390625, 0.04271697998046875, 0.0500335693359375, 0.05735015869140625, 0.064666748046875, 0.07198333740234375, 0.0792999267578125, 0.08661651611328125, 0.09393310546875, 0.10124969482421875, 0.1085662841796875, 0.11588287353515625, 0.123199462890625, 0.13051605224609375, 0.1378326416015625, 0.14514923095703125, 0.1524658203125, 0.15978240966796875, 0.1670989990234375, 0.17441558837890625, 0.181732177734375, 0.18904876708984375, 0.1963653564453125, 0.20368194580078125, 0.21099853515625, 0.21831512451171875, 0.2256317138671875, 0.23294830322265625, 0.240264892578125, 0.24758148193359375, 0.2548980712890625, 0.26221466064453125, 0.26953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 7.0, 8.0, 7.0, 29.0, 39.0, 40.0, 55.0, 77.0, 107.0, 199.0, 242.0, 360.0, 576.0, 943.0, 1444.0, 2361.0, 4266.0, 8146.0, 17933.0, 47143.0, 164703.0, 927631.0, 2410399.0, 448169.0, 98936.0, 31994.0, 13123.0, 6418.0, 3439.0, 2002.0, 1227.0, 726.0, 512.0, 311.0, 232.0, 138.0, 91.0, 71.0, 48.0, 37.0, 26.0, 23.0, 16.0, 14.0, 10.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.59619140625, -0.57977294921875, -0.5633544921875, -0.54693603515625, -0.530517578125, -0.51409912109375, -0.4976806640625, -0.48126220703125, -0.46484375, -0.44842529296875, -0.4320068359375, -0.41558837890625, -0.399169921875, -0.38275146484375, -0.3663330078125, -0.34991455078125, -0.33349609375, -0.31707763671875, -0.3006591796875, -0.28424072265625, -0.267822265625, -0.25140380859375, -0.2349853515625, -0.21856689453125, -0.2021484375, -0.18572998046875, -0.1693115234375, -0.15289306640625, -0.136474609375, -0.12005615234375, -0.1036376953125, -0.08721923828125, -0.07080078125, -0.05438232421875, -0.0379638671875, -0.02154541015625, -0.005126953125, 0.01129150390625, 0.0277099609375, 0.04412841796875, 0.060546875, 0.07696533203125, 0.0933837890625, 0.10980224609375, 0.126220703125, 0.14263916015625, 0.1590576171875, 0.17547607421875, 0.19189453125, 0.20831298828125, 0.2247314453125, 0.24114990234375, 0.257568359375, 0.27398681640625, 0.2904052734375, 0.30682373046875, 0.3232421875, 0.33966064453125, 0.3560791015625, 0.37249755859375, 0.388916015625, 0.40533447265625, 0.4217529296875, 0.43817138671875, 0.45458984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 1.0, 6.0, 9.0, 15.0, 17.0, 25.0, 27.0, 47.0, 73.0, 120.0, 200.0, 307.0, 557.0, 837.0, 678.0, 427.0, 261.0, 136.0, 92.0, 61.0, 49.0, 34.0, 25.0, 17.0, 10.0, 5.0, 10.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.693359375, -0.6728363037109375, -0.652313232421875, -0.6317901611328125, -0.61126708984375, -0.5907440185546875, -0.570220947265625, -0.5496978759765625, -0.5291748046875, -0.5086517333984375, -0.488128662109375, -0.4676055908203125, -0.44708251953125, -0.4265594482421875, -0.406036376953125, -0.3855133056640625, -0.364990234375, -0.3444671630859375, -0.323944091796875, -0.3034210205078125, -0.28289794921875, -0.2623748779296875, -0.241851806640625, -0.2213287353515625, -0.2008056640625, -0.1802825927734375, -0.159759521484375, -0.1392364501953125, -0.11871337890625, -0.0981903076171875, -0.077667236328125, -0.0571441650390625, -0.03662109375, -0.0160980224609375, 0.004425048828125, 0.0249481201171875, 0.04547119140625, 0.0659942626953125, 0.086517333984375, 0.1070404052734375, 0.1275634765625, 0.1480865478515625, 0.168609619140625, 0.1891326904296875, 0.20965576171875, 0.2301788330078125, 0.250701904296875, 0.2712249755859375, 0.291748046875, 0.3122711181640625, 0.332794189453125, 0.3533172607421875, 0.37384033203125, 0.3943634033203125, 0.414886474609375, 0.4354095458984375, 0.4559326171875, 0.4764556884765625, 0.496978759765625, 0.5175018310546875, 0.53802490234375, 0.5585479736328125, 0.579071044921875, 0.5995941162109375, 0.6201171875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 8.0, 3.0, 5.0, 4.0, 5.0, 20.0, 41.0, 66.0, 78.0, 112.0, 133.0, 164.0, 110.0, 104.0, 62.0, 38.0, 22.0, 9.0, 8.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.158179998397827, -2.038081407546997, -1.9179826974868774, -1.7978839874267578, -1.6777853965759277, -1.5576868057250977, -1.437588095664978, -1.3174893856048584, -1.1973907947540283, -1.0772922039031982, -0.9571934938430786, -0.8370948433876038, -0.7169961929321289, -0.596897542476654, -0.4767988920211792, -0.35670024156570435, -0.2366015911102295, -0.11650294065475464, 0.003595709800720215, 0.12369436025619507, 0.24379301071166992, 0.3638916611671448, 0.48399031162261963, 0.6040889620780945, 0.7241876125335693, 0.8442862629890442, 0.964384913444519, 1.0844836235046387, 1.2045822143554688, 1.3246808052062988, 1.4447795152664185, 1.564878225326538, 1.6849770545959473, 1.8050756454467773, 1.925174355506897, 2.0452730655670166, 2.1653716564178467, 2.2854702472686768, 2.405569076538086, 2.525667667388916, 2.645766258239746, 2.765864849090576, 2.8859634399414062, 3.0060622692108154, 3.1261608600616455, 3.2462594509124756, 3.3663582801818848, 3.486456871032715, 3.606555461883545, 3.726654052734375, 3.846752643585205, 3.9668514728546143, 4.086950302124023, 4.2070488929748535, 4.327147483825684, 4.447246074676514, 4.567344665527344, 4.687443256378174, 4.807541847229004, 4.927640438079834, 5.047739028930664, 5.167838096618652, 5.287936687469482, 5.4080352783203125, 5.528133869171143]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 7.0, 7.0, 13.0, 11.0, 15.0, 12.0, 22.0, 26.0, 23.0, 28.0, 20.0, 35.0, 31.0, 34.0, 46.0, 45.0, 35.0, 38.0, 52.0, 44.0, 48.0, 38.0, 34.0, 34.0, 45.0, 30.0, 24.0, 26.0, 19.0, 25.0, 25.0, 18.0, 16.0, 17.0, 11.0, 6.0, 8.0, 2.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.6161739826202393, -1.5630261898040771, -1.5098782777786255, -1.4567304849624634, -1.4035825729370117, -1.3504347801208496, -1.2972869873046875, -1.2441390752792358, -1.1909911632537842, -1.137843370437622, -1.0846954584121704, -1.0315476655960083, -0.9783997535705566, -0.9252519607543945, -0.8721041083335876, -0.8189562559127808, -0.7658084630966187, -0.7126606106758118, -0.6595127582550049, -0.6063649654388428, -0.5532170534133911, -0.500069260597229, -0.4469214081764221, -0.39377355575561523, -0.34062570333480835, -0.28747785091400146, -0.23433001339435577, -0.18118217587471008, -0.1280343234539032, -0.07488647103309631, -0.021738648414611816, 0.03140920400619507, 0.0845571756362915, 0.1377050280570984, 0.19085286557674408, 0.24400070309638977, 0.29714855551719666, 0.35029640793800354, 0.40344423055648804, 0.4565920829772949, 0.5097399353981018, 0.5628877878189087, 0.6160356402397156, 0.6691834926605225, 0.7223312854766846, 0.7754791975021362, 0.8286269903182983, 0.8817748427391052, 0.9349226951599121, 0.988070547580719, 1.0412184000015259, 1.094366192817688, 1.1475141048431396, 1.2006618976593018, 1.2538096904754639, 1.3069576025009155, 1.3601055145263672, 1.4132533073425293, 1.466401219367981, 1.519549012184143, 1.5726969242095947, 1.6258447170257568, 1.678992509841919, 1.7321404218673706, 1.7852882146835327]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 13.0, 12.0, 10.0, 30.0, 33.0, 44.0, 71.0, 84.0, 104.0, 174.0, 254.0, 395.0, 646.0, 953.0, 1629.0, 2746.0, 4774.0, 8607.0, 16776.0, 36053.0, 93584.0, 242293.0, 337289.0, 179134.0, 65346.0, 27238.0, 13244.0, 6948.0, 3793.0, 2357.0, 1420.0, 841.0, 544.0, 386.0, 202.0, 171.0, 112.0, 61.0, 45.0, 41.0, 33.0, 18.0, 16.0, 11.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.456298828125, -0.4407386779785156, -0.42517852783203125, -0.4096183776855469, -0.3940582275390625, -0.3784980773925781, -0.36293792724609375, -0.3473777770996094, -0.331817626953125, -0.3162574768066406, -0.30069732666015625, -0.2851371765136719, -0.2695770263671875, -0.2540168762207031, -0.23845672607421875, -0.22289657592773438, -0.20733642578125, -0.19177627563476562, -0.17621612548828125, -0.16065597534179688, -0.1450958251953125, -0.12953567504882812, -0.11397552490234375, -0.09841537475585938, -0.082855224609375, -0.06729507446289062, -0.05173492431640625, -0.036174774169921875, -0.0206146240234375, -0.005054473876953125, 0.01050567626953125, 0.026065826416015625, 0.0416259765625, 0.057186126708984375, 0.07274627685546875, 0.08830642700195312, 0.1038665771484375, 0.11942672729492188, 0.13498687744140625, 0.15054702758789062, 0.166107177734375, 0.18166732788085938, 0.19722747802734375, 0.21278762817382812, 0.2283477783203125, 0.24390792846679688, 0.25946807861328125, 0.2750282287597656, 0.29058837890625, 0.3061485290527344, 0.32170867919921875, 0.3372688293457031, 0.3528289794921875, 0.3683891296386719, 0.38394927978515625, 0.3995094299316406, 0.415069580078125, 0.4306297302246094, 0.44618988037109375, 0.4617500305175781, 0.4773101806640625, 0.4928703308105469, 0.5084304809570312, 0.5239906311035156, 0.53955078125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 3.0, 5.0, 3.0, 9.0, 11.0, 18.0, 14.0, 14.0, 22.0, 28.0, 26.0, 42.0, 39.0, 41.0, 34.0, 38.0, 46.0, 46.0, 66.0, 52.0, 56.0, 62.0, 33.0, 44.0, 35.0, 23.0, 32.0, 28.0, 21.0, 20.0, 19.0, 19.0, 9.0, 9.0, 8.0, 9.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255615234375, -0.24728775024414062, -0.23896026611328125, -0.23063278198242188, -0.2223052978515625, -0.21397781372070312, -0.20565032958984375, -0.19732284545898438, -0.188995361328125, -0.18066787719726562, -0.17234039306640625, -0.16401290893554688, -0.1556854248046875, -0.14735794067382812, -0.13903045654296875, -0.13070297241210938, -0.12237548828125, -0.11404800415039062, -0.10572052001953125, -0.09739303588867188, -0.0890655517578125, -0.08073806762695312, -0.07241058349609375, -0.06408309936523438, -0.055755615234375, -0.047428131103515625, -0.03910064697265625, -0.030773162841796875, -0.0224456787109375, -0.014118194580078125, -0.00579071044921875, 0.002536773681640625, 0.0108642578125, 0.019191741943359375, 0.02751922607421875, 0.035846710205078125, 0.0441741943359375, 0.052501678466796875, 0.06082916259765625, 0.06915664672851562, 0.077484130859375, 0.08581161499023438, 0.09413909912109375, 0.10246658325195312, 0.1107940673828125, 0.11912155151367188, 0.12744903564453125, 0.13577651977539062, 0.14410400390625, 0.15243148803710938, 0.16075897216796875, 0.16908645629882812, 0.1774139404296875, 0.18574142456054688, 0.19406890869140625, 0.20239639282226562, 0.210723876953125, 0.21905136108398438, 0.22737884521484375, 0.23570632934570312, 0.2440338134765625, 0.2523612976074219, 0.26068878173828125, 0.2690162658691406, 0.27734375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 2.0, 6.0, 13.0, 16.0, 23.0, 35.0, 47.0, 78.0, 139.0, 213.0, 390.0, 671.0, 1298.0, 2573.0, 5465.0, 12954.0, 34033.0, 105465.0, 334983.0, 364135.0, 121646.0, 38142.0, 14257.0, 6022.0, 2817.0, 1394.0, 674.0, 403.0, 262.0, 143.0, 97.0, 50.0, 38.0, 24.0, 19.0, 8.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4755859375, -0.45660400390625, -0.4376220703125, -0.41864013671875, -0.399658203125, -0.38067626953125, -0.3616943359375, -0.34271240234375, -0.32373046875, -0.30474853515625, -0.2857666015625, -0.26678466796875, -0.247802734375, -0.22882080078125, -0.2098388671875, -0.19085693359375, -0.171875, -0.15289306640625, -0.1339111328125, -0.11492919921875, -0.095947265625, -0.07696533203125, -0.0579833984375, -0.03900146484375, -0.02001953125, -0.00103759765625, 0.0179443359375, 0.03692626953125, 0.055908203125, 0.07489013671875, 0.0938720703125, 0.11285400390625, 0.1318359375, 0.15081787109375, 0.1697998046875, 0.18878173828125, 0.207763671875, 0.22674560546875, 0.2457275390625, 0.26470947265625, 0.28369140625, 0.30267333984375, 0.3216552734375, 0.34063720703125, 0.359619140625, 0.37860107421875, 0.3975830078125, 0.41656494140625, 0.435546875, 0.45452880859375, 0.4735107421875, 0.49249267578125, 0.511474609375, 0.53045654296875, 0.5494384765625, 0.56842041015625, 0.58740234375, 0.60638427734375, 0.6253662109375, 0.64434814453125, 0.663330078125, 0.68231201171875, 0.7012939453125, 0.72027587890625, 0.7392578125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 5.0, 5.0, 8.0, 9.0, 10.0, 17.0, 17.0, 18.0, 19.0, 30.0, 19.0, 37.0, 28.0, 24.0, 29.0, 37.0, 31.0, 36.0, 34.0, 34.0, 34.0, 44.0, 48.0, 27.0, 33.0, 44.0, 35.0, 36.0, 32.0, 27.0, 31.0, 17.0, 19.0, 22.0, 16.0, 14.0, 11.0, 6.0, 8.0, 5.0, 9.0, 9.0, 7.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.71923828125, -0.6988601684570312, -0.6784820556640625, -0.6581039428710938, -0.637725830078125, -0.6173477172851562, -0.5969696044921875, -0.5765914916992188, -0.55621337890625, -0.5358352661132812, -0.5154571533203125, -0.49507904052734375, -0.474700927734375, -0.45432281494140625, -0.4339447021484375, -0.41356658935546875, -0.3931884765625, -0.37281036376953125, -0.3524322509765625, -0.33205413818359375, -0.311676025390625, -0.29129791259765625, -0.2709197998046875, -0.25054168701171875, -0.23016357421875, -0.20978546142578125, -0.1894073486328125, -0.16902923583984375, -0.148651123046875, -0.12827301025390625, -0.1078948974609375, -0.08751678466796875, -0.067138671875, -0.04676055908203125, -0.0263824462890625, -0.00600433349609375, 0.014373779296875, 0.03475189208984375, 0.0551300048828125, 0.07550811767578125, 0.09588623046875, 0.11626434326171875, 0.1366424560546875, 0.15702056884765625, 0.177398681640625, 0.19777679443359375, 0.2181549072265625, 0.23853302001953125, 0.2589111328125, 0.27928924560546875, 0.2996673583984375, 0.32004547119140625, 0.340423583984375, 0.36080169677734375, 0.3811798095703125, 0.40155792236328125, 0.42193603515625, 0.44231414794921875, 0.4626922607421875, 0.48307037353515625, 0.503448486328125, 0.5238265991210938, 0.5442047119140625, 0.5645828247070312, 0.5849609375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 6.0, 12.0, 13.0, 18.0, 38.0, 47.0, 71.0, 104.0, 120.0, 212.0, 337.0, 518.0, 796.0, 1232.0, 2013.0, 3430.0, 6113.0, 11515.0, 23684.0, 53499.0, 137723.0, 328869.0, 282681.0, 108740.0, 43344.0, 20192.0, 9965.0, 5304.0, 2997.0, 1782.0, 1091.0, 705.0, 487.0, 301.0, 182.0, 117.0, 114.0, 46.0, 47.0, 30.0, 15.0, 13.0, 5.0, 13.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.230712890625, -0.222991943359375, -0.21527099609375, -0.207550048828125, -0.1998291015625, -0.192108154296875, -0.18438720703125, -0.176666259765625, -0.1689453125, -0.161224365234375, -0.15350341796875, -0.145782470703125, -0.1380615234375, -0.130340576171875, -0.12261962890625, -0.114898681640625, -0.107177734375, -0.099456787109375, -0.09173583984375, -0.084014892578125, -0.0762939453125, -0.068572998046875, -0.06085205078125, -0.053131103515625, -0.04541015625, -0.037689208984375, -0.02996826171875, -0.022247314453125, -0.0145263671875, -0.006805419921875, 0.00091552734375, 0.008636474609375, 0.016357421875, 0.024078369140625, 0.03179931640625, 0.039520263671875, 0.0472412109375, 0.054962158203125, 0.06268310546875, 0.070404052734375, 0.078125, 0.085845947265625, 0.09356689453125, 0.101287841796875, 0.1090087890625, 0.116729736328125, 0.12445068359375, 0.132171630859375, 0.139892578125, 0.147613525390625, 0.15533447265625, 0.163055419921875, 0.1707763671875, 0.178497314453125, 0.18621826171875, 0.193939208984375, 0.20166015625, 0.209381103515625, 0.21710205078125, 0.224822998046875, 0.2325439453125, 0.240264892578125, 0.24798583984375, 0.255706787109375, 0.263427734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 2.0, 8.0, 13.0, 11.0, 10.0, 20.0, 24.0, 39.0, 64.0, 90.0, 121.0, 127.0, 124.0, 93.0, 57.0, 46.0, 33.0, 28.0, 15.0, 15.0, 10.0, 10.0, 6.0, 3.0, 3.0, 5.0, 3.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.22083854675293e-05, -8.912384510040283e-05, -8.603930473327637e-05, -8.29547643661499e-05, -7.987022399902344e-05, -7.678568363189697e-05, -7.370114326477051e-05, -7.061660289764404e-05, -6.753206253051758e-05, -6.444752216339111e-05, -6.136298179626465e-05, -5.8278441429138184e-05, -5.519390106201172e-05, -5.2109360694885254e-05, -4.902482032775879e-05, -4.5940279960632324e-05, -4.285573959350586e-05, -3.9771199226379395e-05, -3.668665885925293e-05, -3.3602118492126465e-05, -3.0517578125e-05, -2.7433037757873535e-05, -2.434849739074707e-05, -2.1263957023620605e-05, -1.817941665649414e-05, -1.5094876289367676e-05, -1.2010335922241211e-05, -8.925795555114746e-06, -5.841255187988281e-06, -2.7567148208618164e-06, 3.2782554626464844e-07, 3.4123659133911133e-06, 6.496906280517578e-06, 9.581446647644043e-06, 1.2665987014770508e-05, 1.5750527381896973e-05, 1.8835067749023438e-05, 2.1919608116149902e-05, 2.5004148483276367e-05, 2.8088688850402832e-05, 3.11732292175293e-05, 3.425776958465576e-05, 3.7342309951782227e-05, 4.042685031890869e-05, 4.3511390686035156e-05, 4.659593105316162e-05, 4.9680471420288086e-05, 5.276501178741455e-05, 5.5849552154541016e-05, 5.893409252166748e-05, 6.201863288879395e-05, 6.510317325592041e-05, 6.818771362304688e-05, 7.127225399017334e-05, 7.43567943572998e-05, 7.744133472442627e-05, 8.052587509155273e-05, 8.36104154586792e-05, 8.669495582580566e-05, 8.977949619293213e-05, 9.28640365600586e-05, 9.594857692718506e-05, 9.903311729431152e-05, 0.00010211765766143799, 0.00010520219802856445]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 7.0, 11.0, 21.0, 13.0, 22.0, 46.0, 57.0, 110.0, 123.0, 180.0, 257.0, 357.0, 553.0, 870.0, 1344.0, 2197.0, 3704.0, 6297.0, 11322.0, 22210.0, 45974.0, 99983.0, 209946.0, 284832.0, 186743.0, 86168.0, 40461.0, 19641.0, 10435.0, 5692.0, 3323.0, 1986.0, 1232.0, 773.0, 544.0, 353.0, 225.0, 159.0, 96.0, 72.0, 49.0, 42.0, 38.0, 32.0, 14.0, 12.0, 9.0, 8.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2027587890625, -0.196502685546875, -0.19024658203125, -0.183990478515625, -0.177734375, -0.171478271484375, -0.16522216796875, -0.158966064453125, -0.1527099609375, -0.146453857421875, -0.14019775390625, -0.133941650390625, -0.127685546875, -0.121429443359375, -0.11517333984375, -0.108917236328125, -0.1026611328125, -0.096405029296875, -0.09014892578125, -0.083892822265625, -0.07763671875, -0.071380615234375, -0.06512451171875, -0.058868408203125, -0.0526123046875, -0.046356201171875, -0.04010009765625, -0.033843994140625, -0.027587890625, -0.021331787109375, -0.01507568359375, -0.008819580078125, -0.0025634765625, 0.003692626953125, 0.00994873046875, 0.016204833984375, 0.0224609375, 0.028717041015625, 0.03497314453125, 0.041229248046875, 0.0474853515625, 0.053741455078125, 0.05999755859375, 0.066253662109375, 0.072509765625, 0.078765869140625, 0.08502197265625, 0.091278076171875, 0.0975341796875, 0.103790283203125, 0.11004638671875, 0.116302490234375, 0.12255859375, 0.128814697265625, 0.13507080078125, 0.141326904296875, 0.1475830078125, 0.153839111328125, 0.16009521484375, 0.166351318359375, 0.172607421875, 0.178863525390625, 0.18511962890625, 0.191375732421875, 0.1976318359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 6.0, 5.0, 8.0, 16.0, 14.0, 18.0, 26.0, 23.0, 31.0, 33.0, 39.0, 49.0, 57.0, 63.0, 68.0, 63.0, 82.0, 51.0, 46.0, 55.0, 35.0, 28.0, 37.0, 22.0, 19.0, 18.0, 14.0, 9.0, 13.0, 7.0, 6.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2423095703125, -0.23499488830566406, -0.22768020629882812, -0.2203655242919922, -0.21305084228515625, -0.2057361602783203, -0.19842147827148438, -0.19110679626464844, -0.1837921142578125, -0.17647743225097656, -0.16916275024414062, -0.1618480682373047, -0.15453338623046875, -0.1472187042236328, -0.13990402221679688, -0.13258934020996094, -0.125274658203125, -0.11795997619628906, -0.11064529418945312, -0.10333061218261719, -0.09601593017578125, -0.08870124816894531, -0.08138656616210938, -0.07407188415527344, -0.0667572021484375, -0.05944252014160156, -0.052127838134765625, -0.04481315612792969, -0.03749847412109375, -0.030183792114257812, -0.022869110107421875, -0.015554428100585938, -0.00823974609375, -0.0009250640869140625, 0.006389617919921875, 0.013704299926757812, 0.02101898193359375, 0.028333663940429688, 0.035648345947265625, 0.04296302795410156, 0.0502777099609375, 0.05759239196777344, 0.06490707397460938, 0.07222175598144531, 0.07953643798828125, 0.08685111999511719, 0.09416580200195312, 0.10148048400878906, 0.108795166015625, 0.11610984802246094, 0.12342453002929688, 0.1307392120361328, 0.13805389404296875, 0.1453685760498047, 0.15268325805664062, 0.15999794006347656, 0.1673126220703125, 0.17462730407714844, 0.18194198608398438, 0.1892566680908203, 0.19657135009765625, 0.2038860321044922, 0.21120071411132812, 0.21851539611816406, 0.225830078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 7.0, 12.0, 7.0, 47.0, 95.0, 154.0, 222.0, 199.0, 134.0, 61.0, 30.0, 13.0, 5.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1180877685546875, -6.924006462097168, -6.729925155639648, -6.535843849182129, -6.341762542724609, -6.14768123626709, -5.95359992980957, -5.759518623352051, -5.565437316894531, -5.371356010437012, -5.177274703979492, -4.983193397521973, -4.789112091064453, -4.595030784606934, -4.400949478149414, -4.2068681716918945, -4.012786865234375, -3.8187055587768555, -3.624624252319336, -3.4305429458618164, -3.236461639404297, -3.0423803329467773, -2.848299026489258, -2.6542177200317383, -2.4601359367370605, -2.266054630279541, -2.0719733238220215, -1.877892017364502, -1.6838107109069824, -1.489729404449463, -1.2956479787826538, -1.1015666723251343, -0.9074854850769043, -0.7134041786193848, -0.5193228721618652, -0.3252415060997009, -0.1311601996421814, 0.06292110681533813, 0.25700247287750244, 0.451083779335022, 0.6451650857925415, 0.839246392250061, 1.0333276987075806, 1.2274091243743896, 1.4214904308319092, 1.6155717372894287, 1.8096530437469482, 2.0037343502044678, 2.1978156566619873, 2.391896963119507, 2.5859782695770264, 2.780059576034546, 2.9741408824920654, 3.168222188949585, 3.3623037338256836, 3.556385040283203, 3.7504663467407227, 3.944547653198242, 4.138628959655762, 4.332710266113281, 4.526791572570801, 4.72087287902832, 4.91495418548584, 5.109035491943359, 5.303116798400879]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 10.0, 11.0, 11.0, 13.0, 18.0, 13.0, 11.0, 18.0, 25.0, 24.0, 28.0, 24.0, 33.0, 29.0, 40.0, 38.0, 39.0, 43.0, 41.0, 44.0, 33.0, 37.0, 32.0, 27.0, 39.0, 40.0, 29.0, 36.0, 37.0, 25.0, 26.0, 21.0, 17.0, 14.0, 21.0, 4.0, 9.0, 9.0, 5.0, 5.0, 9.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6392848491668701, -1.5844029188156128, -1.529520869255066, -1.4746389389038086, -1.4197568893432617, -1.3648749589920044, -1.309993028640747, -1.2551109790802002, -1.2002290487289429, -1.1453471183776855, -1.0904650688171387, -1.0355831384658813, -0.9807011485099792, -0.9258191585540771, -0.8709372282028198, -0.8160552382469177, -0.7611732482910156, -0.7062912583351135, -0.6514092683792114, -0.5965273380279541, -0.541645348072052, -0.4867633581161499, -0.4318813979625702, -0.3769994378089905, -0.3221174478530884, -0.2672354578971863, -0.21235349774360657, -0.15747152268886566, -0.10258954763412476, -0.047707557678222656, 0.007174402475357056, 0.06205636262893677, 0.11693823337554932, 0.17182020843029022, 0.22670218348503113, 0.28158414363861084, 0.33646613359451294, 0.39134812355041504, 0.44623008370399475, 0.5011120438575745, 0.5559940338134766, 0.6108760237693787, 0.6657580137252808, 0.7206399440765381, 0.7755219340324402, 0.8304039239883423, 0.8852858543395996, 0.9401678442955017, 0.9950498342514038, 1.0499317646026611, 1.104813814163208, 1.1596957445144653, 1.2145776748657227, 1.2694597244262695, 1.3243416547775269, 1.3792235851287842, 1.434105634689331, 1.4889875650405884, 1.5438696146011353, 1.5987515449523926, 1.6536335945129395, 1.7085155248641968, 1.763397455215454, 1.818279504776001, 1.8731614351272583]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 10.0, 15.0, 17.0, 29.0, 44.0, 68.0, 101.0, 134.0, 180.0, 250.0, 384.0, 557.0, 816.0, 1202.0, 2126.0, 3523.0, 6493.0, 13432.0, 31728.0, 91680.0, 325470.0, 1113615.0, 1673050.0, 650410.0, 179982.0, 55362.0, 21258.0, 9719.0, 4997.0, 2798.0, 1668.0, 1040.0, 715.0, 428.0, 285.0, 212.0, 154.0, 102.0, 69.0, 46.0, 38.0, 22.0, 16.0, 9.0, 5.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.3359375, -0.3248405456542969, -0.31374359130859375, -0.3026466369628906, -0.2915496826171875, -0.2804527282714844, -0.26935577392578125, -0.2582588195800781, -0.247161865234375, -0.23606491088867188, -0.22496795654296875, -0.21387100219726562, -0.2027740478515625, -0.19167709350585938, -0.18058013916015625, -0.16948318481445312, -0.15838623046875, -0.14728927612304688, -0.13619232177734375, -0.12509536743164062, -0.1139984130859375, -0.10290145874023438, -0.09180450439453125, -0.08070755004882812, -0.069610595703125, -0.058513641357421875, -0.04741668701171875, -0.036319732666015625, -0.0252227783203125, -0.014125823974609375, -0.00302886962890625, 0.008068084716796875, 0.0191650390625, 0.030261993408203125, 0.04135894775390625, 0.052455902099609375, 0.0635528564453125, 0.07464981079101562, 0.08574676513671875, 0.09684371948242188, 0.107940673828125, 0.11903762817382812, 0.13013458251953125, 0.14123153686523438, 0.1523284912109375, 0.16342544555664062, 0.17452239990234375, 0.18561935424804688, 0.19671630859375, 0.20781326293945312, 0.21891021728515625, 0.23000717163085938, 0.2411041259765625, 0.2522010803222656, 0.26329803466796875, 0.2743949890136719, 0.285491943359375, 0.2965888977050781, 0.30768585205078125, 0.3187828063964844, 0.3298797607421875, 0.3409767150878906, 0.35207366943359375, 0.3631706237792969, 0.374267578125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 3.0, 7.0, 6.0, 6.0, 14.0, 15.0, 8.0, 20.0, 18.0, 14.0, 22.0, 27.0, 17.0, 28.0, 33.0, 33.0, 31.0, 36.0, 35.0, 42.0, 40.0, 45.0, 39.0, 42.0, 27.0, 41.0, 37.0, 24.0, 25.0, 38.0, 25.0, 22.0, 17.0, 30.0, 20.0, 14.0, 16.0, 21.0, 13.0, 9.0, 8.0, 4.0, 5.0, 7.0, 2.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2186279296875, -0.21173477172851562, -0.20484161376953125, -0.19794845581054688, -0.1910552978515625, -0.18416213989257812, -0.17726898193359375, -0.17037582397460938, -0.163482666015625, -0.15658950805664062, -0.14969635009765625, -0.14280319213867188, -0.1359100341796875, -0.12901687622070312, -0.12212371826171875, -0.11523056030273438, -0.10833740234375, -0.10144424438476562, -0.09455108642578125, -0.08765792846679688, -0.0807647705078125, -0.07387161254882812, -0.06697845458984375, -0.060085296630859375, -0.053192138671875, -0.046298980712890625, -0.03940582275390625, -0.032512664794921875, -0.0256195068359375, -0.018726348876953125, -0.01183319091796875, -0.004940032958984375, 0.001953125, 0.008846282958984375, 0.01573944091796875, 0.022632598876953125, 0.0295257568359375, 0.036418914794921875, 0.04331207275390625, 0.050205230712890625, 0.057098388671875, 0.06399154663085938, 0.07088470458984375, 0.07777786254882812, 0.0846710205078125, 0.09156417846679688, 0.09845733642578125, 0.10535049438476562, 0.11224365234375, 0.11913681030273438, 0.12602996826171875, 0.13292312622070312, 0.1398162841796875, 0.14670944213867188, 0.15360260009765625, 0.16049575805664062, 0.167388916015625, 0.17428207397460938, 0.18117523193359375, 0.18806838989257812, 0.1949615478515625, 0.20185470581054688, 0.20874786376953125, 0.21564102172851562, 0.2225341796875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 7.0, 10.0, 8.0, 25.0, 29.0, 39.0, 63.0, 81.0, 113.0, 176.0, 283.0, 435.0, 768.0, 1265.0, 2234.0, 4462.0, 9894.0, 25793.0, 84803.0, 398928.0, 2384233.0, 1036954.0, 169912.0, 44605.0, 15529.0, 6326.0, 3159.0, 1639.0, 950.0, 541.0, 323.0, 217.0, 150.0, 101.0, 58.0, 52.0, 25.0, 21.0, 15.0, 15.0, 11.0, 11.0, 7.0, 3.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5693359375, -0.5501937866210938, -0.5310516357421875, -0.5119094848632812, -0.492767333984375, -0.47362518310546875, -0.4544830322265625, -0.43534088134765625, -0.41619873046875, -0.39705657958984375, -0.3779144287109375, -0.35877227783203125, -0.339630126953125, -0.32048797607421875, -0.3013458251953125, -0.28220367431640625, -0.2630615234375, -0.24391937255859375, -0.2247772216796875, -0.20563507080078125, -0.186492919921875, -0.16735076904296875, -0.1482086181640625, -0.12906646728515625, -0.10992431640625, -0.09078216552734375, -0.0716400146484375, -0.05249786376953125, -0.033355712890625, -0.01421356201171875, 0.0049285888671875, 0.02407073974609375, 0.043212890625, 0.06235504150390625, 0.0814971923828125, 0.10063934326171875, 0.119781494140625, 0.13892364501953125, 0.1580657958984375, 0.17720794677734375, 0.19635009765625, 0.21549224853515625, 0.2346343994140625, 0.25377655029296875, 0.272918701171875, 0.29206085205078125, 0.3112030029296875, 0.33034515380859375, 0.3494873046875, 0.36862945556640625, 0.3877716064453125, 0.40691375732421875, 0.426055908203125, 0.44519805908203125, 0.4643402099609375, 0.48348236083984375, 0.50262451171875, 0.5217666625976562, 0.5409088134765625, 0.5600509643554688, 0.579193115234375, 0.5983352661132812, 0.6174774169921875, 0.6366195678710938, 0.65576171875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 7.0, 4.0, 7.0, 10.0, 16.0, 27.0, 26.0, 31.0, 41.0, 50.0, 77.0, 89.0, 117.0, 170.0, 264.0, 348.0, 502.0, 557.0, 497.0, 343.0, 231.0, 143.0, 115.0, 87.0, 61.0, 70.0, 45.0, 20.0, 22.0, 24.0, 16.0, 15.0, 7.0, 6.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.5078125, -0.49213409423828125, -0.4764556884765625, -0.46077728271484375, -0.445098876953125, -0.42942047119140625, -0.4137420654296875, -0.39806365966796875, -0.38238525390625, -0.36670684814453125, -0.3510284423828125, -0.33535003662109375, -0.319671630859375, -0.30399322509765625, -0.2883148193359375, -0.27263641357421875, -0.2569580078125, -0.24127960205078125, -0.2256011962890625, -0.20992279052734375, -0.194244384765625, -0.17856597900390625, -0.1628875732421875, -0.14720916748046875, -0.13153076171875, -0.11585235595703125, -0.1001739501953125, -0.08449554443359375, -0.068817138671875, -0.05313873291015625, -0.0374603271484375, -0.02178192138671875, -0.006103515625, 0.00957489013671875, 0.0252532958984375, 0.04093170166015625, 0.056610107421875, 0.07228851318359375, 0.0879669189453125, 0.10364532470703125, 0.11932373046875, 0.13500213623046875, 0.1506805419921875, 0.16635894775390625, 0.182037353515625, 0.19771575927734375, 0.2133941650390625, 0.22907257080078125, 0.2447509765625, 0.26042938232421875, 0.2761077880859375, 0.29178619384765625, 0.307464599609375, 0.32314300537109375, 0.3388214111328125, 0.35449981689453125, 0.37017822265625, 0.38585662841796875, 0.4015350341796875, 0.41721343994140625, 0.432891845703125, 0.44857025146484375, 0.4642486572265625, 0.47992706298828125, 0.49560546875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 6.0, 4.0, 6.0, 18.0, 30.0, 45.0, 65.0, 119.0, 115.0, 180.0, 154.0, 93.0, 82.0, 31.0, 19.0, 14.0, 10.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7933478355407715, -3.649268865585327, -3.505189895629883, -3.3611106872558594, -3.217031717300415, -3.0729527473449707, -2.9288735389709473, -2.784794569015503, -2.6407155990600586, -2.4966366291046143, -2.35255765914917, -2.2084784507751465, -2.064399480819702, -1.9203205108642578, -1.776241421699524, -1.63216233253479, -1.4880833625793457, -1.3440043926239014, -1.1999253034591675, -1.0558462142944336, -0.9117672443389893, -0.7676882147789001, -0.623609185218811, -0.47953009605407715, -0.3354511260986328, -0.1913720965385437, -0.04729306697845459, 0.09678596258163452, 0.24086499214172363, 0.38494402170181274, 0.5290230512619019, 0.6731021404266357, 0.8171811103820801, 0.9612601399421692, 1.1053391695022583, 1.2494182586669922, 1.3934972286224365, 1.5375761985778809, 1.6816552877426147, 1.8257343769073486, 1.969813346862793, 2.1138923168182373, 2.2579712867736816, 2.402050495147705, 2.5461294651031494, 2.6902084350585938, 2.834287643432617, 2.9783666133880615, 3.122445583343506, 3.26652455329895, 3.4106035232543945, 3.554682731628418, 3.6987617015838623, 3.8428406715393066, 3.98691987991333, 4.130998611450195, 4.275077819824219, 4.419157028198242, 4.563235759735107, 4.707314968109131, 4.851393699645996, 4.9954729080200195, 5.139552116394043, 5.283631324768066, 5.427710056304932]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 8.0, 6.0, 8.0, 11.0, 10.0, 14.0, 20.0, 16.0, 16.0, 21.0, 19.0, 29.0, 23.0, 32.0, 36.0, 37.0, 28.0, 35.0, 27.0, 28.0, 36.0, 44.0, 26.0, 31.0, 32.0, 39.0, 38.0, 36.0, 35.0, 29.0, 34.0, 33.0, 20.0, 24.0, 18.0, 10.0, 17.0, 14.0, 10.0, 11.0, 10.0, 4.0, 10.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5321400165557861, -1.485368251800537, -1.438596487045288, -1.391824722290039, -1.34505295753479, -1.298281192779541, -1.251509428024292, -1.204737663269043, -1.157965898513794, -1.111194133758545, -1.064422369003296, -1.0176506042480469, -0.9708788394927979, -0.9241070747375488, -0.877335250377655, -0.830563485622406, -0.7837916612625122, -0.7370198965072632, -0.6902481317520142, -0.6434763669967651, -0.5967046022415161, -0.5499328374862671, -0.5031610131263733, -0.45638924837112427, -0.40961748361587524, -0.3628457188606262, -0.3160739541053772, -0.2693021595478058, -0.22253039479255676, -0.17575863003730774, -0.12898683547973633, -0.0822150707244873, -0.03544342517852783, 0.011328347027301788, 0.05810011923313141, 0.10487189888954163, 0.15164366364479065, 0.19841542840003967, 0.24518722295761108, 0.2919589877128601, 0.33873075246810913, 0.38550251722335815, 0.4322742819786072, 0.4790460765361786, 0.52581787109375, 0.572589635848999, 0.619361400604248, 0.6661331653594971, 0.7129049301147461, 0.7596766948699951, 0.8064484596252441, 0.8532202243804932, 0.8999919891357422, 0.9467637538909912, 0.993535578250885, 1.0403072834014893, 1.0870790481567383, 1.1338508129119873, 1.1806225776672363, 1.2273943424224854, 1.2741661071777344, 1.3209378719329834, 1.3677096366882324, 1.4144814014434814, 1.46125328540802]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 4.0, 8.0, 16.0, 13.0, 29.0, 32.0, 59.0, 63.0, 91.0, 145.0, 221.0, 310.0, 432.0, 649.0, 979.0, 1634.0, 2692.0, 4463.0, 8613.0, 18235.0, 42246.0, 104633.0, 233815.0, 303695.0, 185127.0, 77609.0, 31516.0, 14316.0, 6932.0, 3787.0, 2143.0, 1417.0, 874.0, 521.0, 384.0, 271.0, 193.0, 121.0, 76.0, 50.0, 37.0, 38.0, 11.0, 15.0, 10.0, 10.0, 11.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.429443359375, -0.4157371520996094, -0.40203094482421875, -0.3883247375488281, -0.3746185302734375, -0.3609123229980469, -0.34720611572265625, -0.3334999084472656, -0.319793701171875, -0.3060874938964844, -0.29238128662109375, -0.2786750793457031, -0.2649688720703125, -0.2512626647949219, -0.23755645751953125, -0.22385025024414062, -0.21014404296875, -0.19643783569335938, -0.18273162841796875, -0.16902542114257812, -0.1553192138671875, -0.14161300659179688, -0.12790679931640625, -0.11420059204101562, -0.100494384765625, -0.08678817749023438, -0.07308197021484375, -0.059375762939453125, -0.0456695556640625, -0.031963348388671875, -0.01825714111328125, -0.004550933837890625, 0.0091552734375, 0.022861480712890625, 0.03656768798828125, 0.050273895263671875, 0.0639801025390625, 0.07768630981445312, 0.09139251708984375, 0.10509872436523438, 0.118804931640625, 0.13251113891601562, 0.14621734619140625, 0.15992355346679688, 0.1736297607421875, 0.18733596801757812, 0.20104217529296875, 0.21474838256835938, 0.22845458984375, 0.24216079711914062, 0.25586700439453125, 0.2695732116699219, 0.2832794189453125, 0.2969856262207031, 0.31069183349609375, 0.3243980407714844, 0.338104248046875, 0.3518104553222656, 0.36551666259765625, 0.3792228698730469, 0.3929290771484375, 0.4066352844238281, 0.42034149169921875, 0.4340476989746094, 0.44775390625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 7.0, 11.0, 11.0, 18.0, 15.0, 16.0, 22.0, 18.0, 28.0, 39.0, 31.0, 28.0, 22.0, 29.0, 38.0, 38.0, 41.0, 27.0, 40.0, 33.0, 32.0, 37.0, 41.0, 42.0, 41.0, 37.0, 22.0, 22.0, 30.0, 25.0, 27.0, 23.0, 13.0, 11.0, 18.0, 13.0, 9.0, 8.0, 3.0, 5.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.25830078125, -0.25070953369140625, -0.2431182861328125, -0.23552703857421875, -0.227935791015625, -0.22034454345703125, -0.2127532958984375, -0.20516204833984375, -0.19757080078125, -0.18997955322265625, -0.1823883056640625, -0.17479705810546875, -0.167205810546875, -0.15961456298828125, -0.1520233154296875, -0.14443206787109375, -0.1368408203125, -0.12924957275390625, -0.1216583251953125, -0.11406707763671875, -0.106475830078125, -0.09888458251953125, -0.0912933349609375, -0.08370208740234375, -0.07611083984375, -0.06851959228515625, -0.0609283447265625, -0.05333709716796875, -0.045745849609375, -0.03815460205078125, -0.0305633544921875, -0.02297210693359375, -0.015380859375, -0.00778961181640625, -0.0001983642578125, 0.00739288330078125, 0.014984130859375, 0.02257537841796875, 0.0301666259765625, 0.03775787353515625, 0.04534912109375, 0.05294036865234375, 0.0605316162109375, 0.06812286376953125, 0.075714111328125, 0.08330535888671875, 0.0908966064453125, 0.09848785400390625, 0.1060791015625, 0.11367034912109375, 0.1212615966796875, 0.12885284423828125, 0.136444091796875, 0.14403533935546875, 0.1516265869140625, 0.15921783447265625, 0.16680908203125, 0.17440032958984375, 0.1819915771484375, 0.18958282470703125, 0.197174072265625, 0.20476531982421875, 0.2123565673828125, 0.21994781494140625, 0.2275390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 10.0, 12.0, 20.0, 25.0, 37.0, 67.0, 98.0, 154.0, 215.0, 450.0, 724.0, 1267.0, 2378.0, 4913.0, 10178.0, 23784.0, 63107.0, 176463.0, 341401.0, 258171.0, 100668.0, 35897.0, 14607.0, 6709.0, 3186.0, 1703.0, 933.0, 516.0, 337.0, 190.0, 114.0, 65.0, 52.0, 32.0, 23.0, 13.0, 11.0, 9.0, 7.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5, -0.4855995178222656, -0.47119903564453125, -0.4567985534667969, -0.4423980712890625, -0.4279975891113281, -0.41359710693359375, -0.3991966247558594, -0.384796142578125, -0.3703956604003906, -0.35599517822265625, -0.3415946960449219, -0.3271942138671875, -0.3127937316894531, -0.29839324951171875, -0.2839927673339844, -0.26959228515625, -0.2551918029785156, -0.24079132080078125, -0.22639083862304688, -0.2119903564453125, -0.19758987426757812, -0.18318939208984375, -0.16878890991210938, -0.154388427734375, -0.13998794555664062, -0.12558746337890625, -0.11118698120117188, -0.0967864990234375, -0.08238601684570312, -0.06798553466796875, -0.053585052490234375, -0.0391845703125, -0.024784088134765625, -0.01038360595703125, 0.004016876220703125, 0.0184173583984375, 0.032817840576171875, 0.04721832275390625, 0.061618804931640625, 0.076019287109375, 0.09041976928710938, 0.10482025146484375, 0.11922073364257812, 0.1336212158203125, 0.14802169799804688, 0.16242218017578125, 0.17682266235351562, 0.19122314453125, 0.20562362670898438, 0.22002410888671875, 0.23442459106445312, 0.2488250732421875, 0.2632255554199219, 0.27762603759765625, 0.2920265197753906, 0.306427001953125, 0.3208274841308594, 0.33522796630859375, 0.3496284484863281, 0.3640289306640625, 0.3784294128417969, 0.39282989501953125, 0.4072303771972656, 0.421630859375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 8.0, 5.0, 6.0, 12.0, 14.0, 18.0, 18.0, 22.0, 24.0, 33.0, 39.0, 31.0, 44.0, 47.0, 50.0, 62.0, 39.0, 56.0, 57.0, 43.0, 48.0, 32.0, 27.0, 39.0, 45.0, 31.0, 26.0, 20.0, 21.0, 21.0, 18.0, 8.0, 11.0, 6.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87109375, -0.844970703125, -0.81884765625, -0.792724609375, -0.7666015625, -0.740478515625, -0.71435546875, -0.688232421875, -0.662109375, -0.635986328125, -0.60986328125, -0.583740234375, -0.5576171875, -0.531494140625, -0.50537109375, -0.479248046875, -0.453125, -0.427001953125, -0.40087890625, -0.374755859375, -0.3486328125, -0.322509765625, -0.29638671875, -0.270263671875, -0.244140625, -0.218017578125, -0.19189453125, -0.165771484375, -0.1396484375, -0.113525390625, -0.08740234375, -0.061279296875, -0.03515625, -0.009033203125, 0.01708984375, 0.043212890625, 0.0693359375, 0.095458984375, 0.12158203125, 0.147705078125, 0.173828125, 0.199951171875, 0.22607421875, 0.252197265625, 0.2783203125, 0.304443359375, 0.33056640625, 0.356689453125, 0.3828125, 0.408935546875, 0.43505859375, 0.461181640625, 0.4873046875, 0.513427734375, 0.53955078125, 0.565673828125, 0.591796875, 0.617919921875, 0.64404296875, 0.670166015625, 0.6962890625, 0.722412109375, 0.74853515625, 0.774658203125, 0.80078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 8.0, 2.0, 7.0, 11.0, 19.0, 28.0, 47.0, 58.0, 88.0, 148.0, 202.0, 354.0, 542.0, 866.0, 1459.0, 2572.0, 4519.0, 8680.0, 17459.0, 37608.0, 85885.0, 202042.0, 318720.0, 204679.0, 87209.0, 38182.0, 17444.0, 8707.0, 4580.0, 2658.0, 1391.0, 864.0, 544.0, 369.0, 214.0, 119.0, 110.0, 60.0, 35.0, 29.0, 15.0, 12.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1971435546875, -0.1915912628173828, -0.18603897094726562, -0.18048667907714844, -0.17493438720703125, -0.16938209533691406, -0.16382980346679688, -0.1582775115966797, -0.1527252197265625, -0.1471729278564453, -0.14162063598632812, -0.13606834411621094, -0.13051605224609375, -0.12496376037597656, -0.11941146850585938, -0.11385917663574219, -0.108306884765625, -0.10275459289550781, -0.09720230102539062, -0.09165000915527344, -0.08609771728515625, -0.08054542541503906, -0.07499313354492188, -0.06944084167480469, -0.0638885498046875, -0.05833625793457031, -0.052783966064453125, -0.04723167419433594, -0.04167938232421875, -0.03612709045410156, -0.030574798583984375, -0.025022506713867188, -0.01947021484375, -0.013917922973632812, -0.008365631103515625, -0.0028133392333984375, 0.00273895263671875, 0.008291244506835938, 0.013843536376953125, 0.019395828247070312, 0.0249481201171875, 0.030500411987304688, 0.036052703857421875, 0.04160499572753906, 0.04715728759765625, 0.05270957946777344, 0.058261871337890625, 0.06381416320800781, 0.069366455078125, 0.07491874694824219, 0.08047103881835938, 0.08602333068847656, 0.09157562255859375, 0.09712791442871094, 0.10268020629882812, 0.10823249816894531, 0.1137847900390625, 0.11933708190917969, 0.12488937377929688, 0.13044166564941406, 0.13599395751953125, 0.14154624938964844, 0.14709854125976562, 0.1526508331298828, 0.158203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 11.0, 5.0, 16.0, 19.0, 15.0, 40.0, 36.0, 49.0, 50.0, 85.0, 93.0, 109.0, 95.0, 88.0, 58.0, 43.0, 40.0, 31.0, 23.0, 14.0, 14.0, 9.0, 8.0, 7.0, 4.0, 3.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.0677528381347656e-05, -5.8564357459545135e-05, -5.6451186537742615e-05, -5.4338015615940094e-05, -5.222484469413757e-05, -5.011167377233505e-05, -4.799850285053253e-05, -4.588533192873001e-05, -4.377216100692749e-05, -4.165899008512497e-05, -3.954581916332245e-05, -3.743264824151993e-05, -3.531947731971741e-05, -3.3206306397914886e-05, -3.1093135476112366e-05, -2.8979964554309845e-05, -2.6866793632507324e-05, -2.4753622710704803e-05, -2.2640451788902283e-05, -2.0527280867099762e-05, -1.841410994529724e-05, -1.630093902349472e-05, -1.41877681016922e-05, -1.2074597179889679e-05, -9.961426258087158e-06, -7.848255336284637e-06, -5.735084414482117e-06, -3.621913492679596e-06, -1.5087425708770752e-06, 6.044283509254456e-07, 2.7175992727279663e-06, 4.830770194530487e-06, 6.943941116333008e-06, 9.057112038135529e-06, 1.117028295993805e-05, 1.328345388174057e-05, 1.539662480354309e-05, 1.750979572534561e-05, 1.9622966647148132e-05, 2.1736137568950653e-05, 2.3849308490753174e-05, 2.5962479412555695e-05, 2.8075650334358215e-05, 3.0188821256160736e-05, 3.230199217796326e-05, 3.441516309976578e-05, 3.65283340215683e-05, 3.864150494337082e-05, 4.075467586517334e-05, 4.286784678697586e-05, 4.498101770877838e-05, 4.70941886305809e-05, 4.920735955238342e-05, 5.1320530474185944e-05, 5.3433701395988464e-05, 5.5546872317790985e-05, 5.7660043239593506e-05, 5.9773214161396027e-05, 6.188638508319855e-05, 6.399955600500107e-05, 6.611272692680359e-05, 6.822589784860611e-05, 7.033906877040863e-05, 7.245223969221115e-05, 7.456541061401367e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 16.0, 18.0, 22.0, 30.0, 31.0, 59.0, 86.0, 130.0, 203.0, 312.0, 466.0, 765.0, 1239.0, 1903.0, 3109.0, 4933.0, 7859.0, 13276.0, 22626.0, 39405.0, 70163.0, 122539.0, 190666.0, 209918.0, 149748.0, 88356.0, 50058.0, 28355.0, 16436.0, 9813.0, 6109.0, 3648.0, 2285.0, 1480.0, 852.0, 550.0, 346.0, 250.0, 176.0, 105.0, 77.0, 40.0, 30.0, 26.0, 13.0, 9.0, 4.0, 6.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11175537109375, -0.10792827606201172, -0.10410118103027344, -0.10027408599853516, -0.09644699096679688, -0.0926198959350586, -0.08879280090332031, -0.08496570587158203, -0.08113861083984375, -0.07731151580810547, -0.07348442077636719, -0.0696573257446289, -0.06583023071289062, -0.062003135681152344, -0.05817604064941406, -0.05434894561767578, -0.0505218505859375, -0.04669475555419922, -0.04286766052246094, -0.039040565490722656, -0.035213470458984375, -0.031386375427246094, -0.027559280395507812, -0.02373218536376953, -0.01990509033203125, -0.01607799530029297, -0.012250900268554688, -0.008423805236816406, -0.004596710205078125, -0.0007696151733398438, 0.0030574798583984375, 0.006884574890136719, 0.010711669921875, 0.014538764953613281, 0.018365859985351562, 0.022192955017089844, 0.026020050048828125, 0.029847145080566406, 0.03367424011230469, 0.03750133514404297, 0.04132843017578125, 0.04515552520751953, 0.04898262023925781, 0.052809715270996094, 0.056636810302734375, 0.060463905334472656, 0.06429100036621094, 0.06811809539794922, 0.0719451904296875, 0.07577228546142578, 0.07959938049316406, 0.08342647552490234, 0.08725357055664062, 0.0910806655883789, 0.09490776062011719, 0.09873485565185547, 0.10256195068359375, 0.10638904571533203, 0.11021614074707031, 0.1140432357788086, 0.11787033081054688, 0.12169742584228516, 0.12552452087402344, 0.12935161590576172, 0.1331787109375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 15.0, 9.0, 16.0, 20.0, 17.0, 15.0, 20.0, 31.0, 38.0, 38.0, 58.0, 53.0, 60.0, 47.0, 52.0, 66.0, 58.0, 43.0, 49.0, 33.0, 23.0, 24.0, 25.0, 26.0, 22.0, 24.0, 13.0, 12.0, 11.0, 9.0, 7.0, 4.0, 13.0, 4.0, 5.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1829833984375, -0.1775360107421875, -0.172088623046875, -0.1666412353515625, -0.16119384765625, -0.1557464599609375, -0.150299072265625, -0.1448516845703125, -0.139404296875, -0.1339569091796875, -0.128509521484375, -0.1230621337890625, -0.11761474609375, -0.1121673583984375, -0.106719970703125, -0.1012725830078125, -0.0958251953125, -0.0903778076171875, -0.084930419921875, -0.0794830322265625, -0.07403564453125, -0.0685882568359375, -0.063140869140625, -0.0576934814453125, -0.05224609375, -0.0467987060546875, -0.041351318359375, -0.0359039306640625, -0.03045654296875, -0.0250091552734375, -0.019561767578125, -0.0141143798828125, -0.0086669921875, -0.0032196044921875, 0.002227783203125, 0.0076751708984375, 0.01312255859375, 0.0185699462890625, 0.024017333984375, 0.0294647216796875, 0.034912109375, 0.0403594970703125, 0.045806884765625, 0.0512542724609375, 0.05670166015625, 0.0621490478515625, 0.067596435546875, 0.0730438232421875, 0.0784912109375, 0.0839385986328125, 0.089385986328125, 0.0948333740234375, 0.10028076171875, 0.1057281494140625, 0.111175537109375, 0.1166229248046875, 0.1220703125, 0.1275177001953125, 0.132965087890625, 0.1384124755859375, 0.14385986328125, 0.1493072509765625, 0.154754638671875, 0.1602020263671875, 0.1656494140625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 19.0, 28.0, 113.0, 195.0, 225.0, 206.0, 119.0, 50.0, 19.0, 10.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.889909744262695, -8.674944877624512, -8.459980010986328, -8.245015144348145, -8.030050277709961, -7.815085411071777, -7.600120544433594, -7.385156154632568, -7.170191287994385, -6.955226421356201, -6.740261554718018, -6.525296688079834, -6.31033182144165, -6.095367431640625, -5.880402565002441, -5.665437698364258, -5.450472831726074, -5.235507965087891, -5.020543098449707, -4.805578231811523, -4.59061336517334, -4.375648498535156, -4.160683631896973, -3.9457192420959473, -3.7307538986206055, -3.515789031982422, -3.3008241653442383, -3.0858592987060547, -2.87089467048645, -2.6559298038482666, -2.440964937210083, -2.2260003089904785, -2.011035442352295, -1.7960705757141113, -1.5811058282852173, -1.3661409616470337, -1.1511762142181396, -0.936211347579956, -0.7212464809417725, -0.5062817335128784, -0.2913168668746948, -0.07635204493999481, 0.1386127769947052, 0.3535776138305664, 0.5685424208641052, 0.783507227897644, 0.9984720945358276, 1.2134368419647217, 1.4284017086029053, 1.6433665752410889, 1.858331322669983, 2.073296070098877, 2.2882609367370605, 2.503225803375244, 2.7181906700134277, 2.9331555366516113, 3.148120403289795, 3.3630852699279785, 3.578050136566162, 3.7930150032043457, 4.007979869842529, 4.222944259643555, 4.437909126281738, 4.652873992919922, 4.8678388595581055]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 4.0, 3.0, 6.0, 6.0, 12.0, 11.0, 11.0, 12.0, 16.0, 18.0, 21.0, 25.0, 20.0, 22.0, 30.0, 31.0, 29.0, 31.0, 36.0, 31.0, 48.0, 30.0, 39.0, 47.0, 45.0, 34.0, 33.0, 38.0, 42.0, 32.0, 26.0, 28.0, 35.0, 17.0, 25.0, 31.0, 7.0, 14.0, 14.0, 7.0, 5.0, 4.0, 4.0, 5.0, 5.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6282906532287598, -1.573364019393921, -1.5184375047683716, -1.4635108709335327, -1.4085842370986938, -1.3536577224731445, -1.2987310886383057, -1.2438044548034668, -1.1888779401779175, -1.1339513063430786, -1.0790247917175293, -1.0240981578826904, -0.9691715836524963, -0.9142450094223022, -0.8593183755874634, -0.8043918013572693, -0.7494651675224304, -0.6945385932922363, -0.6396119594573975, -0.5846853852272034, -0.5297588109970093, -0.4748322069644928, -0.4199056029319763, -0.3649790287017822, -0.31005242466926575, -0.25512582063674927, -0.20019924640655518, -0.1452726423740387, -0.09034605324268341, -0.035419464111328125, 0.019507139921188354, 0.07443371415138245, 0.12936031818389893, 0.1842869073152542, 0.2392134964466095, 0.294140100479126, 0.34906667470932007, 0.40399327874183655, 0.458919882774353, 0.5138464570045471, 0.5687730312347412, 0.6236996054649353, 0.6786262392997742, 0.7335528135299683, 0.7884793877601624, 0.8434059619903564, 0.8983325958251953, 0.9532591700553894, 1.008185863494873, 1.063112497329712, 1.1180390119552612, 1.1729656457901, 1.227892279624939, 1.2828187942504883, 1.3377454280853271, 1.392672061920166, 1.4475985765457153, 1.5025252103805542, 1.5574517250061035, 1.6123783588409424, 1.6673049926757812, 1.7222315073013306, 1.7771581411361694, 1.8320846557617188, 1.8870112895965576]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 3.0, 9.0, 4.0, 4.0, 15.0, 8.0, 30.0, 32.0, 51.0, 52.0, 98.0, 103.0, 141.0, 185.0, 277.0, 400.0, 633.0, 1063.0, 1803.0, 3130.0, 5997.0, 12554.0, 30390.0, 95868.0, 415304.0, 1652136.0, 1481583.0, 353373.0, 85524.0, 28176.0, 11611.0, 5718.0, 3028.0, 1768.0, 1066.0, 688.0, 394.0, 297.0, 210.0, 157.0, 97.0, 75.0, 65.0, 45.0, 26.0, 13.0, 17.0, 24.0, 11.0, 10.0, 4.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.400146484375, -0.3863258361816406, -0.37250518798828125, -0.3586845397949219, -0.3448638916015625, -0.3310432434082031, -0.31722259521484375, -0.3034019470214844, -0.289581298828125, -0.2757606506347656, -0.26194000244140625, -0.24811935424804688, -0.2342987060546875, -0.22047805786132812, -0.20665740966796875, -0.19283676147460938, -0.17901611328125, -0.16519546508789062, -0.15137481689453125, -0.13755416870117188, -0.1237335205078125, -0.10991287231445312, -0.09609222412109375, -0.08227157592773438, -0.068450927734375, -0.054630279541015625, -0.04080963134765625, -0.026988983154296875, -0.0131683349609375, 0.000652313232421875, 0.01447296142578125, 0.028293609619140625, 0.0421142578125, 0.055934906005859375, 0.06975555419921875, 0.08357620239257812, 0.0973968505859375, 0.11121749877929688, 0.12503814697265625, 0.13885879516601562, 0.152679443359375, 0.16650009155273438, 0.18032073974609375, 0.19414138793945312, 0.2079620361328125, 0.22178268432617188, 0.23560333251953125, 0.24942398071289062, 0.26324462890625, 0.2770652770996094, 0.29088592529296875, 0.3047065734863281, 0.3185272216796875, 0.3323478698730469, 0.34616851806640625, 0.3599891662597656, 0.373809814453125, 0.3876304626464844, 0.40145111083984375, 0.4152717590332031, 0.4290924072265625, 0.4429130554199219, 0.45673370361328125, 0.4705543518066406, 0.484375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 8.0, 7.0, 6.0, 13.0, 9.0, 18.0, 16.0, 21.0, 25.0, 32.0, 23.0, 25.0, 39.0, 37.0, 46.0, 46.0, 52.0, 35.0, 34.0, 31.0, 42.0, 45.0, 33.0, 37.0, 33.0, 32.0, 27.0, 35.0, 37.0, 28.0, 29.0, 14.0, 17.0, 16.0, 11.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.287841796875, -0.2797889709472656, -0.27173614501953125, -0.2636833190917969, -0.2556304931640625, -0.24757766723632812, -0.23952484130859375, -0.23147201538085938, -0.223419189453125, -0.21536636352539062, -0.20731353759765625, -0.19926071166992188, -0.1912078857421875, -0.18315505981445312, -0.17510223388671875, -0.16704940795898438, -0.15899658203125, -0.15094375610351562, -0.14289093017578125, -0.13483810424804688, -0.1267852783203125, -0.11873245239257812, -0.11067962646484375, -0.10262680053710938, -0.094573974609375, -0.08652114868164062, -0.07846832275390625, -0.07041549682617188, -0.0623626708984375, -0.054309844970703125, -0.04625701904296875, -0.038204193115234375, -0.0301513671875, -0.022098541259765625, -0.01404571533203125, -0.005992889404296875, 0.0020599365234375, 0.010112762451171875, 0.01816558837890625, 0.026218414306640625, 0.034271240234375, 0.042324066162109375, 0.05037689208984375, 0.058429718017578125, 0.0664825439453125, 0.07453536987304688, 0.08258819580078125, 0.09064102172851562, 0.09869384765625, 0.10674667358398438, 0.11479949951171875, 0.12285232543945312, 0.1309051513671875, 0.13895797729492188, 0.14701080322265625, 0.15506362915039062, 0.163116455078125, 0.17116928100585938, 0.17922210693359375, 0.18727493286132812, 0.1953277587890625, 0.20338058471679688, 0.21143341064453125, 0.21948623657226562, 0.2275390625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 14.0, 7.0, 10.0, 11.0, 18.0, 43.0, 42.0, 68.0, 79.0, 123.0, 196.0, 268.0, 383.0, 545.0, 865.0, 1290.0, 1966.0, 3172.0, 5190.0, 9084.0, 17002.0, 33708.0, 76096.0, 204619.0, 743618.0, 2026978.0, 721687.0, 199408.0, 74479.0, 33313.0, 16686.0, 8951.0, 5260.0, 3175.0, 1977.0, 1268.0, 825.0, 583.0, 393.0, 258.0, 177.0, 141.0, 93.0, 63.0, 52.0, 22.0, 25.0, 11.0, 12.0, 10.0, 8.0, 2.0, 2.0, 5.0, 2.0, 3.0], "bins": [-0.40625, -0.3941192626953125, -0.381988525390625, -0.3698577880859375, -0.35772705078125, -0.3455963134765625, -0.333465576171875, -0.3213348388671875, -0.3092041015625, -0.2970733642578125, -0.284942626953125, -0.2728118896484375, -0.26068115234375, -0.2485504150390625, -0.236419677734375, -0.2242889404296875, -0.212158203125, -0.2000274658203125, -0.187896728515625, -0.1757659912109375, -0.16363525390625, -0.1515045166015625, -0.139373779296875, -0.1272430419921875, -0.1151123046875, -0.1029815673828125, -0.090850830078125, -0.0787200927734375, -0.06658935546875, -0.0544586181640625, -0.042327880859375, -0.0301971435546875, -0.01806640625, -0.0059356689453125, 0.006195068359375, 0.0183258056640625, 0.03045654296875, 0.0425872802734375, 0.054718017578125, 0.0668487548828125, 0.0789794921875, 0.0911102294921875, 0.103240966796875, 0.1153717041015625, 0.12750244140625, 0.1396331787109375, 0.151763916015625, 0.1638946533203125, 0.176025390625, 0.1881561279296875, 0.200286865234375, 0.2124176025390625, 0.22454833984375, 0.2366790771484375, 0.248809814453125, 0.2609405517578125, 0.2730712890625, 0.2852020263671875, 0.297332763671875, 0.3094635009765625, 0.32159423828125, 0.3337249755859375, 0.345855712890625, 0.3579864501953125, 0.3701171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 5.0, 5.0, 10.0, 13.0, 28.0, 25.0, 30.0, 40.0, 65.0, 93.0, 130.0, 183.0, 266.0, 491.0, 644.0, 667.0, 420.0, 320.0, 187.0, 119.0, 84.0, 61.0, 43.0, 29.0, 26.0, 16.0, 16.0, 13.0, 8.0, 7.0, 9.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65673828125, -0.6373977661132812, -0.6180572509765625, -0.5987167358398438, -0.579376220703125, -0.5600357055664062, -0.5406951904296875, -0.5213546752929688, -0.50201416015625, -0.48267364501953125, -0.4633331298828125, -0.44399261474609375, -0.424652099609375, -0.40531158447265625, -0.3859710693359375, -0.36663055419921875, -0.3472900390625, -0.32794952392578125, -0.3086090087890625, -0.28926849365234375, -0.269927978515625, -0.25058746337890625, -0.2312469482421875, -0.21190643310546875, -0.19256591796875, -0.17322540283203125, -0.1538848876953125, -0.13454437255859375, -0.115203857421875, -0.09586334228515625, -0.0765228271484375, -0.05718231201171875, -0.037841796875, -0.01850128173828125, 0.0008392333984375, 0.02017974853515625, 0.039520263671875, 0.05886077880859375, 0.0782012939453125, 0.09754180908203125, 0.11688232421875, 0.13622283935546875, 0.1555633544921875, 0.17490386962890625, 0.194244384765625, 0.21358489990234375, 0.2329254150390625, 0.25226593017578125, 0.2716064453125, 0.29094696044921875, 0.3102874755859375, 0.32962799072265625, 0.348968505859375, 0.36830902099609375, 0.3876495361328125, 0.40699005126953125, 0.42633056640625, 0.44567108154296875, 0.4650115966796875, 0.48435211181640625, 0.503692626953125, 0.5230331420898438, 0.5423736572265625, 0.5617141723632812, 0.5810546875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 9.0, 12.0, 17.0, 31.0, 54.0, 84.0, 111.0, 137.0, 130.0, 122.0, 106.0, 61.0, 35.0, 31.0, 24.0, 11.0, 9.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.198857307434082, -3.0600762367248535, -2.921294927597046, -2.7825136184692383, -2.6437325477600098, -2.5049514770507812, -2.3661701679229736, -2.227388858795166, -2.0886077880859375, -1.9498265981674194, -1.8110454082489014, -1.6722642183303833, -1.5334830284118652, -1.3947018384933472, -1.255920648574829, -1.117139458656311, -0.978358268737793, -0.8395770788192749, -0.7007958889007568, -0.5620146989822388, -0.4232335090637207, -0.28445231914520264, -0.14567112922668457, -0.006889939308166504, 0.13189125061035156, 0.27067244052886963, 0.4094536304473877, 0.5482348203659058, 0.6870160102844238, 0.8257972002029419, 0.96457839012146, 1.103359580039978, 1.242140293121338, 1.380921483039856, 1.519702672958374, 1.658483862876892, 1.7972650527954102, 1.9360462427139282, 2.0748274326324463, 2.213608741760254, 2.3523898124694824, 2.491170883178711, 2.6299521923065186, 2.768733501434326, 2.9075145721435547, 3.046295642852783, 3.185076951980591, 3.3238582611083984, 3.462639331817627, 3.6014204025268555, 3.740201711654663, 3.8789830207824707, 4.017764091491699, 4.156545162200928, 4.295326232910156, 4.434107780456543, 4.5728888511657715, 4.711669921875, 4.850451469421387, 4.989232540130615, 5.128013610839844, 5.266794681549072, 5.405575752258301, 5.5443572998046875, 5.683138370513916]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 9.0, 4.0, 9.0, 5.0, 7.0, 15.0, 16.0, 12.0, 19.0, 21.0, 34.0, 21.0, 26.0, 42.0, 34.0, 39.0, 45.0, 38.0, 38.0, 52.0, 39.0, 39.0, 44.0, 38.0, 42.0, 44.0, 35.0, 24.0, 33.0, 22.0, 30.0, 17.0, 20.0, 17.0, 12.0, 10.0, 11.0, 7.0, 3.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0], "bins": [-2.0705385208129883, -2.0139200687408447, -1.9573014974594116, -1.900683045387268, -1.844064474105835, -1.7874460220336914, -1.7308274507522583, -1.6742089986801147, -1.6175904273986816, -1.560971975326538, -1.504353404045105, -1.4477349519729614, -1.3911163806915283, -1.3344979286193848, -1.2778793573379517, -1.221260905265808, -1.164642333984375, -1.1080238819122314, -1.0514053106307983, -0.99478679895401, -0.9381682872772217, -0.8815498352050781, -0.824931263923645, -0.7683128118515015, -0.7116943597793579, -0.6550758481025696, -0.5984573364257812, -0.5418388247489929, -0.4852203130722046, -0.42860183119773865, -0.3719833195209503, -0.315364807844162, -0.25874626636505127, -0.20212775468826294, -0.1455092430114746, -0.08889074623584747, -0.03227223455905914, 0.024346262216567993, 0.08096477389335632, 0.13758328557014465, 0.19420179724693298, 0.2508203089237213, 0.30743882060050964, 0.3640573024749756, 0.4206758141517639, 0.47729432582855225, 0.5339128375053406, 0.5905313491821289, 0.6471498608589172, 0.7037683725357056, 0.7603868842124939, 0.8170053958892822, 0.8736239075660706, 0.9302424192428589, 0.9868608713150024, 1.0434794425964355, 1.100097894668579, 1.1567163467407227, 1.2133349180221558, 1.2699533700942993, 1.3265719413757324, 1.383190393447876, 1.439808964729309, 1.4964274168014526, 1.5530459880828857]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 10.0, 23.0, 22.0, 29.0, 39.0, 78.0, 104.0, 132.0, 228.0, 329.0, 543.0, 970.0, 1476.0, 2451.0, 4113.0, 7023.0, 11828.0, 20595.0, 35713.0, 62053.0, 102763.0, 157048.0, 193805.0, 167764.0, 114289.0, 69529.0, 39847.0, 22944.0, 13450.0, 7746.0, 4460.0, 2648.0, 1660.0, 988.0, 637.0, 422.0, 266.0, 185.0, 100.0, 90.0, 43.0, 26.0, 33.0, 17.0, 12.0, 10.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.255615234375, -0.24800872802734375, -0.2404022216796875, -0.23279571533203125, -0.225189208984375, -0.21758270263671875, -0.2099761962890625, -0.20236968994140625, -0.19476318359375, -0.18715667724609375, -0.1795501708984375, -0.17194366455078125, -0.164337158203125, -0.15673065185546875, -0.1491241455078125, -0.14151763916015625, -0.1339111328125, -0.12630462646484375, -0.1186981201171875, -0.11109161376953125, -0.103485107421875, -0.09587860107421875, -0.0882720947265625, -0.08066558837890625, -0.07305908203125, -0.06545257568359375, -0.0578460693359375, -0.05023956298828125, -0.042633056640625, -0.03502655029296875, -0.0274200439453125, -0.01981353759765625, -0.01220703125, -0.00460052490234375, 0.0030059814453125, 0.01061248779296875, 0.018218994140625, 0.02582550048828125, 0.0334320068359375, 0.04103851318359375, 0.04864501953125, 0.05625152587890625, 0.0638580322265625, 0.07146453857421875, 0.079071044921875, 0.08667755126953125, 0.0942840576171875, 0.10189056396484375, 0.1094970703125, 0.11710357666015625, 0.1247100830078125, 0.13231658935546875, 0.139923095703125, 0.14752960205078125, 0.1551361083984375, 0.16274261474609375, 0.17034912109375, 0.17795562744140625, 0.1855621337890625, 0.19316864013671875, 0.200775146484375, 0.20838165283203125, 0.2159881591796875, 0.22359466552734375, 0.231201171875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 2.0, 9.0, 6.0, 13.0, 5.0, 13.0, 8.0, 23.0, 20.0, 29.0, 28.0, 20.0, 24.0, 22.0, 37.0, 46.0, 40.0, 51.0, 45.0, 60.0, 42.0, 42.0, 48.0, 37.0, 37.0, 36.0, 28.0, 27.0, 22.0, 27.0, 24.0, 20.0, 23.0, 12.0, 12.0, 6.0, 11.0, 12.0, 7.0, 4.0, 4.0, 3.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.355712890625, -0.3458404541015625, -0.335968017578125, -0.3260955810546875, -0.31622314453125, -0.3063507080078125, -0.296478271484375, -0.2866058349609375, -0.2767333984375, -0.2668609619140625, -0.256988525390625, -0.2471160888671875, -0.23724365234375, -0.2273712158203125, -0.217498779296875, -0.2076263427734375, -0.19775390625, -0.1878814697265625, -0.178009033203125, -0.1681365966796875, -0.15826416015625, -0.1483917236328125, -0.138519287109375, -0.1286468505859375, -0.1187744140625, -0.1089019775390625, -0.099029541015625, -0.0891571044921875, -0.07928466796875, -0.0694122314453125, -0.059539794921875, -0.0496673583984375, -0.039794921875, -0.0299224853515625, -0.020050048828125, -0.0101776123046875, -0.00030517578125, 0.0095672607421875, 0.019439697265625, 0.0293121337890625, 0.0391845703125, 0.0490570068359375, 0.058929443359375, 0.0688018798828125, 0.07867431640625, 0.0885467529296875, 0.098419189453125, 0.1082916259765625, 0.1181640625, 0.1280364990234375, 0.137908935546875, 0.1477813720703125, 0.15765380859375, 0.1675262451171875, 0.177398681640625, 0.1872711181640625, 0.1971435546875, 0.2070159912109375, 0.216888427734375, 0.2267608642578125, 0.23663330078125, 0.2465057373046875, 0.256378173828125, 0.2662506103515625, 0.276123046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 6.0, 8.0, 8.0, 13.0, 36.0, 41.0, 62.0, 102.0, 167.0, 294.0, 481.0, 821.0, 1414.0, 2440.0, 4574.0, 8359.0, 15850.0, 30605.0, 59382.0, 110658.0, 190895.0, 261811.0, 165314.0, 92421.0, 48374.0, 25325.0, 13213.0, 7086.0, 3713.0, 2104.0, 1188.0, 695.0, 418.0, 237.0, 162.0, 90.0, 61.0, 41.0, 26.0, 26.0, 14.0, 4.0, 5.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24365234375, -0.23505783081054688, -0.22646331787109375, -0.21786880493164062, -0.2092742919921875, -0.20067977905273438, -0.19208526611328125, -0.18349075317382812, -0.174896240234375, -0.16630172729492188, -0.15770721435546875, -0.14911270141601562, -0.1405181884765625, -0.13192367553710938, -0.12332916259765625, -0.11473464965820312, -0.10614013671875, -0.09754562377929688, -0.08895111083984375, -0.08035659790039062, -0.0717620849609375, -0.06316757202148438, -0.05457305908203125, -0.045978546142578125, -0.037384033203125, -0.028789520263671875, -0.02019500732421875, -0.011600494384765625, -0.0030059814453125, 0.005588531494140625, 0.01418304443359375, 0.022777557373046875, 0.0313720703125, 0.039966583251953125, 0.04856109619140625, 0.057155609130859375, 0.0657501220703125, 0.07434463500976562, 0.08293914794921875, 0.09153366088867188, 0.100128173828125, 0.10872268676757812, 0.11731719970703125, 0.12591171264648438, 0.1345062255859375, 0.14310073852539062, 0.15169525146484375, 0.16028976440429688, 0.16888427734375, 0.17747879028320312, 0.18607330322265625, 0.19466781616210938, 0.2032623291015625, 0.21185684204101562, 0.22045135498046875, 0.22904586791992188, 0.237640380859375, 0.24623489379882812, 0.25482940673828125, 0.2634239196777344, 0.2720184326171875, 0.2806129455566406, 0.28920745849609375, 0.2978019714355469, 0.306396484375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 7.0, 6.0, 7.0, 9.0, 11.0, 16.0, 21.0, 24.0, 24.0, 24.0, 26.0, 30.0, 35.0, 43.0, 31.0, 29.0, 46.0, 49.0, 39.0, 46.0, 41.0, 33.0, 36.0, 46.0, 38.0, 30.0, 34.0, 37.0, 26.0, 25.0, 19.0, 16.0, 22.0, 13.0, 15.0, 10.0, 9.0, 3.0, 4.0, 8.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81982421875, -0.7932357788085938, -0.7666473388671875, -0.7400588989257812, -0.713470458984375, -0.6868820190429688, -0.6602935791015625, -0.6337051391601562, -0.60711669921875, -0.5805282592773438, -0.5539398193359375, -0.5273513793945312, -0.500762939453125, -0.47417449951171875, -0.4475860595703125, -0.42099761962890625, -0.3944091796875, -0.36782073974609375, -0.3412322998046875, -0.31464385986328125, -0.288055419921875, -0.26146697998046875, -0.2348785400390625, -0.20829010009765625, -0.18170166015625, -0.15511322021484375, -0.1285247802734375, -0.10193634033203125, -0.075347900390625, -0.04875946044921875, -0.0221710205078125, 0.00441741943359375, 0.031005859375, 0.05759429931640625, 0.0841827392578125, 0.11077117919921875, 0.137359619140625, 0.16394805908203125, 0.1905364990234375, 0.21712493896484375, 0.24371337890625, 0.27030181884765625, 0.2968902587890625, 0.32347869873046875, 0.350067138671875, 0.37665557861328125, 0.4032440185546875, 0.42983245849609375, 0.4564208984375, 0.48300933837890625, 0.5095977783203125, 0.5361862182617188, 0.562774658203125, 0.5893630981445312, 0.6159515380859375, 0.6425399780273438, 0.66912841796875, 0.6957168579101562, 0.7223052978515625, 0.7488937377929688, 0.775482177734375, 0.8020706176757812, 0.8286590576171875, 0.8552474975585938, 0.8818359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 5.0, 8.0, 14.0, 20.0, 27.0, 49.0, 77.0, 109.0, 193.0, 338.0, 531.0, 920.0, 1580.0, 3004.0, 5326.0, 10571.0, 21009.0, 43107.0, 89487.0, 174100.0, 302363.0, 195240.0, 101246.0, 49334.0, 24025.0, 11954.0, 6199.0, 3348.0, 1807.0, 1033.0, 613.0, 344.0, 204.0, 138.0, 75.0, 58.0, 34.0, 19.0, 13.0, 9.0, 10.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.0863037109375, -0.08373451232910156, -0.08116531372070312, -0.07859611511230469, -0.07602691650390625, -0.07345771789550781, -0.07088851928710938, -0.06831932067871094, -0.0657501220703125, -0.06318092346191406, -0.060611724853515625, -0.05804252624511719, -0.05547332763671875, -0.05290412902832031, -0.050334930419921875, -0.04776573181152344, -0.045196533203125, -0.04262733459472656, -0.040058135986328125, -0.03748893737792969, -0.03491973876953125, -0.03235054016113281, -0.029781341552734375, -0.027212142944335938, -0.0246429443359375, -0.022073745727539062, -0.019504547119140625, -0.016935348510742188, -0.01436614990234375, -0.011796951293945312, -0.009227752685546875, -0.0066585540771484375, -0.00408935546875, -0.0015201568603515625, 0.001049041748046875, 0.0036182403564453125, 0.00618743896484375, 0.008756637573242188, 0.011325836181640625, 0.013895034790039062, 0.0164642333984375, 0.019033432006835938, 0.021602630615234375, 0.024171829223632812, 0.02674102783203125, 0.029310226440429688, 0.031879425048828125, 0.03444862365722656, 0.037017822265625, 0.03958702087402344, 0.042156219482421875, 0.04472541809082031, 0.04729461669921875, 0.04986381530761719, 0.052433013916015625, 0.05500221252441406, 0.0575714111328125, 0.06014060974121094, 0.06270980834960938, 0.06527900695800781, 0.06784820556640625, 0.07041740417480469, 0.07298660278320312, 0.07555580139160156, 0.078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 7.0, 8.0, 9.0, 12.0, 15.0, 13.0, 21.0, 21.0, 28.0, 40.0, 45.0, 44.0, 51.0, 59.0, 74.0, 64.0, 70.0, 56.0, 65.0, 49.0, 38.0, 37.0, 24.0, 26.0, 21.0, 19.0, 16.0, 12.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.075599670410156e-05, -2.978462725877762e-05, -2.8813257813453674e-05, -2.784188836812973e-05, -2.6870518922805786e-05, -2.5899149477481842e-05, -2.4927780032157898e-05, -2.3956410586833954e-05, -2.298504114151001e-05, -2.2013671696186066e-05, -2.104230225086212e-05, -2.0070932805538177e-05, -1.9099563360214233e-05, -1.812819391489029e-05, -1.7156824469566345e-05, -1.61854550242424e-05, -1.5214085578918457e-05, -1.4242716133594513e-05, -1.3271346688270569e-05, -1.2299977242946625e-05, -1.132860779762268e-05, -1.0357238352298737e-05, -9.385868906974792e-06, -8.414499461650848e-06, -7.443130016326904e-06, -6.47176057100296e-06, -5.500391125679016e-06, -4.529021680355072e-06, -3.557652235031128e-06, -2.586282789707184e-06, -1.6149133443832397e-06, -6.435438990592957e-07, 3.2782554626464844e-07, 1.2991949915885925e-06, 2.2705644369125366e-06, 3.2419338822364807e-06, 4.213303327560425e-06, 5.184672772884369e-06, 6.156042218208313e-06, 7.127411663532257e-06, 8.098781108856201e-06, 9.070150554180145e-06, 1.004151999950409e-05, 1.1012889444828033e-05, 1.1984258890151978e-05, 1.2955628335475922e-05, 1.3926997780799866e-05, 1.489836722612381e-05, 1.5869736671447754e-05, 1.6841106116771698e-05, 1.7812475562095642e-05, 1.8783845007419586e-05, 1.975521445274353e-05, 2.0726583898067474e-05, 2.169795334339142e-05, 2.2669322788715363e-05, 2.3640692234039307e-05, 2.461206167936325e-05, 2.5583431124687195e-05, 2.655480057001114e-05, 2.7526170015335083e-05, 2.8497539460659027e-05, 2.946890890598297e-05, 3.0440278351306915e-05, 3.141164779663086e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 0.0, 4.0, 6.0, 3.0, 21.0, 14.0, 26.0, 51.0, 62.0, 99.0, 122.0, 171.0, 326.0, 482.0, 824.0, 1400.0, 2385.0, 4502.0, 8369.0, 16581.0, 34178.0, 71138.0, 144588.0, 283685.0, 235741.0, 124244.0, 60090.0, 28780.0, 14112.0, 7141.0, 3880.0, 2188.0, 1309.0, 765.0, 449.0, 270.0, 167.0, 146.0, 72.0, 43.0, 31.0, 30.0, 16.0, 17.0, 10.0, 5.0, 5.0, 8.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0809326171875, -0.07803058624267578, -0.07512855529785156, -0.07222652435302734, -0.06932449340820312, -0.0664224624633789, -0.06352043151855469, -0.06061840057373047, -0.05771636962890625, -0.05481433868408203, -0.05191230773925781, -0.049010276794433594, -0.046108245849609375, -0.043206214904785156, -0.04030418395996094, -0.03740215301513672, -0.0345001220703125, -0.03159809112548828, -0.028696060180664062, -0.025794029235839844, -0.022891998291015625, -0.019989967346191406, -0.017087936401367188, -0.014185905456542969, -0.01128387451171875, -0.008381843566894531, -0.0054798126220703125, -0.0025777816772460938, 0.000324249267578125, 0.0032262802124023438, 0.0061283111572265625, 0.009030342102050781, 0.011932373046875, 0.014834403991699219, 0.017736434936523438, 0.020638465881347656, 0.023540496826171875, 0.026442527770996094, 0.029344558715820312, 0.03224658966064453, 0.03514862060546875, 0.03805065155029297, 0.04095268249511719, 0.043854713439941406, 0.046756744384765625, 0.049658775329589844, 0.05256080627441406, 0.05546283721923828, 0.0583648681640625, 0.06126689910888672, 0.06416893005371094, 0.06707096099853516, 0.06997299194335938, 0.0728750228881836, 0.07577705383300781, 0.07867908477783203, 0.08158111572265625, 0.08448314666748047, 0.08738517761230469, 0.0902872085571289, 0.09318923950195312, 0.09609127044677734, 0.09899330139160156, 0.10189533233642578, 0.10479736328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 2.0, 8.0, 7.0, 11.0, 13.0, 13.0, 22.0, 22.0, 18.0, 34.0, 33.0, 51.0, 46.0, 66.0, 64.0, 85.0, 81.0, 59.0, 72.0, 48.0, 44.0, 38.0, 25.0, 30.0, 24.0, 14.0, 10.0, 9.0, 8.0, 13.0, 7.0, 3.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.146484375, -0.1417407989501953, -0.13699722290039062, -0.13225364685058594, -0.12751007080078125, -0.12276649475097656, -0.11802291870117188, -0.11327934265136719, -0.1085357666015625, -0.10379219055175781, -0.09904861450195312, -0.09430503845214844, -0.08956146240234375, -0.08481788635253906, -0.08007431030273438, -0.07533073425292969, -0.070587158203125, -0.06584358215332031, -0.061100006103515625, -0.05635643005371094, -0.05161285400390625, -0.04686927795410156, -0.042125701904296875, -0.03738212585449219, -0.0326385498046875, -0.027894973754882812, -0.023151397705078125, -0.018407821655273438, -0.01366424560546875, -0.008920669555664062, -0.004177093505859375, 0.0005664825439453125, 0.00531005859375, 0.010053634643554688, 0.014797210693359375, 0.019540786743164062, 0.02428436279296875, 0.029027938842773438, 0.033771514892578125, 0.03851509094238281, 0.0432586669921875, 0.04800224304199219, 0.052745819091796875, 0.05748939514160156, 0.06223297119140625, 0.06697654724121094, 0.07172012329101562, 0.07646369934082031, 0.081207275390625, 0.08595085144042969, 0.09069442749023438, 0.09543800354003906, 0.10018157958984375, 0.10492515563964844, 0.10966873168945312, 0.11441230773925781, 0.1191558837890625, 0.12389945983886719, 0.12864303588867188, 0.13338661193847656, 0.13813018798828125, 0.14287376403808594, 0.14761734008789062, 0.1523609161376953, 0.1571044921875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 8.0, 16.0, 25.0, 27.0, 78.0, 94.0, 144.0, 147.0, 156.0, 131.0, 70.0, 42.0, 15.0, 14.0, 12.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.242569923400879, -4.136033535003662, -4.029497146606445, -3.9229609966278076, -3.81642484664917, -3.709888458251953, -3.6033520698547363, -3.4968156814575195, -3.390279531478882, -3.283743143081665, -3.1772069931030273, -3.0706706047058105, -2.9641342163085938, -2.857598066329956, -2.7510616779327393, -2.6445255279541016, -2.5379891395568848, -2.431452751159668, -2.3249166011810303, -2.2183802127838135, -2.111844062805176, -2.005307674407959, -1.8987712860107422, -1.792235016822815, -1.6856987476348877, -1.5791624784469604, -1.4726262092590332, -1.3660898208618164, -1.2595535516738892, -1.153017282485962, -1.0464808940887451, -0.9399446249008179, -0.8334083557128906, -0.7268720865249634, -0.6203357577323914, -0.5137994289398193, -0.4072631597518921, -0.30072689056396484, -0.19419056177139282, -0.0876542329788208, 0.018882036209106445, 0.12541833519935608, 0.2319546341896057, 0.33849093317985535, 0.445027232170105, 0.5515635013580322, 0.6580998301506042, 0.7646361589431763, 0.8711724281311035, 0.9777086973190308, 1.084244966506958, 1.1907813549041748, 1.297317624092102, 1.4038538932800293, 1.510390281677246, 1.6169265508651733, 1.7234628200531006, 1.8299990892410278, 1.936535358428955, 2.043071746826172, 2.1496081352233887, 2.2561442852020264, 2.362680673599243, 2.469216823577881, 2.5757532119750977]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 10.0, 9.0, 9.0, 13.0, 17.0, 23.0, 28.0, 24.0, 27.0, 27.0, 36.0, 35.0, 32.0, 51.0, 40.0, 38.0, 48.0, 56.0, 39.0, 42.0, 41.0, 44.0, 34.0, 41.0, 40.0, 30.0, 24.0, 26.0, 14.0, 18.0, 11.0, 14.0, 6.0, 6.0, 5.0, 6.0, 3.0, 6.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.02490234375, -1.95806884765625, -1.8912352323532104, -1.8244017362594604, -1.757568120956421, -1.690734624862671, -1.623901128768921, -1.5570675134658813, -1.4902338981628418, -1.4234004020690918, -1.3565667867660522, -1.2897332906723022, -1.2228996753692627, -1.1560661792755127, -1.0892326831817627, -1.0223990678787231, -0.9555655717849731, -0.8887320160865784, -0.8218984603881836, -0.7550649642944336, -0.688231348991394, -0.621397852897644, -0.5545642971992493, -0.4877307415008545, -0.4208971858024597, -0.35406363010406494, -0.28723007440567017, -0.22039654850959778, -0.153562992811203, -0.08672943711280823, -0.01989591121673584, 0.046937644481658936, 0.11377120018005371, 0.1806047558784485, 0.24743829667568207, 0.31427183747291565, 0.3811053931713104, 0.4479389488697052, 0.5147724747657776, 0.5816060304641724, 0.6484395861625671, 0.7152731418609619, 0.7821066975593567, 0.8489402532577515, 0.9157737493515015, 0.982607364654541, 1.049440860748291, 1.116274356842041, 1.1831079721450806, 1.2499414682388306, 1.3167750835418701, 1.3836085796356201, 1.4504421949386597, 1.5172756910324097, 1.5841093063354492, 1.6509428024291992, 1.7177762985229492, 1.7846097946166992, 1.8514434099197388, 1.9182769060134888, 1.9851105213165283, 2.0519440174102783, 2.1187775135040283, 2.1856112480163574, 2.2524447441101074]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 4.0, 15.0, 17.0, 17.0, 23.0, 37.0, 58.0, 92.0, 97.0, 165.0, 261.0, 363.0, 598.0, 979.0, 1497.0, 2540.0, 4596.0, 9220.0, 21067.0, 54434.0, 162076.0, 442834.0, 912075.0, 1168746.0, 819447.0, 373995.0, 135724.0, 46654.0, 17874.0, 8025.0, 4253.0, 2458.0, 1450.0, 871.0, 586.0, 364.0, 245.0, 172.0, 97.0, 72.0, 70.0, 38.0, 26.0, 18.0, 13.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.328857421875, -0.3187141418457031, -0.30857086181640625, -0.2984275817871094, -0.2882843017578125, -0.2781410217285156, -0.26799774169921875, -0.2578544616699219, -0.247711181640625, -0.23756790161132812, -0.22742462158203125, -0.21728134155273438, -0.2071380615234375, -0.19699478149414062, -0.18685150146484375, -0.17670822143554688, -0.16656494140625, -0.15642166137695312, -0.14627838134765625, -0.13613510131835938, -0.1259918212890625, -0.11584854125976562, -0.10570526123046875, -0.09556198120117188, -0.085418701171875, -0.07527542114257812, -0.06513214111328125, -0.054988861083984375, -0.0448455810546875, -0.034702301025390625, -0.02455902099609375, -0.014415740966796875, -0.0042724609375, 0.005870819091796875, 0.01601409912109375, 0.026157379150390625, 0.0363006591796875, 0.046443939208984375, 0.05658721923828125, 0.06673049926757812, 0.076873779296875, 0.08701705932617188, 0.09716033935546875, 0.10730361938476562, 0.1174468994140625, 0.12759017944335938, 0.13773345947265625, 0.14787673950195312, 0.15802001953125, 0.16816329956054688, 0.17830657958984375, 0.18844985961914062, 0.1985931396484375, 0.20873641967773438, 0.21887969970703125, 0.22902297973632812, 0.239166259765625, 0.24930953979492188, 0.25945281982421875, 0.2695960998535156, 0.2797393798828125, 0.2898826599121094, 0.30002593994140625, 0.3101692199707031, 0.3203125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 9.0, 11.0, 9.0, 15.0, 15.0, 17.0, 24.0, 20.0, 19.0, 28.0, 30.0, 44.0, 30.0, 45.0, 52.0, 40.0, 42.0, 53.0, 37.0, 42.0, 49.0, 37.0, 37.0, 30.0, 45.0, 42.0, 25.0, 22.0, 16.0, 14.0, 16.0, 10.0, 19.0, 8.0, 10.0, 13.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2496337890625, -0.24025535583496094, -0.23087692260742188, -0.2214984893798828, -0.21212005615234375, -0.2027416229248047, -0.19336318969726562, -0.18398475646972656, -0.1746063232421875, -0.16522789001464844, -0.15584945678710938, -0.1464710235595703, -0.13709259033203125, -0.1277141571044922, -0.11833572387695312, -0.10895729064941406, -0.099578857421875, -0.09020042419433594, -0.08082199096679688, -0.07144355773925781, -0.06206512451171875, -0.05268669128417969, -0.043308258056640625, -0.03392982482910156, -0.0245513916015625, -0.015172958374023438, -0.005794525146484375, 0.0035839080810546875, 0.01296234130859375, 0.022340774536132812, 0.031719207763671875, 0.04109764099121094, 0.05047607421875, 0.05985450744628906, 0.06923294067382812, 0.07861137390136719, 0.08798980712890625, 0.09736824035644531, 0.10674667358398438, 0.11612510681152344, 0.1255035400390625, 0.13488197326660156, 0.14426040649414062, 0.1536388397216797, 0.16301727294921875, 0.1723957061767578, 0.18177413940429688, 0.19115257263183594, 0.200531005859375, 0.20990943908691406, 0.21928787231445312, 0.2286663055419922, 0.23804473876953125, 0.2474231719970703, 0.2568016052246094, 0.26618003845214844, 0.2755584716796875, 0.28493690490722656, 0.2943153381347656, 0.3036937713623047, 0.31307220458984375, 0.3224506378173828, 0.3318290710449219, 0.34120750427246094, 0.3505859375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 8.0, 13.0, 20.0, 27.0, 28.0, 59.0, 77.0, 119.0, 162.0, 259.0, 391.0, 627.0, 1024.0, 1720.0, 3259.0, 6819.0, 16631.0, 51844.0, 216994.0, 1263039.0, 2101204.0, 401786.0, 84791.0, 24844.0, 9251.0, 4139.0, 2136.0, 1158.0, 675.0, 421.0, 261.0, 162.0, 102.0, 59.0, 51.0, 36.0, 25.0, 15.0, 10.0, 11.0, 3.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.48291015625, -0.46691131591796875, -0.4509124755859375, -0.43491363525390625, -0.418914794921875, -0.40291595458984375, -0.3869171142578125, -0.37091827392578125, -0.35491943359375, -0.33892059326171875, -0.3229217529296875, -0.30692291259765625, -0.290924072265625, -0.27492523193359375, -0.2589263916015625, -0.24292755126953125, -0.2269287109375, -0.21092987060546875, -0.1949310302734375, -0.17893218994140625, -0.162933349609375, -0.14693450927734375, -0.1309356689453125, -0.11493682861328125, -0.09893798828125, -0.08293914794921875, -0.0669403076171875, -0.05094146728515625, -0.034942626953125, -0.01894378662109375, -0.0029449462890625, 0.01305389404296875, 0.029052734375, 0.04505157470703125, 0.0610504150390625, 0.07704925537109375, 0.093048095703125, 0.10904693603515625, 0.1250457763671875, 0.14104461669921875, 0.15704345703125, 0.17304229736328125, 0.1890411376953125, 0.20503997802734375, 0.221038818359375, 0.23703765869140625, 0.2530364990234375, 0.26903533935546875, 0.2850341796875, 0.30103302001953125, 0.3170318603515625, 0.33303070068359375, 0.349029541015625, 0.36502838134765625, 0.3810272216796875, 0.39702606201171875, 0.41302490234375, 0.42902374267578125, 0.4450225830078125, 0.46102142333984375, 0.477020263671875, 0.49301910400390625, 0.5090179443359375, 0.5250167846679688, 0.541015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 8.0, 3.0, 12.0, 13.0, 19.0, 26.0, 38.0, 55.0, 80.0, 112.0, 179.0, 264.0, 341.0, 437.0, 520.0, 464.0, 408.0, 336.0, 231.0, 137.0, 101.0, 78.0, 56.0, 54.0, 47.0, 16.0, 10.0, 19.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7880859375, -0.7640838623046875, -0.740081787109375, -0.7160797119140625, -0.69207763671875, -0.6680755615234375, -0.644073486328125, -0.6200714111328125, -0.5960693359375, -0.5720672607421875, -0.548065185546875, -0.5240631103515625, -0.50006103515625, -0.4760589599609375, -0.452056884765625, -0.4280548095703125, -0.404052734375, -0.3800506591796875, -0.356048583984375, -0.3320465087890625, -0.30804443359375, -0.2840423583984375, -0.260040283203125, -0.2360382080078125, -0.2120361328125, -0.1880340576171875, -0.164031982421875, -0.1400299072265625, -0.11602783203125, -0.0920257568359375, -0.068023681640625, -0.0440216064453125, -0.02001953125, 0.0039825439453125, 0.027984619140625, 0.0519866943359375, 0.07598876953125, 0.0999908447265625, 0.123992919921875, 0.1479949951171875, 0.1719970703125, 0.1959991455078125, 0.220001220703125, 0.2440032958984375, 0.26800537109375, 0.2920074462890625, 0.316009521484375, 0.3400115966796875, 0.364013671875, 0.3880157470703125, 0.412017822265625, 0.4360198974609375, 0.46002197265625, 0.4840240478515625, 0.508026123046875, 0.5320281982421875, 0.5560302734375, 0.5800323486328125, 0.604034423828125, 0.6280364990234375, 0.65203857421875, 0.6760406494140625, 0.700042724609375, 0.7240447998046875, 0.748046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 8.0, 14.0, 23.0, 37.0, 64.0, 84.0, 122.0, 134.0, 152.0, 103.0, 81.0, 59.0, 34.0, 17.0, 10.0, 18.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.480592727661133, -4.240296840667725, -4.000000476837158, -3.75970458984375, -3.519408702850342, -3.2791125774383545, -3.038816452026367, -2.798520565032959, -2.5582244396209717, -2.3179283142089844, -2.077632427215576, -1.8373363018035889, -1.5970402956008911, -1.3567442893981934, -1.116448163986206, -0.8761521577835083, -0.6358561515808105, -0.3955601155757904, -0.15526407957077026, 0.08503198623657227, 0.32532799243927, 0.5656239986419678, 0.8059201240539551, 1.0462161302566528, 1.2865121364593506, 1.5268081426620483, 1.767104148864746, 2.0074002742767334, 2.2476963996887207, 2.487992286682129, 2.728288412094116, 2.9685845375061035, 3.2088804244995117, 3.449176549911499, 3.6894724369049072, 3.9297685623168945, 4.170064449310303, 4.410360336303711, 4.650656700134277, 4.8909525871276855, 5.131248474121094, 5.371544361114502, 5.611840724945068, 5.852136611938477, 6.092432498931885, 6.332728385925293, 6.573024749755859, 6.813320636749268, 7.053617000579834, 7.293912887573242, 7.534209251403809, 7.774505138397217, 8.014801025390625, 8.255097389221191, 8.495393753051758, 8.735689163208008, 8.975985527038574, 9.21628189086914, 9.45657730102539, 9.696873664855957, 9.937170028686523, 10.177465438842773, 10.41776180267334, 10.658058166503906, 10.898353576660156]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 14.0, 11.0, 17.0, 22.0, 25.0, 28.0, 33.0, 32.0, 38.0, 48.0, 48.0, 45.0, 46.0, 57.0, 48.0, 49.0, 40.0, 57.0, 43.0, 49.0, 36.0, 44.0, 28.0, 22.0, 19.0, 19.0, 21.0, 13.0, 10.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.3806939125061035, -3.2845141887664795, -3.1883344650268555, -3.0921547412872314, -2.9959750175476074, -2.8997952938079834, -2.8036155700683594, -2.7074358463287354, -2.6112561225891113, -2.5150763988494873, -2.4188966751098633, -2.3227169513702393, -2.2265372276306152, -2.130357503890991, -2.034177780151367, -1.9379980564117432, -1.8418183326721191, -1.7456386089324951, -1.649458885192871, -1.553279161453247, -1.457099437713623, -1.360919713973999, -1.264739990234375, -1.168560266494751, -1.072380542755127, -0.9762008190155029, -0.8800210952758789, -0.7838413715362549, -0.6876616477966309, -0.5914819240570068, -0.4953022003173828, -0.3991224765777588, -0.30294275283813477, -0.20676302909851074, -0.11058330535888672, -0.014403581619262695, 0.08177614212036133, 0.17795586585998535, 0.2741355895996094, 0.3703153133392334, 0.4664950370788574, 0.5626747608184814, 0.6588544845581055, 0.7550342082977295, 0.8512139320373535, 0.9473936557769775, 1.0435733795166016, 1.1397531032562256, 1.2359328269958496, 1.3321125507354736, 1.4282922744750977, 1.5244719982147217, 1.6206517219543457, 1.7168314456939697, 1.8130111694335938, 1.9091908931732178, 2.005370616912842, 2.101550340652466, 2.19773006439209, 2.293909788131714, 2.390089511871338, 2.486269235610962, 2.582448959350586, 2.67862868309021, 2.774808406829834]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 8.0, 10.0, 19.0, 20.0, 28.0, 42.0, 47.0, 59.0, 77.0, 139.0, 209.0, 255.0, 421.0, 610.0, 918.0, 1472.0, 2348.0, 4094.0, 7971.0, 16673.0, 39611.0, 109596.0, 300710.0, 340174.0, 134493.0, 47882.0, 19640.0, 8987.0, 4846.0, 2638.0, 1548.0, 947.0, 628.0, 461.0, 278.0, 220.0, 144.0, 110.0, 56.0, 44.0, 35.0, 22.0, 20.0, 11.0, 12.0, 9.0, 5.0, 3.0, 2.0, 0.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.29541015625, -0.2862052917480469, -0.27700042724609375, -0.2677955627441406, -0.2585906982421875, -0.24938583374023438, -0.24018096923828125, -0.23097610473632812, -0.221771240234375, -0.21256637573242188, -0.20336151123046875, -0.19415664672851562, -0.1849517822265625, -0.17574691772460938, -0.16654205322265625, -0.15733718872070312, -0.14813232421875, -0.13892745971679688, -0.12972259521484375, -0.12051773071289062, -0.1113128662109375, -0.10210800170898438, -0.09290313720703125, -0.08369827270507812, -0.074493408203125, -0.06528854370117188, -0.05608367919921875, -0.046878814697265625, -0.0376739501953125, -0.028469085693359375, -0.01926422119140625, -0.010059356689453125, -0.0008544921875, 0.008350372314453125, 0.01755523681640625, 0.026760101318359375, 0.0359649658203125, 0.045169830322265625, 0.05437469482421875, 0.06357955932617188, 0.072784423828125, 0.08198928833007812, 0.09119415283203125, 0.10039901733398438, 0.1096038818359375, 0.11880874633789062, 0.12801361083984375, 0.13721847534179688, 0.14642333984375, 0.15562820434570312, 0.16483306884765625, 0.17403793334960938, 0.1832427978515625, 0.19244766235351562, 0.20165252685546875, 0.21085739135742188, 0.220062255859375, 0.22926712036132812, 0.23847198486328125, 0.24767684936523438, 0.2568817138671875, 0.2660865783691406, 0.27529144287109375, 0.2844963073730469, 0.293701171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 1.0, 6.0, 5.0, 8.0, 8.0, 9.0, 11.0, 21.0, 22.0, 19.0, 24.0, 35.0, 35.0, 32.0, 36.0, 37.0, 53.0, 36.0, 56.0, 45.0, 38.0, 45.0, 47.0, 42.0, 46.0, 43.0, 23.0, 28.0, 31.0, 26.0, 29.0, 16.0, 14.0, 16.0, 13.0, 12.0, 8.0, 8.0, 3.0, 7.0, 6.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.444580078125, -0.43247222900390625, -0.4203643798828125, -0.40825653076171875, -0.396148681640625, -0.38404083251953125, -0.3719329833984375, -0.35982513427734375, -0.34771728515625, -0.33560943603515625, -0.3235015869140625, -0.31139373779296875, -0.299285888671875, -0.28717803955078125, -0.2750701904296875, -0.26296234130859375, -0.2508544921875, -0.23874664306640625, -0.2266387939453125, -0.21453094482421875, -0.202423095703125, -0.19031524658203125, -0.1782073974609375, -0.16609954833984375, -0.15399169921875, -0.14188385009765625, -0.1297760009765625, -0.11766815185546875, -0.105560302734375, -0.09345245361328125, -0.0813446044921875, -0.06923675537109375, -0.05712890625, -0.04502105712890625, -0.0329132080078125, -0.02080535888671875, -0.008697509765625, 0.00341033935546875, 0.0155181884765625, 0.02762603759765625, 0.03973388671875, 0.05184173583984375, 0.0639495849609375, 0.07605743408203125, 0.088165283203125, 0.10027313232421875, 0.1123809814453125, 0.12448883056640625, 0.1365966796875, 0.14870452880859375, 0.1608123779296875, 0.17292022705078125, 0.185028076171875, 0.19713592529296875, 0.2092437744140625, 0.22135162353515625, 0.23345947265625, 0.24556732177734375, 0.2576751708984375, 0.26978302001953125, 0.281890869140625, 0.29399871826171875, 0.3061065673828125, 0.31821441650390625, 0.330322265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 11.0, 15.0, 9.0, 15.0, 27.0, 42.0, 43.0, 83.0, 128.0, 227.0, 425.0, 797.0, 1521.0, 3308.0, 7021.0, 18218.0, 52956.0, 202322.0, 556519.0, 140149.0, 39437.0, 14115.0, 5693.0, 2678.0, 1234.0, 636.0, 386.0, 191.0, 122.0, 70.0, 47.0, 27.0, 22.0, 16.0, 17.0, 10.0, 10.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.306640625, -0.2971687316894531, -0.28769683837890625, -0.2782249450683594, -0.2687530517578125, -0.2592811584472656, -0.24980926513671875, -0.24033737182617188, -0.230865478515625, -0.22139358520507812, -0.21192169189453125, -0.20244979858398438, -0.1929779052734375, -0.18350601196289062, -0.17403411865234375, -0.16456222534179688, -0.15509033203125, -0.14561843872070312, -0.13614654541015625, -0.12667465209960938, -0.1172027587890625, -0.10773086547851562, -0.09825897216796875, -0.08878707885742188, -0.079315185546875, -0.06984329223632812, -0.06037139892578125, -0.050899505615234375, -0.0414276123046875, -0.031955718994140625, -0.02248382568359375, -0.013011932373046875, -0.0035400390625, 0.005931854248046875, 0.01540374755859375, 0.024875640869140625, 0.0343475341796875, 0.043819427490234375, 0.05329132080078125, 0.06276321411132812, 0.072235107421875, 0.08170700073242188, 0.09117889404296875, 0.10065078735351562, 0.1101226806640625, 0.11959457397460938, 0.12906646728515625, 0.13853836059570312, 0.14801025390625, 0.15748214721679688, 0.16695404052734375, 0.17642593383789062, 0.1858978271484375, 0.19536972045898438, 0.20484161376953125, 0.21431350708007812, 0.223785400390625, 0.23325729370117188, 0.24272918701171875, 0.2522010803222656, 0.2616729736328125, 0.2711448669433594, 0.28061676025390625, 0.2900886535644531, 0.299560546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 8.0, 12.0, 9.0, 11.0, 16.0, 14.0, 17.0, 20.0, 23.0, 23.0, 29.0, 30.0, 29.0, 37.0, 45.0, 50.0, 52.0, 53.0, 39.0, 48.0, 44.0, 40.0, 37.0, 32.0, 35.0, 23.0, 33.0, 26.0, 27.0, 20.0, 23.0, 15.0, 7.0, 10.0, 10.0, 6.0, 4.0, 8.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.72119140625, -0.6980514526367188, -0.6749114990234375, -0.6517715454101562, -0.628631591796875, -0.6054916381835938, -0.5823516845703125, -0.5592117309570312, -0.53607177734375, -0.5129318237304688, -0.4897918701171875, -0.46665191650390625, -0.443511962890625, -0.42037200927734375, -0.3972320556640625, -0.37409210205078125, -0.3509521484375, -0.32781219482421875, -0.3046722412109375, -0.28153228759765625, -0.258392333984375, -0.23525238037109375, -0.2121124267578125, -0.18897247314453125, -0.16583251953125, -0.14269256591796875, -0.1195526123046875, -0.09641265869140625, -0.073272705078125, -0.05013275146484375, -0.0269927978515625, -0.00385284423828125, 0.019287109375, 0.04242706298828125, 0.0655670166015625, 0.08870697021484375, 0.111846923828125, 0.13498687744140625, 0.1581268310546875, 0.18126678466796875, 0.20440673828125, 0.22754669189453125, 0.2506866455078125, 0.27382659912109375, 0.296966552734375, 0.32010650634765625, 0.3432464599609375, 0.36638641357421875, 0.3895263671875, 0.41266632080078125, 0.4358062744140625, 0.45894622802734375, 0.482086181640625, 0.5052261352539062, 0.5283660888671875, 0.5515060424804688, 0.57464599609375, 0.5977859497070312, 0.6209259033203125, 0.6440658569335938, 0.667205810546875, 0.6903457641601562, 0.7134857177734375, 0.7366256713867188, 0.759765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 9.0, 20.0, 33.0, 69.0, 98.0, 178.0, 351.0, 868.0, 3024.0, 22908.0, 542618.0, 452030.0, 21634.0, 2945.0, 916.0, 365.0, 202.0, 114.0, 52.0, 38.0, 17.0, 15.0, 7.0, 5.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.1932373046875, -0.1873798370361328, -0.18152236938476562, -0.17566490173339844, -0.16980743408203125, -0.16394996643066406, -0.15809249877929688, -0.1522350311279297, -0.1463775634765625, -0.1405200958251953, -0.13466262817382812, -0.12880516052246094, -0.12294769287109375, -0.11709022521972656, -0.11123275756835938, -0.10537528991699219, -0.099517822265625, -0.09366035461425781, -0.08780288696289062, -0.08194541931152344, -0.07608795166015625, -0.07023048400878906, -0.06437301635742188, -0.05851554870605469, -0.0526580810546875, -0.04680061340332031, -0.040943145751953125, -0.03508567810058594, -0.02922821044921875, -0.023370742797851562, -0.017513275146484375, -0.011655807495117188, -0.00579833984375, 5.91278076171875e-05, 0.005916595458984375, 0.011774063110351562, 0.01763153076171875, 0.023488998413085938, 0.029346466064453125, 0.03520393371582031, 0.0410614013671875, 0.04691886901855469, 0.052776336669921875, 0.05863380432128906, 0.06449127197265625, 0.07034873962402344, 0.07620620727539062, 0.08206367492675781, 0.087921142578125, 0.09377861022949219, 0.09963607788085938, 0.10549354553222656, 0.11135101318359375, 0.11720848083496094, 0.12306594848632812, 0.1289234161376953, 0.1347808837890625, 0.1406383514404297, 0.14649581909179688, 0.15235328674316406, 0.15821075439453125, 0.16406822204589844, 0.16992568969726562, 0.1757831573486328, 0.181640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 4.0, 8.0, 4.0, 5.0, 18.0, 9.0, 9.0, 13.0, 20.0, 20.0, 52.0, 44.0, 47.0, 55.0, 66.0, 60.0, 75.0, 72.0, 55.0, 82.0, 55.0, 42.0, 40.0, 32.0, 19.0, 28.0, 15.0, 16.0, 12.0, 5.0, 10.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8656253814697266e-05, -1.803971827030182e-05, -1.7423182725906372e-05, -1.6806647181510925e-05, -1.619011163711548e-05, -1.5573576092720032e-05, -1.4957040548324585e-05, -1.4340505003929138e-05, -1.3723969459533691e-05, -1.3107433915138245e-05, -1.2490898370742798e-05, -1.1874362826347351e-05, -1.1257827281951904e-05, -1.0641291737556458e-05, -1.002475619316101e-05, -9.408220648765564e-06, -8.791685104370117e-06, -8.17514955997467e-06, -7.558614015579224e-06, -6.942078471183777e-06, -6.32554292678833e-06, -5.709007382392883e-06, -5.0924718379974365e-06, -4.47593629360199e-06, -3.859400749206543e-06, -3.242865204811096e-06, -2.6263296604156494e-06, -2.0097941160202026e-06, -1.3932585716247559e-06, -7.767230272293091e-07, -1.601874828338623e-07, 4.5634806156158447e-07, 1.0728836059570312e-06, 1.689419150352478e-06, 2.305954694747925e-06, 2.9224902391433716e-06, 3.5390257835388184e-06, 4.155561327934265e-06, 4.772096872329712e-06, 5.388632416725159e-06, 6.0051679611206055e-06, 6.621703505516052e-06, 7.238239049911499e-06, 7.854774594306946e-06, 8.471310138702393e-06, 9.08784568309784e-06, 9.704381227493286e-06, 1.0320916771888733e-05, 1.093745231628418e-05, 1.1553987860679626e-05, 1.2170523405075073e-05, 1.278705894947052e-05, 1.3403594493865967e-05, 1.4020130038261414e-05, 1.463666558265686e-05, 1.5253201127052307e-05, 1.5869736671447754e-05, 1.64862722158432e-05, 1.7102807760238647e-05, 1.7719343304634094e-05, 1.833587884902954e-05, 1.8952414393424988e-05, 1.9568949937820435e-05, 2.018548548221588e-05, 2.0802021026611328e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 11.0, 5.0, 5.0, 17.0, 21.0, 19.0, 19.0, 42.0, 51.0, 72.0, 135.0, 195.0, 336.0, 761.0, 1849.0, 6169.0, 27898.0, 192569.0, 691087.0, 102717.0, 17328.0, 4244.0, 1580.0, 654.0, 316.0, 179.0, 98.0, 54.0, 38.0, 15.0, 19.0, 15.0, 9.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22216796875, -0.216522216796875, -0.21087646484375, -0.205230712890625, -0.1995849609375, -0.193939208984375, -0.18829345703125, -0.182647705078125, -0.177001953125, -0.171356201171875, -0.16571044921875, -0.160064697265625, -0.1544189453125, -0.148773193359375, -0.14312744140625, -0.137481689453125, -0.1318359375, -0.126190185546875, -0.12054443359375, -0.114898681640625, -0.1092529296875, -0.103607177734375, -0.09796142578125, -0.092315673828125, -0.086669921875, -0.081024169921875, -0.07537841796875, -0.069732666015625, -0.0640869140625, -0.058441162109375, -0.05279541015625, -0.047149658203125, -0.04150390625, -0.035858154296875, -0.03021240234375, -0.024566650390625, -0.0189208984375, -0.013275146484375, -0.00762939453125, -0.001983642578125, 0.003662109375, 0.009307861328125, 0.01495361328125, 0.020599365234375, 0.0262451171875, 0.031890869140625, 0.03753662109375, 0.043182373046875, 0.048828125, 0.054473876953125, 0.06011962890625, 0.065765380859375, 0.0714111328125, 0.077056884765625, 0.08270263671875, 0.088348388671875, 0.093994140625, 0.099639892578125, 0.10528564453125, 0.110931396484375, 0.1165771484375, 0.122222900390625, 0.12786865234375, 0.133514404296875, 0.13916015625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 6.0, 11.0, 11.0, 32.0, 40.0, 64.0, 82.0, 149.0, 159.0, 169.0, 109.0, 53.0, 30.0, 38.0, 17.0, 9.0, 9.0, 6.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2484130859375, -0.24054527282714844, -0.23267745971679688, -0.2248096466064453, -0.21694183349609375, -0.2090740203857422, -0.20120620727539062, -0.19333839416503906, -0.1854705810546875, -0.17760276794433594, -0.16973495483398438, -0.1618671417236328, -0.15399932861328125, -0.1461315155029297, -0.13826370239257812, -0.13039588928222656, -0.122528076171875, -0.11466026306152344, -0.10679244995117188, -0.09892463684082031, -0.09105682373046875, -0.08318901062011719, -0.07532119750976562, -0.06745338439941406, -0.0595855712890625, -0.05171775817871094, -0.043849945068359375, -0.03598213195800781, -0.02811431884765625, -0.020246505737304688, -0.012378692626953125, -0.0045108795166015625, 0.00335693359375, 0.011224746704101562, 0.019092559814453125, 0.026960372924804688, 0.03482818603515625, 0.04269599914550781, 0.050563812255859375, 0.05843162536621094, 0.0662994384765625, 0.07416725158691406, 0.08203506469726562, 0.08990287780761719, 0.09777069091796875, 0.10563850402832031, 0.11350631713867188, 0.12137413024902344, 0.129241943359375, 0.13710975646972656, 0.14497756958007812, 0.1528453826904297, 0.16071319580078125, 0.1685810089111328, 0.17644882202148438, 0.18431663513183594, 0.1921844482421875, 0.20005226135253906, 0.20792007446289062, 0.2157878875732422, 0.22365570068359375, 0.2315235137939453, 0.23939132690429688, 0.24725914001464844, 0.255126953125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 3.0, 4.0, 8.0, 2.0, 11.0, 23.0, 51.0, 101.0, 156.0, 196.0, 201.0, 111.0, 66.0, 33.0, 22.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.291089057922363, -6.1569504737854, -6.022811412811279, -5.888672828674316, -5.754533767700195, -5.620395183563232, -5.486256122589111, -5.352117538452148, -5.217978477478027, -5.0838398933410645, -4.949700832366943, -4.8155622482299805, -4.681423187255859, -4.5472846031188965, -4.413145542144775, -4.2790069580078125, -4.14486837387085, -4.010729789733887, -3.8765907287597656, -3.7424519062042236, -3.6083130836486816, -3.4741744995117188, -3.3400356769561768, -3.2058968544006348, -3.0717580318450928, -2.937619209289551, -2.803480386734009, -2.669341564178467, -2.535202980041504, -2.401063919067383, -2.26692533493042, -2.132786512374878, -1.9986474514007568, -1.8645086288452148, -1.7303698062896729, -1.5962311029434204, -1.4620922803878784, -1.3279534578323364, -1.193814754486084, -1.059675931930542, -0.925537109375, -0.791398286819458, -0.6572595238685608, -0.5231207609176636, -0.3889819383621216, -0.2548431158065796, -0.12070435285568237, 0.013434410095214844, 0.14757323265075684, 0.28171202540397644, 0.41585081815719604, 0.5499895811080933, 0.6841284036636353, 0.8182672262191772, 0.9524059891700745, 1.0865447521209717, 1.2206835746765137, 1.3548223972320557, 1.4889612197875977, 1.62309992313385, 1.757238745689392, 1.891377568244934, 2.0255162715911865, 2.1596550941467285, 2.2937939167022705]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 6.0, 6.0, 10.0, 9.0, 16.0, 11.0, 12.0, 20.0, 19.0, 15.0, 25.0, 38.0, 30.0, 32.0, 40.0, 55.0, 61.0, 53.0, 73.0, 61.0, 45.0, 40.0, 40.0, 41.0, 34.0, 29.0, 27.0, 14.0, 20.0, 17.0, 20.0, 18.0, 9.0, 6.0, 7.0, 12.0, 7.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-2.58965802192688, -2.516345977783203, -2.4430336952209473, -2.3697216510772705, -2.2964093685150146, -2.223097324371338, -2.149785041809082, -2.0764729976654053, -2.0031609535217285, -1.9298487901687622, -1.856536626815796, -1.7832244634628296, -1.7099123001098633, -1.6366002559661865, -1.5632880926132202, -1.489975929260254, -1.416663646697998, -1.3433514833450317, -1.2700393199920654, -1.1967271566390991, -1.1234149932861328, -1.050102949142456, -0.9767907857894897, -0.9034786224365234, -0.8301664590835571, -0.7568542957305908, -0.6835421323776245, -0.610230028629303, -0.5369178652763367, -0.46360570192337036, -0.39029356837272644, -0.3169814348220825, -0.2436692714691162, -0.1703571230173111, -0.09704497456550598, -0.023732826113700867, 0.04957932233810425, 0.12289148569107056, 0.19620361924171448, 0.2695157527923584, 0.3428279161453247, 0.416140079498291, 0.48945221304893494, 0.5627643465995789, 0.6360765099525452, 0.7093886733055115, 0.782700777053833, 0.8560129404067993, 0.9293251037597656, 1.002637267112732, 1.0759494304656982, 1.1492615938186646, 1.2225737571716309, 1.2958858013153076, 1.369197964668274, 1.4425101280212402, 1.5158222913742065, 1.5891344547271729, 1.6624466180801392, 1.7357587814331055, 1.8090708255767822, 1.882383108139038, 1.9556951522827148, 2.0290074348449707, 2.1023194789886475]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 4.0, 6.0, 11.0, 8.0, 7.0, 13.0, 9.0, 18.0, 21.0, 28.0, 26.0, 26.0, 46.0, 86.0, 227.0, 157.0, 63.0, 37.0, 22.0, 22.0, 25.0, 15.0, 17.0, 18.0, 17.0, 13.0, 8.0, 8.0, 10.0, 8.0, 3.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.467041015625, -0.4528350830078125, -0.438629150390625, -0.4244232177734375, -0.41021728515625, -0.3960113525390625, -0.381805419921875, -0.3675994873046875, -0.3533935546875, -0.3391876220703125, -0.324981689453125, -0.3107757568359375, -0.29656982421875, -0.2823638916015625, -0.268157958984375, -0.2539520263671875, -0.23974609375, -0.2255401611328125, -0.211334228515625, -0.1971282958984375, -0.18292236328125, -0.1687164306640625, -0.154510498046875, -0.1403045654296875, -0.1260986328125, -0.1118927001953125, -0.097686767578125, -0.0834808349609375, -0.06927490234375, -0.0550689697265625, -0.040863037109375, -0.0266571044921875, -0.012451171875, 0.0017547607421875, 0.015960693359375, 0.0301666259765625, 0.04437255859375, 0.0585784912109375, 0.072784423828125, 0.0869903564453125, 0.1011962890625, 0.1154022216796875, 0.129608154296875, 0.1438140869140625, 0.15802001953125, 0.1722259521484375, 0.186431884765625, 0.2006378173828125, 0.21484375, 0.2290496826171875, 0.243255615234375, 0.2574615478515625, 0.27166748046875, 0.2858734130859375, 0.300079345703125, 0.3142852783203125, 0.3284912109375, 0.3426971435546875, 0.356903076171875, 0.3711090087890625, 0.38531494140625, 0.3995208740234375, 0.413726806640625, 0.4279327392578125, 0.442138671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 8.0, 10.0, 4.0, 7.0, 9.0, 13.0, 20.0, 25.0, 33.0, 38.0, 82.0, 102.0, 192.0, 351.0, 515.0, 889.0, 1848.0, 4271.0, 12277.0, 80936.0, 8233709.0, 37565.0, 8900.0, 3390.0, 1497.0, 779.0, 430.0, 249.0, 145.0, 94.0, 53.0, 39.0, 32.0, 17.0, 14.0, 17.0, 9.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5548295974731445, -1.5095940828323364, -1.4643585681915283, -1.4191230535507202, -1.373887538909912, -1.3286519050598145, -1.283416509628296, -1.2381808757781982, -1.1929453611373901, -1.147709846496582, -1.102474331855774, -1.0572388172149658, -1.0120033025741577, -0.9667677283287048, -0.9215322136878967, -0.8762966394424438, -0.8310611844062805, -0.7858256697654724, -0.7405901551246643, -0.6953545808792114, -0.6501190662384033, -0.6048835515975952, -0.5596480369567871, -0.514412522315979, -0.4691769778728485, -0.4239414632320404, -0.3787059187889099, -0.3334704041481018, -0.2882348895072937, -0.2429993450641632, -0.1977638304233551, -0.1525282859802246, -0.1072927713394165, -0.0620572455227375, -0.016821719706058502, 0.0284138023853302, 0.0736493319272995, 0.1188848614692688, 0.1641203761100769, 0.2093559205532074, 0.2545914351940155, 0.2998269498348236, 0.3450624942779541, 0.3902980089187622, 0.4355335235595703, 0.4807690680027008, 0.5260045528411865, 0.5712401270866394, 0.6164756417274475, 0.6617111563682556, 0.7069466710090637, 0.7521822452545166, 0.7974177598953247, 0.8426532745361328, 0.8878887891769409, 0.933124303817749, 0.9783598184585571, 1.0235953330993652, 1.0688308477401733, 1.1140663623809814, 1.1593018770217896, 1.2045373916625977, 1.2497730255126953, 1.2950085401535034, 1.3402440547943115]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 4.0, 8.0, 5.0, 6.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 5.0, 1.0, 3.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5159432888031006, -1.45436429977417, -1.3927853107452393, -1.3312063217163086, -1.269627332687378, -1.2080483436584473, -1.1464693546295166, -1.084890365600586, -1.0233113765716553, -0.9617323875427246, -0.900153398513794, -0.8385744094848633, -0.7769954204559326, -0.715416431427002, -0.6538373827934265, -0.5922583937644958, -0.5306793451309204, -0.46910035610198975, -0.4075213670730591, -0.34594234824180603, -0.28436335921287537, -0.2227843701839447, -0.16120535135269165, -0.09962636232376099, -0.03804737329483032, 0.02353162318468094, 0.0851106196641922, 0.14668962359428406, 0.20826861262321472, 0.2698476016521454, 0.33142662048339844, 0.3930056095123291, 0.45458459854125977, 0.5161635875701904, 0.5777425765991211, 0.6393215656280518, 0.7009005546569824, 0.7624795436859131, 0.8240585923194885, 0.8856375813484192, 0.9472165703773499, 1.0087956190109253, 1.070374608039856, 1.1319535970687866, 1.1935325860977173, 1.255111575126648, 1.3166905641555786, 1.3782695531845093, 1.43984854221344, 1.5014275312423706, 1.5630065202713013, 1.624585509300232, 1.6861644983291626, 1.7477434873580933, 1.8093225955963135, 1.8709015846252441, 1.9324805736541748, 1.9940595626831055, 2.055638551712036, 2.117217540740967, 2.1787965297698975, 2.240375518798828, 2.301954507827759, 2.3635334968566895, 2.42511248588562]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 6.0, 8.0, 9.0, 10.0, 14.0, 14.0, 27.0, 18.0, 26.0, 28.0, 35.0, 47.0, 40.0, 55.0, 42.0, 77.0, 62.0, 54.0, 49.0, 58.0, 47.0, 45.0, 36.0, 36.0, 39.0, 22.0, 26.0, 16.0, 9.0, 13.0, 7.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.19189453125, -0.18624114990234375, -0.1805877685546875, -0.17493438720703125, -0.169281005859375, -0.16362762451171875, -0.1579742431640625, -0.15232086181640625, -0.14666748046875, -0.14101409912109375, -0.1353607177734375, -0.12970733642578125, -0.124053955078125, -0.11840057373046875, -0.1127471923828125, -0.10709381103515625, -0.1014404296875, -0.09578704833984375, -0.0901336669921875, -0.08448028564453125, -0.078826904296875, -0.07317352294921875, -0.0675201416015625, -0.06186676025390625, -0.05621337890625, -0.05055999755859375, -0.0449066162109375, -0.03925323486328125, -0.033599853515625, -0.02794647216796875, -0.0222930908203125, -0.01663970947265625, -0.010986328125, -0.00533294677734375, 0.0003204345703125, 0.00597381591796875, 0.011627197265625, 0.01728057861328125, 0.0229339599609375, 0.02858734130859375, 0.03424072265625, 0.03989410400390625, 0.0455474853515625, 0.05120086669921875, 0.056854248046875, 0.06250762939453125, 0.0681610107421875, 0.07381439208984375, 0.0794677734375, 0.08512115478515625, 0.0907745361328125, 0.09642791748046875, 0.102081298828125, 0.10773468017578125, 0.1133880615234375, 0.11904144287109375, 0.12469482421875, 0.13034820556640625, 0.1360015869140625, 0.14165496826171875, 0.147308349609375, 0.15296173095703125, 0.1586151123046875, 0.16426849365234375, 0.169921875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 4.0, 5.0, 11.0, 14.0, 8.0, 27.0, 24.0, 38.0, 53.0, 73.0, 105.0, 183.0, 302.0, 523.0, 917.0, 1619.0, 3259.0, 7113.0, 19453.0, 74186.0, 258972.0, 113656.0, 26010.0, 9030.0, 3943.0, 2053.0, 1089.0, 613.0, 386.0, 209.0, 131.0, 72.0, 57.0, 34.0, 22.0, 22.0, 11.0, 4.0, 5.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-6.4140625, -6.23895263671875, -6.0638427734375, -5.88873291015625, -5.713623046875, -5.53851318359375, -5.3634033203125, -5.18829345703125, -5.01318359375, -4.83807373046875, -4.6629638671875, -4.48785400390625, -4.312744140625, -4.13763427734375, -3.9625244140625, -3.78741455078125, -3.6123046875, -3.43719482421875, -3.2620849609375, -3.08697509765625, -2.911865234375, -2.73675537109375, -2.5616455078125, -2.38653564453125, -2.21142578125, -2.03631591796875, -1.8612060546875, -1.68609619140625, -1.510986328125, -1.33587646484375, -1.1607666015625, -0.98565673828125, -0.810546875, -0.63543701171875, -0.4603271484375, -0.28521728515625, -0.110107421875, 0.06500244140625, 0.2401123046875, 0.41522216796875, 0.59033203125, 0.76544189453125, 0.9405517578125, 1.11566162109375, 1.290771484375, 1.46588134765625, 1.6409912109375, 1.81610107421875, 1.9912109375, 2.16632080078125, 2.3414306640625, 2.51654052734375, 2.691650390625, 2.86676025390625, 3.0418701171875, 3.21697998046875, 3.39208984375, 3.56719970703125, 3.7423095703125, 3.91741943359375, 4.092529296875, 4.26763916015625, 4.4427490234375, 4.61785888671875, 4.79296875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 8.0, 10.0, 13.0, 11.0, 15.0, 27.0, 37.0, 46.0, 42.0, 41.0, 54.0, 71.0, 73.0, 63.0, 58.0, 48.0, 62.0, 43.0, 41.0, 37.0, 35.0, 33.0, 34.0, 20.0, 12.0, 14.0, 16.0, 13.0, 7.0, 9.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0], "bins": [-0.62158203125, -0.6067695617675781, -0.5919570922851562, -0.5771446228027344, -0.5623321533203125, -0.5475196838378906, -0.5327072143554688, -0.5178947448730469, -0.503082275390625, -0.4882698059082031, -0.47345733642578125, -0.4586448669433594, -0.4438323974609375, -0.4290199279785156, -0.41420745849609375, -0.3993949890136719, -0.38458251953125, -0.3697700500488281, -0.35495758056640625, -0.3401451110839844, -0.3253326416015625, -0.3105201721191406, -0.29570770263671875, -0.2808952331542969, -0.266082763671875, -0.2512702941894531, -0.23645782470703125, -0.22164535522460938, -0.2068328857421875, -0.19202041625976562, -0.17720794677734375, -0.16239547729492188, -0.1475830078125, -0.13277053833007812, -0.11795806884765625, -0.10314559936523438, -0.0883331298828125, -0.07352066040039062, -0.05870819091796875, -0.043895721435546875, -0.029083251953125, -0.014270782470703125, 0.00054168701171875, 0.015354156494140625, 0.0301666259765625, 0.044979095458984375, 0.05979156494140625, 0.07460403442382812, 0.08941650390625, 0.10422897338867188, 0.11904144287109375, 0.13385391235351562, 0.1486663818359375, 0.16347885131835938, 0.17829132080078125, 0.19310379028320312, 0.207916259765625, 0.22272872924804688, 0.23754119873046875, 0.2523536682128906, 0.2671661376953125, 0.2819786071777344, 0.29679107666015625, 0.3116035461425781, 0.326416015625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 2.0, 2.0, 11.0, 5.0, 8.0, 15.0, 20.0, 23.0, 20.0, 43.0, 48.0, 43.0, 50.0, 48.0, 37.0, 28.0, 20.0, 12.0, 2.0, 11.0, 4.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5814498662948608, -1.5361655950546265, -1.490881323814392, -1.4455970525741577, -1.4003127813339233, -1.3550283908843994, -1.309744119644165, -1.2644598484039307, -1.2191755771636963, -1.173891305923462, -1.1286070346832275, -1.0833227634429932, -1.0380384922027588, -0.9927541613578796, -0.9474698901176453, -0.9021855592727661, -0.8569013476371765, -0.8116170763969421, -0.7663328051567078, -0.7210484743118286, -0.6757642030715942, -0.6304799318313599, -0.5851956605911255, -0.5399113893508911, -0.49462708830833435, -0.4493428170681, -0.4040585160255432, -0.35877424478530884, -0.31348997354507446, -0.2682056725025177, -0.22292140126228333, -0.17763710021972656, -0.1323528289794922, -0.08706854283809662, -0.04178426414728165, 0.003500014543533325, 0.048784300684928894, 0.09406858682632446, 0.13935285806655884, 0.1846371591091156, 0.22992143034934998, 0.27520570158958435, 0.3204900026321411, 0.3657742738723755, 0.41105854511260986, 0.4563428461551666, 0.5016270875930786, 0.5469114184379578, 0.5921956896781921, 0.6374799609184265, 0.6827642321586609, 0.72804856300354, 0.7733328342437744, 0.8186171054840088, 0.8639013767242432, 0.9091856479644775, 0.9544699192047119, 0.9997541904449463, 1.0450384616851807, 1.090322732925415, 1.1356070041656494, 1.1808912754058838, 1.2261755466461182, 1.271459937095642, 1.3167442083358765]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 4.0, 7.0, 6.0, 3.0, 11.0, 14.0, 24.0, 32.0, 100.0, 128.0, 63.0, 15.0, 17.0, 5.0, 8.0, 7.0, 7.0, 8.0, 4.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9290261268615723, -1.8523635864257812, -1.7757010459899902, -1.6990385055541992, -1.6223760843276978, -1.5457135438919067, -1.4690510034561157, -1.3923885822296143, -1.3157260417938232, -1.2390635013580322, -1.1624009609222412, -1.0857384204864502, -1.0090759992599487, -0.9324134588241577, -0.8557509183883667, -0.7790884375572205, -0.7024258375167847, -0.6257632970809937, -0.5491008162498474, -0.4724382758140564, -0.39577576518058777, -0.31911325454711914, -0.24245071411132812, -0.16578823328018188, -0.08912569284439087, -0.012463174760341644, 0.06419934332370758, 0.1408618688583374, 0.21752437949180603, 0.29418689012527466, 0.3708494305610657, 0.4475119113922119, 0.5241744518280029, 0.600836992263794, 0.6774994730949402, 0.7541620135307312, 0.8308244943618774, 0.9074870347976685, 0.9841495752334595, 1.060811996459961, 1.137474536895752, 1.214137077331543, 1.290799617767334, 1.367462158203125, 1.4441245794296265, 1.5207871198654175, 1.5974496603012085, 1.67411208152771, 1.7507747411727905, 1.8274372816085815, 1.9040998220443726, 1.980762243270874, 2.057424783706665, 2.134087324142456, 2.210749864578247, 2.287412405014038, 2.364074945449829, 2.44073748588562, 2.517400026321411, 2.594062566757202, 2.670725107192993, 2.747387409210205, 2.824049949645996, 2.900712490081787, 2.977375030517578]}, "eval/loss": 1.8705445528030396, "eval/bleu": 4.138692653029469e-15, "eval/runtime": 2629.971, "eval/samples_per_second": 5.612, "eval/steps_per_second": 0.702} \ No newline at end of file